{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:ERWOZK2E5NN3Q3TMQROZQ73V75","short_pith_number":"pith:ERWOZK2E","canonical_record":{"source":{"id":"2606.32034","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-30T17:58:23Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"60558250c3730d18a38e7a462a2a379ab8fd23f40cfb0bcd933b8c0fd2c7df38","abstract_canon_sha256":"d79517a4c59be96ac4dca3626fed427ecd0d01424c4828aeaf47c006cf25bdaa"},"schema_version":"1.0"},"canonical_sha256":"246cecab44eb5bb86e6c845d987f75ff4cf6ac28a3bfb5598057709e71feee54","source":{"kind":"arxiv","id":"2606.32034","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.32034","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.32034v1","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.32034","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"ERWOZK2E5NN3","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"ERWOZK2E5NN3Q3TM","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"ERWOZK2E","created_at":"2026-07-01T02:17:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:ERWOZK2E5NN3Q3TMQROZQ73V75","target":"record","payload":{"canonical_record":{"source":{"id":"2606.32034","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-30T17:58:23Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"60558250c3730d18a38e7a462a2a379ab8fd23f40cfb0bcd933b8c0fd2c7df38","abstract_canon_sha256":"d79517a4c59be96ac4dca3626fed427ecd0d01424c4828aeaf47c006cf25bdaa"},"schema_version":"1.0"},"canonical_sha256":"246cecab44eb5bb86e6c845d987f75ff4cf6ac28a3bfb5598057709e71feee54","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-01T02:17:47.864380Z","signature_b64":"DM54qMWHjfryuz//YlmEHq6Bud35RQM1E+3G3Gjot4ICvOXtmipf8txtRn+W4qLmKLuUz/9UHQIvMZeVSwa5CA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"246cecab44eb5bb86e6c845d987f75ff4cf6ac28a3bfb5598057709e71feee54","last_reissued_at":"2026-07-01T02:17:47.863976Z","signature_status":"signed_v1","first_computed_at":"2026-07-01T02:17:47.863976Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.32034","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T02:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"H7D1iiqJ6J+0/6WXExbNQNxcKWXZeCVZIWOq1ZxwP6eeo4mnPUvO6UoOlFZjhYfB/gVU+yM8x4k6WtR5lapUDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T21:06:02.212679Z"},"content_sha256":"a1fdf3b5df8d6ee0d347c5c8356c79f270ea6d257aa6aae78a42efc2d843d91a","schema_version":"1.0","event_id":"sha256:a1fdf3b5df8d6ee0d347c5c8356c79f270ea6d257aa6aae78a42efc2d843d91a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:ERWOZK2E5NN3Q3TMQROZQ73V75","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"QVal: Cheaply Evaluating Dense Supervision Signals for Long-Horizon LLM Agents","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Ameya Prabhu, Ilze Amanda Auzina, Joschka Str\\\"uber, Matteo Merler, Matthias Bethge, Sergio Hern\\'andez-Guti\\'errez","submitted_at":"2026-06-30T17:58:23Z","abstract_excerpt":"LLM agents increasingly act over long horizons, where a single trajectory can contain hundreds or thousands of actions. In these settings, outcome-only rewards provide too sparse guidance, failing to inform the model about the goodness of intermediate actions. Dense supervision methods aim to solve this problem by scoring intermediate steps, from intrinsic confidence to self-distillation and embedding similarities. However, it is common practice to evaluate them by measuring the downstream performance of a training pipeline that integrates them. This is expensive, conflates supervision quality"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.32034","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.32034/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T02:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Bb+1UdRYzD3RjiKjLmmTx0peljPiPuIs2+If9c2ugrP5jpX98jMNUINFB3mak3A+3CV9Z7f4fppUep5KE+zCBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-01T21:06:02.213074Z"},"content_sha256":"5f1b236479b8a0fc44a5fe53e47eb4a23bb98916cf29a9a52c264455a72c537d","schema_version":"1.0","event_id":"sha256:5f1b236479b8a0fc44a5fe53e47eb4a23bb98916cf29a9a52c264455a72c537d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/bundle.json","state_url":"https://pith.science/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-01T21:06:02Z","links":{"resolver":"https://pith.science/pith/ERWOZK2E5NN3Q3TMQROZQ73V75","bundle":"https://pith.science/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/bundle.json","state":"https://pith.science/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ERWOZK2E5NN3Q3TMQROZQ73V75/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:ERWOZK2E5NN3Q3TMQROZQ73V75","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d79517a4c59be96ac4dca3626fed427ecd0d01424c4828aeaf47c006cf25bdaa","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-30T17:58:23Z","title_canon_sha256":"60558250c3730d18a38e7a462a2a379ab8fd23f40cfb0bcd933b8c0fd2c7df38"},"schema_version":"1.0","source":{"id":"2606.32034","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.32034","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.32034v1","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.32034","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"ERWOZK2E5NN3","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"ERWOZK2E5NN3Q3TM","created_at":"2026-07-01T02:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"ERWOZK2E","created_at":"2026-07-01T02:17:47Z"}],"graph_snapshots":[{"event_id":"sha256:5f1b236479b8a0fc44a5fe53e47eb4a23bb98916cf29a9a52c264455a72c537d","target":"graph","created_at":"2026-07-01T02:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.32034/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM agents increasingly act over long horizons, where a single trajectory can contain hundreds or thousands of actions. In these settings, outcome-only rewards provide too sparse guidance, failing to inform the model about the goodness of intermediate actions. Dense supervision methods aim to solve this problem by scoring intermediate steps, from intrinsic confidence to self-distillation and embedding similarities. However, it is common practice to evaluate them by measuring the downstream performance of a training pipeline that integrates them. This is expensive, conflates supervision quality","authors_text":"Ameya Prabhu, Ilze Amanda Auzina, Joschka Str\\\"uber, Matteo Merler, Matthias Bethge, Sergio Hern\\'andez-Guti\\'errez","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-30T17:58:23Z","title":"QVal: Cheaply Evaluating Dense Supervision Signals for Long-Horizon LLM Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.32034","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a1fdf3b5df8d6ee0d347c5c8356c79f270ea6d257aa6aae78a42efc2d843d91a","target":"record","created_at":"2026-07-01T02:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d79517a4c59be96ac4dca3626fed427ecd0d01424c4828aeaf47c006cf25bdaa","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-30T17:58:23Z","title_canon_sha256":"60558250c3730d18a38e7a462a2a379ab8fd23f40cfb0bcd933b8c0fd2c7df38"},"schema_version":"1.0","source":{"id":"2606.32034","kind":"arxiv","version":1}},"canonical_sha256":"246cecab44eb5bb86e6c845d987f75ff4cf6ac28a3bfb5598057709e71feee54","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"246cecab44eb5bb86e6c845d987f75ff4cf6ac28a3bfb5598057709e71feee54","first_computed_at":"2026-07-01T02:17:47.863976Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-01T02:17:47.863976Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"DM54qMWHjfryuz//YlmEHq6Bud35RQM1E+3G3Gjot4ICvOXtmipf8txtRn+W4qLmKLuUz/9UHQIvMZeVSwa5CA==","signature_status":"signed_v1","signed_at":"2026-07-01T02:17:47.864380Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.32034","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a1fdf3b5df8d6ee0d347c5c8356c79f270ea6d257aa6aae78a42efc2d843d91a","sha256:5f1b236479b8a0fc44a5fe53e47eb4a23bb98916cf29a9a52c264455a72c537d"],"state_sha256":"a6140c99e27869c45bd3893cec27f4c252c1d3f9960cf66843a9b5d17de2258b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Gfv+MIf8TZn6QtPqQFqf7du2m6S+kZupYgNo33thYI1k4AD5l/vJvoqb7nNalbJWWfrArhTq20tImN+cOhw8Aw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-01T21:06:02.215122Z","bundle_sha256":"e2bbc0d8c419212bbf10b583e670ad3de052b92cef19f3ae214346974a0fbef3"}}