{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:7DL6QNVWR6JABM7T2ZLG4SEFNG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c582fe6c4d2d726ee38ecbee20b7fa73bf28f2a13e43efd12220c20d20546658","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-06-29T06:19:35Z","title_canon_sha256":"3291361582b66cb0520207ce380cffda8807d1ab53d8f191a7866d034f57eb56"},"schema_version":"1.0","source":{"id":"2606.29834","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.29834","created_at":"2026-06-30T02:17:37Z"},{"alias_kind":"arxiv_version","alias_value":"2606.29834v1","created_at":"2026-06-30T02:17:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.29834","created_at":"2026-06-30T02:17:37Z"},{"alias_kind":"pith_short_12","alias_value":"7DL6QNVWR6JA","created_at":"2026-06-30T02:17:37Z"},{"alias_kind":"pith_short_16","alias_value":"7DL6QNVWR6JABM7T","created_at":"2026-06-30T02:17:37Z"},{"alias_kind":"pith_short_8","alias_value":"7DL6QNVW","created_at":"2026-06-30T02:17:37Z"}],"graph_snapshots":[{"event_id":"sha256:85b9e055f72e9a6008bbfd0d751395c54a4a6c7e0db97c2b7b63dd31a1f5fbc3","target":"graph","created_at":"2026-06-30T02:17:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.29834/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Real-world robot learning increasingly relies on heterogeneous data, but demonstrations and rollouts often mix useful progress with stalls, corrections, and suboptimal behavior. Effective policy learning therefore requires frame-level advantages that distinguish reliable local progress from failures and regressions. We propose Self-supervised Temporal Ensemble Advantage Modeling (STEAM), a label-free method that learns such advantages from expert demonstrations. STEAM trains an ensemble of temporal-offset predictors on frame pairs within expert trajectories, using the normalized temporal offse","authors_text":"Chao Yu, Dongming Qiao, Feng Gao, Guoliang Fan, Jincheng Yu, Kang Chen, Liangzhi Shi, Qiuyi Gu, Quanlu Zhang, Shuaihang Chen, Tianxing Zhou, Xiaodan Liang, Xinlei Chen, Yitao Wang, Yixian Zhang, Yu Wang, Zefang Huang, Zhen Guo, Zhihao Liu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-06-29T06:19:35Z","title":"STEAM: Self-Supervised Temporal Ensemble Advantage Modeling for Real-World Robot Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.29834","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:fe06064736828d5eedec817a27885464962b70b4cb233f3d21003f5e8ac31b81","target":"record","created_at":"2026-06-30T02:17:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c582fe6c4d2d726ee38ecbee20b7fa73bf28f2a13e43efd12220c20d20546658","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-06-29T06:19:35Z","title_canon_sha256":"3291361582b66cb0520207ce380cffda8807d1ab53d8f191a7866d034f57eb56"},"schema_version":"1.0","source":{"id":"2606.29834","kind":"arxiv","version":1}},"canonical_sha256":"f8d7e836b68f9200b3f3d6566e48856999bd81d5af416b6d19394958f81221ed","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f8d7e836b68f9200b3f3d6566e48856999bd81d5af416b6d19394958f81221ed","first_computed_at":"2026-06-30T02:17:37.429393Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-30T02:17:37.429393Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"6+7pkRynEqkejYEGTYMAYYv6MONtyTLS8AteRL3Yrf07FBT2yri4lc3P7VdCA0PWJ+1iDGa+f4aefK6kz0huBA==","signature_status":"signed_v1","signed_at":"2026-06-30T02:17:37.429991Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.29834","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:fe06064736828d5eedec817a27885464962b70b4cb233f3d21003f5e8ac31b81","sha256:85b9e055f72e9a6008bbfd0d751395c54a4a6c7e0db97c2b7b63dd31a1f5fbc3"],"state_sha256":"804d30c66e44a0dad7a44bc7e38a09649674b5184ba3640058181639edad4c2a"}