{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:B5ISACWY42VG7WEWE5VDQ7WC2W","short_pith_number":"pith:B5ISACWY","canonical_record":{"source":{"id":"2606.31958","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-30T17:00:33Z","cross_cats_sorted":[],"title_canon_sha256":"adbd714556209b3400824463c944272ff5e9855f7cb9967b0f7ad29a9a5cd66c","abstract_canon_sha256":"68c8f04f25bf31ee4eb860e0b0d4201639a9134ffae3f708f3660fa11d3a1eb4"},"schema_version":"1.0"},"canonical_sha256":"0f51200ad8e6aa6fd896276a387ec2d5aa90d773642d679bcdfd2665131da133","source":{"kind":"arxiv","id":"2606.31958","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.31958","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"arxiv_version","alias_value":"2606.31958v1","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.31958","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_12","alias_value":"B5ISACWY42VG","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_16","alias_value":"B5ISACWY42VG7WEW","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_8","alias_value":"B5ISACWY","created_at":"2026-07-01T01:18:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:B5ISACWY42VG7WEWE5VDQ7WC2W","target":"record","payload":{"canonical_record":{"source":{"id":"2606.31958","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-30T17:00:33Z","cross_cats_sorted":[],"title_canon_sha256":"adbd714556209b3400824463c944272ff5e9855f7cb9967b0f7ad29a9a5cd66c","abstract_canon_sha256":"68c8f04f25bf31ee4eb860e0b0d4201639a9134ffae3f708f3660fa11d3a1eb4"},"schema_version":"1.0"},"canonical_sha256":"0f51200ad8e6aa6fd896276a387ec2d5aa90d773642d679bcdfd2665131da133","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-01T01:18:27.005810Z","signature_b64":"5bdPAXynYOnH/qSvZkkgaE4h/hLVtAPPh/4kclCqBssbvoORyjDj1iOqPhh7cIfOvUOfn6ZPr2OXMY6pAfzYDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0f51200ad8e6aa6fd896276a387ec2d5aa90d773642d679bcdfd2665131da133","last_reissued_at":"2026-07-01T01:18:27.005357Z","signature_status":"signed_v1","first_computed_at":"2026-07-01T01:18:27.005357Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.31958","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T01:18:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jwvpITFIduv7BReuWa+PMFS8axgKURwnnVmnRWB2N6eB8P6FyFfv5YTH3cU3iBr/ZmA+W8P74j7Cjnu/ZuHwDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T03:19:08.702268Z"},"content_sha256":"bf4bf130f723e00b3feb2871251c0be85c432c02256ded1002a30930a7b79eb1","schema_version":"1.0","event_id":"sha256:bf4bf130f723e00b3feb2871251c0be85c432c02256ded1002a30930a7b79eb1"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:B5ISACWY42VG7WEWE5VDQ7WC2W","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Adapting Generalist Robot Policies with Semantic Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.RO","authors_text":"Andrew Wagenmaker, Jagdeep Singh Bhatia, Sergey Levine, William Chen","submitted_at":"2026-06-30T17:00:33Z","abstract_excerpt":"Generalist robot policies learn a diverse repertoire of behaviors from large-scale pretraining. In principle, this makes them excellent priors for downstream adaptation via reinforcement learning (RL). In practice, however, standard RL methods leveraging this prior optimize directly over robot actions, requiring the base policy's action distribution to be close to that of a performant policy from the start. This assumption breaks down for complex or long-horizon tasks that fall outside the pretraining distribution. Our key insight is that, for sufficiently expressive generalist policies, langu"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.31958","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.31958/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-01T01:18:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0nsy/Oze2IRdxNKTzgIRpgARdXRvnQJJtUOcytbT8DcbwfwtfJNnK5DZac/DHDGxSJqS4BJUjWLKBZ8EY/qIAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T03:19:08.702697Z"},"content_sha256":"7fb51f3763bc6a9c5a7aa39788cb2327e0dc7ba197f3bf41733f89221428234f","schema_version":"1.0","event_id":"sha256:7fb51f3763bc6a9c5a7aa39788cb2327e0dc7ba197f3bf41733f89221428234f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/bundle.json","state_url":"https://pith.science/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T03:19:08Z","links":{"resolver":"https://pith.science/pith/B5ISACWY42VG7WEWE5VDQ7WC2W","bundle":"https://pith.science/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/bundle.json","state":"https://pith.science/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/state.json","well_known_bundle":"https://pith.science/.well-known/pith/B5ISACWY42VG7WEWE5VDQ7WC2W/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:B5ISACWY42VG7WEWE5VDQ7WC2W","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"68c8f04f25bf31ee4eb860e0b0d4201639a9134ffae3f708f3660fa11d3a1eb4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-30T17:00:33Z","title_canon_sha256":"adbd714556209b3400824463c944272ff5e9855f7cb9967b0f7ad29a9a5cd66c"},"schema_version":"1.0","source":{"id":"2606.31958","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.31958","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"arxiv_version","alias_value":"2606.31958v1","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.31958","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_12","alias_value":"B5ISACWY42VG","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_16","alias_value":"B5ISACWY42VG7WEW","created_at":"2026-07-01T01:18:27Z"},{"alias_kind":"pith_short_8","alias_value":"B5ISACWY","created_at":"2026-07-01T01:18:27Z"}],"graph_snapshots":[{"event_id":"sha256:7fb51f3763bc6a9c5a7aa39788cb2327e0dc7ba197f3bf41733f89221428234f","target":"graph","created_at":"2026-07-01T01:18:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.31958/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Generalist robot policies learn a diverse repertoire of behaviors from large-scale pretraining. In principle, this makes them excellent priors for downstream adaptation via reinforcement learning (RL). In practice, however, standard RL methods leveraging this prior optimize directly over robot actions, requiring the base policy's action distribution to be close to that of a performant policy from the start. This assumption breaks down for complex or long-horizon tasks that fall outside the pretraining distribution. Our key insight is that, for sufficiently expressive generalist policies, langu","authors_text":"Andrew Wagenmaker, Jagdeep Singh Bhatia, Sergey Levine, William Chen","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-30T17:00:33Z","title":"Adapting Generalist Robot Policies with Semantic Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.31958","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:bf4bf130f723e00b3feb2871251c0be85c432c02256ded1002a30930a7b79eb1","target":"record","created_at":"2026-07-01T01:18:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"68c8f04f25bf31ee4eb860e0b0d4201639a9134ffae3f708f3660fa11d3a1eb4","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.RO","submitted_at":"2026-06-30T17:00:33Z","title_canon_sha256":"adbd714556209b3400824463c944272ff5e9855f7cb9967b0f7ad29a9a5cd66c"},"schema_version":"1.0","source":{"id":"2606.31958","kind":"arxiv","version":1}},"canonical_sha256":"0f51200ad8e6aa6fd896276a387ec2d5aa90d773642d679bcdfd2665131da133","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0f51200ad8e6aa6fd896276a387ec2d5aa90d773642d679bcdfd2665131da133","first_computed_at":"2026-07-01T01:18:27.005357Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-01T01:18:27.005357Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5bdPAXynYOnH/qSvZkkgaE4h/hLVtAPPh/4kclCqBssbvoORyjDj1iOqPhh7cIfOvUOfn6ZPr2OXMY6pAfzYDg==","signature_status":"signed_v1","signed_at":"2026-07-01T01:18:27.005810Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.31958","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:bf4bf130f723e00b3feb2871251c0be85c432c02256ded1002a30930a7b79eb1","sha256:7fb51f3763bc6a9c5a7aa39788cb2327e0dc7ba197f3bf41733f89221428234f"],"state_sha256":"d9685a14c74cd9937c5a29b02c7e7bd820f403a1d9656d4f9748351fc75a4cb7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SQyX4vO1RxNnlAn9Vxk2HT91FOdNmVci0D7zGREjLPaSkq41tp/6iqJPNxFaXVpmTZm++0q9aPH5Ix/Gn/9UAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T03:19:08.705468Z","bundle_sha256":"c18bc651fb2ce1586e5933f46fb7ed9e6e80e7095119d2af27e74bfda49a1250"}}