{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:NE24O737TWEUMURUWJ5MPNK3JT","short_pith_number":"pith:NE24O737","canonical_record":{"source":{"id":"2606.00054","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-05-18T06:19:16Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"68e33b8834a3882a945234120357e58a6b97447377823b6e2893b2057e709124","abstract_canon_sha256":"0c07f6f00c4a7ffbab3798ecaa25b4348ff3d5c678ab2668f74a7b5772e9680f"},"schema_version":"1.0"},"canonical_sha256":"6935c77f7f9d89465234b27ac7b55b4cfdf0759948c8fa68b2a193c754105dc9","source":{"kind":"arxiv","id":"2606.00054","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00054","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00054v1","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00054","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_12","alias_value":"NE24O737TWEU","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_16","alias_value":"NE24O737TWEUMURU","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_8","alias_value":"NE24O737","created_at":"2026-06-02T00:03:13Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:NE24O737TWEUMURUWJ5MPNK3JT","target":"record","payload":{"canonical_record":{"source":{"id":"2606.00054","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-05-18T06:19:16Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"68e33b8834a3882a945234120357e58a6b97447377823b6e2893b2057e709124","abstract_canon_sha256":"0c07f6f00c4a7ffbab3798ecaa25b4348ff3d5c678ab2668f74a7b5772e9680f"},"schema_version":"1.0"},"canonical_sha256":"6935c77f7f9d89465234b27ac7b55b4cfdf0759948c8fa68b2a193c754105dc9","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T00:03:13.562756Z","signature_b64":"ISJc1zmlaFwLsSEQymfiA8lbQraX6+Zv4OrfLiqGl3cFcEFs6jxfVjI0q7maqrmFfhFQxDz5qVwUUM6KtxYODw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6935c77f7f9d89465234b27ac7b55b4cfdf0759948c8fa68b2a193c754105dc9","last_reissued_at":"2026-06-02T00:03:13.562162Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T00:03:13.562162Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.00054","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Dz2AtpSzPMuV30rG8T2Clp2iI9EukFZf+Km6YJkyAXv13dwgq9zqGRuvLKHwATZaCMFAuyDVO3ER0/+KASk4DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T18:41:56.206276Z"},"content_sha256":"baa72530d25487038b208f68704bfaeacfba8a91f8cc5b4a7b57b75ddc19847e","schema_version":"1.0","event_id":"sha256:baa72530d25487038b208f68704bfaeacfba8a91f8cc5b4a7b57b75ddc19847e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:NE24O737TWEUMURUWJ5MPNK3JT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From Human Videos to Robot Manipulation: A Survey on Scalable Vision-Language-Action Learning with Human-Centric Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CV"],"primary_cat":"cs.RO","authors_text":"Baining Guo, Hao Zhao, Huizhi Liang, Jiaolong Yang, Li Zhao, Marc Pollefeys, Oier Mees, Qixiu Li, Rushuai Yang, Yichao Shen, Yu Deng, Zhaowei Zhang, Zhiying Du, Zhiyuan Feng, Zongqing Lu","submitted_at":"2026-05-18T06:19:16Z","abstract_excerpt":"Recent progress in generalizable embodied control has been driven by large-scale pretraining of Vision-Language-Action (VLA) models. However, most existing approaches rely on large collections of robot demonstrations, which are costly to obtain and tightly coupled to specific embodiments. Human videos, by contrast, are abundant and capture rich interactions, providing diverse semantic and physical cues for real-world manipulation. Yet, embodiment differences and the frequent absence of task-aligned annotations make their direct use in VLA models challenging. This survey provides a unified view"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00054","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.00054/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T00:03:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9vZspYcx3EqXMqpkBpvbNR+SZsUjNSQvT4Bn+umaye/9aMG39j99QhfWjNZC8ZLUFwXJY6tTSbrm9+E0CPxbAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T18:41:56.206990Z"},"content_sha256":"a52ea7ce691db49be0c80a70e8940b6485138121a1201ffc82da9a8c2cdafb07","schema_version":"1.0","event_id":"sha256:a52ea7ce691db49be0c80a70e8940b6485138121a1201ffc82da9a8c2cdafb07"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NE24O737TWEUMURUWJ5MPNK3JT/bundle.json","state_url":"https://pith.science/pith/NE24O737TWEUMURUWJ5MPNK3JT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NE24O737TWEUMURUWJ5MPNK3JT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T18:41:56Z","links":{"resolver":"https://pith.science/pith/NE24O737TWEUMURUWJ5MPNK3JT","bundle":"https://pith.science/pith/NE24O737TWEUMURUWJ5MPNK3JT/bundle.json","state":"https://pith.science/pith/NE24O737TWEUMURUWJ5MPNK3JT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NE24O737TWEUMURUWJ5MPNK3JT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:NE24O737TWEUMURUWJ5MPNK3JT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0c07f6f00c4a7ffbab3798ecaa25b4348ff3d5c678ab2668f74a7b5772e9680f","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-05-18T06:19:16Z","title_canon_sha256":"68e33b8834a3882a945234120357e58a6b97447377823b6e2893b2057e709124"},"schema_version":"1.0","source":{"id":"2606.00054","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00054","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00054v1","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00054","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_12","alias_value":"NE24O737TWEU","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_16","alias_value":"NE24O737TWEUMURU","created_at":"2026-06-02T00:03:13Z"},{"alias_kind":"pith_short_8","alias_value":"NE24O737","created_at":"2026-06-02T00:03:13Z"}],"graph_snapshots":[{"event_id":"sha256:a52ea7ce691db49be0c80a70e8940b6485138121a1201ffc82da9a8c2cdafb07","target":"graph","created_at":"2026-06-02T00:03:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.00054/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Recent progress in generalizable embodied control has been driven by large-scale pretraining of Vision-Language-Action (VLA) models. However, most existing approaches rely on large collections of robot demonstrations, which are costly to obtain and tightly coupled to specific embodiments. Human videos, by contrast, are abundant and capture rich interactions, providing diverse semantic and physical cues for real-world manipulation. Yet, embodiment differences and the frequent absence of task-aligned annotations make their direct use in VLA models challenging. This survey provides a unified view","authors_text":"Baining Guo, Hao Zhao, Huizhi Liang, Jiaolong Yang, Li Zhao, Marc Pollefeys, Oier Mees, Qixiu Li, Rushuai Yang, Yichao Shen, Yu Deng, Zhaowei Zhang, Zhiying Du, Zhiyuan Feng, Zongqing Lu","cross_cats":["cs.AI","cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-05-18T06:19:16Z","title":"From Human Videos to Robot Manipulation: A Survey on Scalable Vision-Language-Action Learning with Human-Centric Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00054","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:baa72530d25487038b208f68704bfaeacfba8a91f8cc5b4a7b57b75ddc19847e","target":"record","created_at":"2026-06-02T00:03:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0c07f6f00c4a7ffbab3798ecaa25b4348ff3d5c678ab2668f74a7b5772e9680f","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2026-05-18T06:19:16Z","title_canon_sha256":"68e33b8834a3882a945234120357e58a6b97447377823b6e2893b2057e709124"},"schema_version":"1.0","source":{"id":"2606.00054","kind":"arxiv","version":1}},"canonical_sha256":"6935c77f7f9d89465234b27ac7b55b4cfdf0759948c8fa68b2a193c754105dc9","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6935c77f7f9d89465234b27ac7b55b4cfdf0759948c8fa68b2a193c754105dc9","first_computed_at":"2026-06-02T00:03:13.562162Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T00:03:13.562162Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ISJc1zmlaFwLsSEQymfiA8lbQraX6+Zv4OrfLiqGl3cFcEFs6jxfVjI0q7maqrmFfhFQxDz5qVwUUM6KtxYODw==","signature_status":"signed_v1","signed_at":"2026-06-02T00:03:13.562756Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.00054","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:baa72530d25487038b208f68704bfaeacfba8a91f8cc5b4a7b57b75ddc19847e","sha256:a52ea7ce691db49be0c80a70e8940b6485138121a1201ffc82da9a8c2cdafb07"],"state_sha256":"d2401ee39bf9ad64d2d57e4b05f739239c7e5bf1371ae69950666c0d408a83f8"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RyL3oYPBKed68WDMlXgAj/sttJZ3IGJJ220dBEUy+pdwZtrM7AtSaaPMONRzL/CfYu3gtXfqjpRYLdPtdg/SBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T18:41:56.210197Z","bundle_sha256":"ed163cf98dd18e1482ea5a184295465a3cf945520fe34db9955a19e06830320a"}}