{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:GVFY2EOUK2EJMSWLD3JDOCT2PE","short_pith_number":"pith:GVFY2EOU","canonical_record":{"source":{"id":"1703.09788","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-03-28T20:28:52Z","cross_cats_sorted":[],"title_canon_sha256":"78009b9adbb78ee93f1b1213775f825017b684142aba678bede006743c4fd751","abstract_canon_sha256":"6717943aec0f4ad55172171f98bcc3fd932c402f6f5b96a06ada0fcdff1c69c0"},"schema_version":"1.0"},"canonical_sha256":"354b8d11d45688964acb1ed2370a7a790fdb3853875d14663c3ad60186a0b20b","source":{"kind":"arxiv","id":"1703.09788","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.09788","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"arxiv_version","alias_value":"1703.09788v3","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.09788","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"pith_short_12","alias_value":"GVFY2EOUK2EJ","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_16","alias_value":"GVFY2EOUK2EJMSWL","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_8","alias_value":"GVFY2EOU","created_at":"2026-05-18T12:31:18Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:GVFY2EOUK2EJMSWLD3JDOCT2PE","target":"record","payload":{"canonical_record":{"source":{"id":"1703.09788","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-03-28T20:28:52Z","cross_cats_sorted":[],"title_canon_sha256":"78009b9adbb78ee93f1b1213775f825017b684142aba678bede006743c4fd751","abstract_canon_sha256":"6717943aec0f4ad55172171f98bcc3fd932c402f6f5b96a06ada0fcdff1c69c0"},"schema_version":"1.0"},"canonical_sha256":"354b8d11d45688964acb1ed2370a7a790fdb3853875d14663c3ad60186a0b20b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:29:51.778825Z","signature_b64":"fje4qA4VZ4rwbITq9Ggi1hbnwYLTWzFcU1c90kHHR5SJEikwR0oIAInuehXO2YgbB0YoGdJM4qPleTE0lCkoCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"354b8d11d45688964acb1ed2370a7a790fdb3853875d14663c3ad60186a0b20b","last_reissued_at":"2026-05-18T00:29:51.778282Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:29:51.778282Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1703.09788","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1J3aRrrrRWyKyDQpJ4BuzjWciVwovaFtixC3XR6/3VBdH1eHFcXWwVFWacHtcgwzKjfdwZ76t7bFER2OSEABCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T08:15:04.751394Z"},"content_sha256":"9775d3ba4b3b9e5ae07960772ae2bc891ddec8cf1fe9f82072ee0bbdaf07ada5","schema_version":"1.0","event_id":"sha256:9775d3ba4b3b9e5ae07960772ae2bc891ddec8cf1fe9f82072ee0bbdaf07ada5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:GVFY2EOUK2EJMSWLD3JDOCT2PE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Towards Automatic Learning of Procedures from Web Instructional Videos","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Chenliang Xu, Jason J. Corso, Luowei Zhou","submitted_at":"2017-03-28T20:28:52Z","abstract_excerpt":"The potential for agents, whether embodied or software, to learn by observing other agents performing procedures involving objects and actions is rich. Current research on automatic procedure learning heavily relies on action labels or video subtitles, even during the evaluation phase, which makes them infeasible in real-world scenarios. This leads to our question: can the human-consensus structure of a procedure be learned from a large set of long, unconstrained videos (e.g., instructional videos from YouTube) with only visual evidence? To answer this question, we introduce the problem of pro"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.09788","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:51Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"IN6M7tzUXtW8C4H4Sah+xFu2yQG0Xy9glXeOtOKMIlY+7hxUvlINyZXVXB4Gp6hssXNztjCUvY6lsK+QITD5BA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-24T08:15:04.752060Z"},"content_sha256":"6e1f2eca03f1e8ca0a6e9ab04ce2914a3fe0135b95727e7f8d162156d1bd0835","schema_version":"1.0","event_id":"sha256:6e1f2eca03f1e8ca0a6e9ab04ce2914a3fe0135b95727e7f8d162156d1bd0835"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/bundle.json","state_url":"https://pith.science/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-24T08:15:04Z","links":{"resolver":"https://pith.science/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE","bundle":"https://pith.science/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/bundle.json","state":"https://pith.science/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GVFY2EOUK2EJMSWLD3JDOCT2PE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:GVFY2EOUK2EJMSWLD3JDOCT2PE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"6717943aec0f4ad55172171f98bcc3fd932c402f6f5b96a06ada0fcdff1c69c0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-03-28T20:28:52Z","title_canon_sha256":"78009b9adbb78ee93f1b1213775f825017b684142aba678bede006743c4fd751"},"schema_version":"1.0","source":{"id":"1703.09788","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1703.09788","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"arxiv_version","alias_value":"1703.09788v3","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1703.09788","created_at":"2026-05-18T00:29:51Z"},{"alias_kind":"pith_short_12","alias_value":"GVFY2EOUK2EJ","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_16","alias_value":"GVFY2EOUK2EJMSWL","created_at":"2026-05-18T12:31:18Z"},{"alias_kind":"pith_short_8","alias_value":"GVFY2EOU","created_at":"2026-05-18T12:31:18Z"}],"graph_snapshots":[{"event_id":"sha256:6e1f2eca03f1e8ca0a6e9ab04ce2914a3fe0135b95727e7f8d162156d1bd0835","target":"graph","created_at":"2026-05-18T00:29:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The potential for agents, whether embodied or software, to learn by observing other agents performing procedures involving objects and actions is rich. Current research on automatic procedure learning heavily relies on action labels or video subtitles, even during the evaluation phase, which makes them infeasible in real-world scenarios. This leads to our question: can the human-consensus structure of a procedure be learned from a large set of long, unconstrained videos (e.g., instructional videos from YouTube) with only visual evidence? To answer this question, we introduce the problem of pro","authors_text":"Chenliang Xu, Jason J. Corso, Luowei Zhou","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-03-28T20:28:52Z","title":"Towards Automatic Learning of Procedures from Web Instructional Videos"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1703.09788","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9775d3ba4b3b9e5ae07960772ae2bc891ddec8cf1fe9f82072ee0bbdaf07ada5","target":"record","created_at":"2026-05-18T00:29:51Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"6717943aec0f4ad55172171f98bcc3fd932c402f6f5b96a06ada0fcdff1c69c0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-03-28T20:28:52Z","title_canon_sha256":"78009b9adbb78ee93f1b1213775f825017b684142aba678bede006743c4fd751"},"schema_version":"1.0","source":{"id":"1703.09788","kind":"arxiv","version":3}},"canonical_sha256":"354b8d11d45688964acb1ed2370a7a790fdb3853875d14663c3ad60186a0b20b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"354b8d11d45688964acb1ed2370a7a790fdb3853875d14663c3ad60186a0b20b","first_computed_at":"2026-05-18T00:29:51.778282Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:29:51.778282Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"fje4qA4VZ4rwbITq9Ggi1hbnwYLTWzFcU1c90kHHR5SJEikwR0oIAInuehXO2YgbB0YoGdJM4qPleTE0lCkoCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:29:51.778825Z","signed_message":"canonical_sha256_bytes"},"source_id":"1703.09788","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9775d3ba4b3b9e5ae07960772ae2bc891ddec8cf1fe9f82072ee0bbdaf07ada5","sha256:6e1f2eca03f1e8ca0a6e9ab04ce2914a3fe0135b95727e7f8d162156d1bd0835"],"state_sha256":"119ed1f026127982cbe3d038df65faeaf6be7568a1082730fa63c926818cd646"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JIZnKSimWgDHLCgC/M3TZrxiJc13oGCqfP97S7xDK5e4V3tLzrdXwat5a30QzqXEum6ouTaCUyediDt5NoXoDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-24T08:15:04.756201Z","bundle_sha256":"7bb43053faf64ecdaa61eb9ae884fd84d914eca0e22d789d783ca5756b4e4667"}}