{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:JBSARKAELJPA3JU57GWES7S3G6","short_pith_number":"pith:JBSARKAE","canonical_record":{"source":{"id":"1708.01641","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-04T18:57:52Z","cross_cats_sorted":[],"title_canon_sha256":"394c3afbf85e4dae35ab5deea0f86eeb875175f9fed523cc0a4e617c37731c95","abstract_canon_sha256":"b84af76dd4645ff593961e1053be15d924c32dac6cbfa2ac816e856ba536aa27"},"schema_version":"1.0"},"canonical_sha256":"486408a8045a5e0da69df9ac497e5b37ba3f4cc541bef0c95c2b30717a037dca","source":{"kind":"arxiv","id":"1708.01641","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.01641","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"arxiv_version","alias_value":"1708.01641v1","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.01641","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"pith_short_12","alias_value":"JBSARKAELJPA","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"JBSARKAELJPA3JU5","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"JBSARKAE","created_at":"2026-05-18T12:31:21Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:JBSARKAELJPA3JU57GWES7S3G6","target":"record","payload":{"canonical_record":{"source":{"id":"1708.01641","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-04T18:57:52Z","cross_cats_sorted":[],"title_canon_sha256":"394c3afbf85e4dae35ab5deea0f86eeb875175f9fed523cc0a4e617c37731c95","abstract_canon_sha256":"b84af76dd4645ff593961e1053be15d924c32dac6cbfa2ac816e856ba536aa27"},"schema_version":"1.0"},"canonical_sha256":"486408a8045a5e0da69df9ac497e5b37ba3f4cc541bef0c95c2b30717a037dca","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:38:31.973622Z","signature_b64":"op1hf0zi79iiBXrh5mAK5PLZtCWS7t3EejlyRyKe4mjQWRbBUstn+IxpV2CQzf37tk9LTr8Fdwizk9a7y6mgBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"486408a8045a5e0da69df9ac497e5b37ba3f4cc541bef0c95c2b30717a037dca","last_reissued_at":"2026-05-18T00:38:31.973141Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:38:31.973141Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1708.01641","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:38:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YZqFFQJOFSk2lWw47/68AGTgZ52a6GGnMQ6JCvcqzArTsUTNE9g3aA21gGh69v8C4aMkrhAEhGtIQVzvBgwICw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T10:40:21.109255Z"},"content_sha256":"5194b4be68ab807be18291da4db6876ea4d47e4c3caabe18d900e727ff51f258","schema_version":"1.0","event_id":"sha256:5194b4be68ab807be18291da4db6876ea4d47e4c3caabe18d900e727ff51f258"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:JBSARKAELJPA3JU57GWES7S3G6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Localizing Moments in Video with Natural Language","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bryan Russell, Eli Shechtman, Josef Sivic, Lisa Anne Hendricks, Oliver Wang, Trevor Darrell","submitted_at":"2017-08-04T18:57:52Z","abstract_excerpt":"We consider retrieving a specific temporal segment, or moment, from a video given a natural language text description. Methods designed to retrieve whole video clips with natural language determine what occurs in a video but not when. To address this issue, we propose the Moment Context Network (MCN) which effectively localizes natural language queries in videos by integrating local and global video features over time. A key obstacle to training our MCN model is that current video datasets do not include pairs of localized video segments and referring expressions, or text descriptions which un"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.01641","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:38:31Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CePfSJ/gfjrfN9/mK4+Xa8B4xVq/AhGuKUZFffle8T8N0aUSdeFML+ORXBg8vGL2VsUZXNE1ZTdylg/A8pJqBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T10:40:21.109614Z"},"content_sha256":"23df55698401f8cfdc66714dde7a06c7940b6722db4b0e8030f1de94ef8f4be7","schema_version":"1.0","event_id":"sha256:23df55698401f8cfdc66714dde7a06c7940b6722db4b0e8030f1de94ef8f4be7"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JBSARKAELJPA3JU57GWES7S3G6/bundle.json","state_url":"https://pith.science/pith/JBSARKAELJPA3JU57GWES7S3G6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JBSARKAELJPA3JU57GWES7S3G6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T10:40:21Z","links":{"resolver":"https://pith.science/pith/JBSARKAELJPA3JU57GWES7S3G6","bundle":"https://pith.science/pith/JBSARKAELJPA3JU57GWES7S3G6/bundle.json","state":"https://pith.science/pith/JBSARKAELJPA3JU57GWES7S3G6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JBSARKAELJPA3JU57GWES7S3G6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:JBSARKAELJPA3JU57GWES7S3G6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b84af76dd4645ff593961e1053be15d924c32dac6cbfa2ac816e856ba536aa27","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-04T18:57:52Z","title_canon_sha256":"394c3afbf85e4dae35ab5deea0f86eeb875175f9fed523cc0a4e617c37731c95"},"schema_version":"1.0","source":{"id":"1708.01641","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.01641","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"arxiv_version","alias_value":"1708.01641v1","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.01641","created_at":"2026-05-18T00:38:31Z"},{"alias_kind":"pith_short_12","alias_value":"JBSARKAELJPA","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_16","alias_value":"JBSARKAELJPA3JU5","created_at":"2026-05-18T12:31:21Z"},{"alias_kind":"pith_short_8","alias_value":"JBSARKAE","created_at":"2026-05-18T12:31:21Z"}],"graph_snapshots":[{"event_id":"sha256:23df55698401f8cfdc66714dde7a06c7940b6722db4b0e8030f1de94ef8f4be7","target":"graph","created_at":"2026-05-18T00:38:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We consider retrieving a specific temporal segment, or moment, from a video given a natural language text description. Methods designed to retrieve whole video clips with natural language determine what occurs in a video but not when. To address this issue, we propose the Moment Context Network (MCN) which effectively localizes natural language queries in videos by integrating local and global video features over time. A key obstacle to training our MCN model is that current video datasets do not include pairs of localized video segments and referring expressions, or text descriptions which un","authors_text":"Bryan Russell, Eli Shechtman, Josef Sivic, Lisa Anne Hendricks, Oliver Wang, Trevor Darrell","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-04T18:57:52Z","title":"Localizing Moments in Video with Natural Language"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.01641","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5194b4be68ab807be18291da4db6876ea4d47e4c3caabe18d900e727ff51f258","target":"record","created_at":"2026-05-18T00:38:31Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b84af76dd4645ff593961e1053be15d924c32dac6cbfa2ac816e856ba536aa27","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-04T18:57:52Z","title_canon_sha256":"394c3afbf85e4dae35ab5deea0f86eeb875175f9fed523cc0a4e617c37731c95"},"schema_version":"1.0","source":{"id":"1708.01641","kind":"arxiv","version":1}},"canonical_sha256":"486408a8045a5e0da69df9ac497e5b37ba3f4cc541bef0c95c2b30717a037dca","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"486408a8045a5e0da69df9ac497e5b37ba3f4cc541bef0c95c2b30717a037dca","first_computed_at":"2026-05-18T00:38:31.973141Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:38:31.973141Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"op1hf0zi79iiBXrh5mAK5PLZtCWS7t3EejlyRyKe4mjQWRbBUstn+IxpV2CQzf37tk9LTr8Fdwizk9a7y6mgBg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:38:31.973622Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.01641","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5194b4be68ab807be18291da4db6876ea4d47e4c3caabe18d900e727ff51f258","sha256:23df55698401f8cfdc66714dde7a06c7940b6722db4b0e8030f1de94ef8f4be7"],"state_sha256":"fc5c7d85ca9538db6be3fafb0f796ec4c0b1a51e1ffcb2e3fac602b48bd768e9"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FxtFRYbuf+WHFc67UN3DihNgbC9mUlozwzXcyOmi147ZfslNJFGNl8VF604oEGNv9UonQo8t2oB1zBZwphtcCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T10:40:21.111539Z","bundle_sha256":"3bc2d99021e5b9d81b1f4450f6f1ad9baf0ec1b20e61e5f98a411fa81f4fc8ef"}}