{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:3NJA56M2QYR7XXLSG6754XFLDJ","short_pith_number":"pith:3NJA56M2","canonical_record":{"source":{"id":"1807.10018","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-26T08:57:24Z","cross_cats_sorted":[],"title_canon_sha256":"67da4e4d1dd06dbe1d9b708c3a9b8f4ff71472ee09f19f81459e9fc8cbfbb3f0","abstract_canon_sha256":"a26634052c2d857a3f0dd4833d979889117d62bb43284dc026e2384300e29973"},"schema_version":"1.0"},"canonical_sha256":"db520ef99a8623fbdd7237bfde5cab1a4c4c6ffef01f7ecfa2468d1d02292553","source":{"kind":"arxiv","id":"1807.10018","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.10018","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"arxiv_version","alias_value":"1807.10018v1","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.10018","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"pith_short_12","alias_value":"3NJA56M2QYR7","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3NJA56M2QYR7XXLS","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3NJA56M2","created_at":"2026-05-18T12:32:02Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:3NJA56M2QYR7XXLSG6754XFLDJ","target":"record","payload":{"canonical_record":{"source":{"id":"1807.10018","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-26T08:57:24Z","cross_cats_sorted":[],"title_canon_sha256":"67da4e4d1dd06dbe1d9b708c3a9b8f4ff71472ee09f19f81459e9fc8cbfbb3f0","abstract_canon_sha256":"a26634052c2d857a3f0dd4833d979889117d62bb43284dc026e2384300e29973"},"schema_version":"1.0"},"canonical_sha256":"db520ef99a8623fbdd7237bfde5cab1a4c4c6ffef01f7ecfa2468d1d02292553","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:09:45.663288Z","signature_b64":"wDV0+0M4nREMT+I+FB0bCGLsgd/TpCv0xdbJdBPErxU7GT64VvWmkN5hlPWoNsIs41ABNTP2rdERpJqMzbDGCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"db520ef99a8623fbdd7237bfde5cab1a4c4c6ffef01f7ecfa2468d1d02292553","last_reissued_at":"2026-05-18T00:09:45.662649Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:09:45.662649Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1807.10018","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:09:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"P3ockdVDkIQa+WXb4eBIg5qKjH5m1mtpXFKSlYT854yPXcoUjUbl4Q/jUyENUy8Xbi/S8qZUiGTZ2DKICLcxCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T22:15:41.215581Z"},"content_sha256":"3dea7128dcd64774937ea2f87312b3a7198d2da55976509c96ef65e01495b589","schema_version":"1.0","event_id":"sha256:3dea7128dcd64774937ea2f87312b3a7198d2da55976509c96ef65e01495b589"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:3NJA56M2QYR7XXLSG6754XFLDJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Move Forward and Tell: A Progressive Generator of Video Descriptions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bo Dai, Dahua Lin, Yilei Xiong","submitted_at":"2018-07-26T08:57:24Z","abstract_excerpt":"We present an efficient framework that can generate a coherent paragraph to describe a given video. Previous works on video captioning usually focus on video clips. They typically treat an entire video as a whole and generate the caption conditioned on a single embedding. On the contrary, we consider videos with rich temporal structures and aim to generate paragraph descriptions that can preserve the story flow while being coherent and concise. Towards this goal, we propose a new approach, which produces a descriptive paragraph by assembling temporally localized descriptions. Given a video, it"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.10018","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:09:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"q7uJVRFtLDC3gO4Ku+GOrNQC49TV6i3HWh7DON0RChzbS3pZZ/nWMBFxx3iNwD/q3Yhqcg+TQLhU7IOn/qgvCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T22:15:41.216236Z"},"content_sha256":"9599fedcc30edb72d06820f0b8593c985e6823c059edb09d028252ab697563c5","schema_version":"1.0","event_id":"sha256:9599fedcc30edb72d06820f0b8593c985e6823c059edb09d028252ab697563c5"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3NJA56M2QYR7XXLSG6754XFLDJ/bundle.json","state_url":"https://pith.science/pith/3NJA56M2QYR7XXLSG6754XFLDJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3NJA56M2QYR7XXLSG6754XFLDJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T22:15:41Z","links":{"resolver":"https://pith.science/pith/3NJA56M2QYR7XXLSG6754XFLDJ","bundle":"https://pith.science/pith/3NJA56M2QYR7XXLSG6754XFLDJ/bundle.json","state":"https://pith.science/pith/3NJA56M2QYR7XXLSG6754XFLDJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3NJA56M2QYR7XXLSG6754XFLDJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:3NJA56M2QYR7XXLSG6754XFLDJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a26634052c2d857a3f0dd4833d979889117d62bb43284dc026e2384300e29973","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-26T08:57:24Z","title_canon_sha256":"67da4e4d1dd06dbe1d9b708c3a9b8f4ff71472ee09f19f81459e9fc8cbfbb3f0"},"schema_version":"1.0","source":{"id":"1807.10018","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1807.10018","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"arxiv_version","alias_value":"1807.10018v1","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1807.10018","created_at":"2026-05-18T00:09:45Z"},{"alias_kind":"pith_short_12","alias_value":"3NJA56M2QYR7","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3NJA56M2QYR7XXLS","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3NJA56M2","created_at":"2026-05-18T12:32:02Z"}],"graph_snapshots":[{"event_id":"sha256:9599fedcc30edb72d06820f0b8593c985e6823c059edb09d028252ab697563c5","target":"graph","created_at":"2026-05-18T00:09:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We present an efficient framework that can generate a coherent paragraph to describe a given video. Previous works on video captioning usually focus on video clips. They typically treat an entire video as a whole and generate the caption conditioned on a single embedding. On the contrary, we consider videos with rich temporal structures and aim to generate paragraph descriptions that can preserve the story flow while being coherent and concise. Towards this goal, we propose a new approach, which produces a descriptive paragraph by assembling temporally localized descriptions. Given a video, it","authors_text":"Bo Dai, Dahua Lin, Yilei Xiong","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-26T08:57:24Z","title":"Move Forward and Tell: A Progressive Generator of Video Descriptions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1807.10018","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3dea7128dcd64774937ea2f87312b3a7198d2da55976509c96ef65e01495b589","target":"record","created_at":"2026-05-18T00:09:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a26634052c2d857a3f0dd4833d979889117d62bb43284dc026e2384300e29973","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-07-26T08:57:24Z","title_canon_sha256":"67da4e4d1dd06dbe1d9b708c3a9b8f4ff71472ee09f19f81459e9fc8cbfbb3f0"},"schema_version":"1.0","source":{"id":"1807.10018","kind":"arxiv","version":1}},"canonical_sha256":"db520ef99a8623fbdd7237bfde5cab1a4c4c6ffef01f7ecfa2468d1d02292553","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"db520ef99a8623fbdd7237bfde5cab1a4c4c6ffef01f7ecfa2468d1d02292553","first_computed_at":"2026-05-18T00:09:45.662649Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:09:45.662649Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wDV0+0M4nREMT+I+FB0bCGLsgd/TpCv0xdbJdBPErxU7GT64VvWmkN5hlPWoNsIs41ABNTP2rdERpJqMzbDGCA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:09:45.663288Z","signed_message":"canonical_sha256_bytes"},"source_id":"1807.10018","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3dea7128dcd64774937ea2f87312b3a7198d2da55976509c96ef65e01495b589","sha256:9599fedcc30edb72d06820f0b8593c985e6823c059edb09d028252ab697563c5"],"state_sha256":"0799f517477f75e8fe93ed4be0650e1e472b8cba170eddd955b7cf8f78f65593"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Yts/SgyyT/zgb2hZp+z6mTbo0oGTLinn2299tZiwoNKAYLtT+DP7qpX7znTTFuRiNw5qUay2xrIKI33tZQzLCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T22:15:41.219734Z","bundle_sha256":"3718b864f12c2c58b250388170576309596c4c9bc7b0e84c43ee180a78cae41e"}}