{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:XC3NXIOKD25FBXA5GFJSKKWSUA","short_pith_number":"pith:XC3NXIOK","canonical_record":{"source":{"id":"1604.03968","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-04-13T20:27:43Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"e13a62f91d570e36a4a1923ca81a0ed01e24f06c73e487a21e25937f0bf420e8","abstract_canon_sha256":"4f45a3e9cf9aa48c3201f80a57a094fd8e6b9f1f41e4fc3838b1381483227cf3"},"schema_version":"1.0"},"canonical_sha256":"b8b6dba1ca1eba50dc1d3153252ad2a0189d12bb5fa57d33da0964a4e6f43598","source":{"kind":"arxiv","id":"1604.03968","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.03968","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"arxiv_version","alias_value":"1604.03968v1","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.03968","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"pith_short_12","alias_value":"XC3NXIOKD25F","created_at":"2026-05-18T12:30:51Z"},{"alias_kind":"pith_short_16","alias_value":"XC3NXIOKD25FBXA5","created_at":"2026-05-18T12:30:51Z"},{"alias_kind":"pith_short_8","alias_value":"XC3NXIOK","created_at":"2026-05-18T12:30:51Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:XC3NXIOKD25FBXA5GFJSKKWSUA","target":"record","payload":{"canonical_record":{"source":{"id":"1604.03968","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-04-13T20:27:43Z","cross_cats_sorted":["cs.AI","cs.CV"],"title_canon_sha256":"e13a62f91d570e36a4a1923ca81a0ed01e24f06c73e487a21e25937f0bf420e8","abstract_canon_sha256":"4f45a3e9cf9aa48c3201f80a57a094fd8e6b9f1f41e4fc3838b1381483227cf3"},"schema_version":"1.0"},"canonical_sha256":"b8b6dba1ca1eba50dc1d3153252ad2a0189d12bb5fa57d33da0964a4e6f43598","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:17:07.104889Z","signature_b64":"UTVpV+syIiDTBSnSjZjkDZ6ltYw7cuYAW+uw4Zv9nHOu0TC5VdZxjVdvB3c6Jcv8iT6kJ3yDVzfORJU9feIIBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b8b6dba1ca1eba50dc1d3153252ad2a0189d12bb5fa57d33da0964a4e6f43598","last_reissued_at":"2026-05-18T01:17:07.104016Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:17:07.104016Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1604.03968","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:17:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MDpIOnrdaFyxnQ1gqNGjo1odOOkguDMhngAoay/md7MztqJnwyrn4Gr6DCv6p/4vbEWLNPQCLQnRrDLre3WFCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T09:13:35.437427Z"},"content_sha256":"6c0fbc22bf1610344f830c5d534f0562350391858cc92802de066d85b0d1b8f8","schema_version":"1.0","event_id":"sha256:6c0fbc22bf1610344f830c5d534f0562350391858cc92802de066d85b0d1b8f8"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:XC3NXIOKD25FBXA5GFJSKKWSUA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Visual Storytelling","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CV"],"primary_cat":"cs.CL","authors_text":"Aishwarya Agrawal, C. Lawrence Zitnick, Devi Parikh, Dhruv Batra, Francis Ferraro, Ishan Misra, Jacob Devlin, Lucy Vanderwende, Margaret Mitchell, Michel Galley, Nasrin Mostafazadeh, Pushmeet Kohli, Ross Girshick, Ting-Hao (Kenneth) Huang, Xiaodong He","submitted_at":"2016-04-13T20:27:43Z","abstract_excerpt":"We introduce the first dataset for sequential vision-to-language, and explore how this data may be used for the task of visual storytelling. The first release of this dataset, SIND v.1, includes 81,743 unique photos in 20,211 sequences, aligned to both descriptive (caption) and story language. We establish several strong baselines for the storytelling task, and motivate an automatic metric to benchmark progress. Modelling concrete description as well as figurative and social language, as provided in this dataset and the storytelling task, has the potential to move artificial intelligence from "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.03968","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:17:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ylUu8SWDFjTVv4FehEa44rLA265gCYu1JORV+1qepMWXIqle10mWrQDt9wC/w6UgMDuoBehkSsHrrYrSySM3Bw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T09:13:35.437780Z"},"content_sha256":"285c2b15b882dbbc5004bb23d2c9773245719ecba69335f3f11b6d9f02621d27","schema_version":"1.0","event_id":"sha256:285c2b15b882dbbc5004bb23d2c9773245719ecba69335f3f11b6d9f02621d27"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/bundle.json","state_url":"https://pith.science/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T09:13:35Z","links":{"resolver":"https://pith.science/pith/XC3NXIOKD25FBXA5GFJSKKWSUA","bundle":"https://pith.science/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/bundle.json","state":"https://pith.science/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XC3NXIOKD25FBXA5GFJSKKWSUA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:XC3NXIOKD25FBXA5GFJSKKWSUA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4f45a3e9cf9aa48c3201f80a57a094fd8e6b9f1f41e4fc3838b1381483227cf3","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-04-13T20:27:43Z","title_canon_sha256":"e13a62f91d570e36a4a1923ca81a0ed01e24f06c73e487a21e25937f0bf420e8"},"schema_version":"1.0","source":{"id":"1604.03968","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.03968","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"arxiv_version","alias_value":"1604.03968v1","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.03968","created_at":"2026-05-18T01:17:07Z"},{"alias_kind":"pith_short_12","alias_value":"XC3NXIOKD25F","created_at":"2026-05-18T12:30:51Z"},{"alias_kind":"pith_short_16","alias_value":"XC3NXIOKD25FBXA5","created_at":"2026-05-18T12:30:51Z"},{"alias_kind":"pith_short_8","alias_value":"XC3NXIOK","created_at":"2026-05-18T12:30:51Z"}],"graph_snapshots":[{"event_id":"sha256:285c2b15b882dbbc5004bb23d2c9773245719ecba69335f3f11b6d9f02621d27","target":"graph","created_at":"2026-05-18T01:17:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We introduce the first dataset for sequential vision-to-language, and explore how this data may be used for the task of visual storytelling. The first release of this dataset, SIND v.1, includes 81,743 unique photos in 20,211 sequences, aligned to both descriptive (caption) and story language. We establish several strong baselines for the storytelling task, and motivate an automatic metric to benchmark progress. Modelling concrete description as well as figurative and social language, as provided in this dataset and the storytelling task, has the potential to move artificial intelligence from ","authors_text":"Aishwarya Agrawal, C. Lawrence Zitnick, Devi Parikh, Dhruv Batra, Francis Ferraro, Ishan Misra, Jacob Devlin, Lucy Vanderwende, Margaret Mitchell, Michel Galley, Nasrin Mostafazadeh, Pushmeet Kohli, Ross Girshick, Ting-Hao (Kenneth) Huang, Xiaodong He","cross_cats":["cs.AI","cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-04-13T20:27:43Z","title":"Visual Storytelling"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.03968","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:6c0fbc22bf1610344f830c5d534f0562350391858cc92802de066d85b0d1b8f8","target":"record","created_at":"2026-05-18T01:17:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4f45a3e9cf9aa48c3201f80a57a094fd8e6b9f1f41e4fc3838b1381483227cf3","cross_cats_sorted":["cs.AI","cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2016-04-13T20:27:43Z","title_canon_sha256":"e13a62f91d570e36a4a1923ca81a0ed01e24f06c73e487a21e25937f0bf420e8"},"schema_version":"1.0","source":{"id":"1604.03968","kind":"arxiv","version":1}},"canonical_sha256":"b8b6dba1ca1eba50dc1d3153252ad2a0189d12bb5fa57d33da0964a4e6f43598","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b8b6dba1ca1eba50dc1d3153252ad2a0189d12bb5fa57d33da0964a4e6f43598","first_computed_at":"2026-05-18T01:17:07.104016Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:17:07.104016Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UTVpV+syIiDTBSnSjZjkDZ6ltYw7cuYAW+uw4Zv9nHOu0TC5VdZxjVdvB3c6Jcv8iT6kJ3yDVzfORJU9feIIBg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:17:07.104889Z","signed_message":"canonical_sha256_bytes"},"source_id":"1604.03968","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:6c0fbc22bf1610344f830c5d534f0562350391858cc92802de066d85b0d1b8f8","sha256:285c2b15b882dbbc5004bb23d2c9773245719ecba69335f3f11b6d9f02621d27"],"state_sha256":"958e0901b2d39db35eca198845dc1e2d62eac26c75d2f318c39c976a882819df"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vOYIrYVDQSNlyKTWmKAMeZroQg81EjnzIbe4B/jO/BMloaFVGFY4vaVAlnpX+c5Xk+GptTEeYKjQYxwFBjIKDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T09:13:35.439780Z","bundle_sha256":"69a7b3103bc3ded0c3441a8063d867626532f0a8b4927150175e94c4304d28a7"}}