{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:CBKBG2OKGASCMKGZ5X5SYJCUAC","short_pith_number":"pith:CBKBG2OK","canonical_record":{"source":{"id":"1708.02478","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-08T13:27:13Z","cross_cats_sorted":[],"title_canon_sha256":"74ba6f8d5bba7d99a02a7b3321b66441f720c07a261b865e8dce71bb162c6912","abstract_canon_sha256":"5a14ea9932a971ff8be2bfe489191bb11bc3311648487a38bd82d9fb79b38ab0"},"schema_version":"1.0"},"canonical_sha256":"10541369ca30242628d9edfb2c24540086fbde419f92c518822d0e97b6ca5e16","source":{"kind":"arxiv","id":"1708.02478","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.02478","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"arxiv_version","alias_value":"1708.02478v2","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.02478","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"pith_short_12","alias_value":"CBKBG2OKGASC","created_at":"2026-05-18T12:31:10Z"},{"alias_kind":"pith_short_16","alias_value":"CBKBG2OKGASCMKGZ","created_at":"2026-05-18T12:31:10Z"},{"alias_kind":"pith_short_8","alias_value":"CBKBG2OK","created_at":"2026-05-18T12:31:10Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:CBKBG2OKGASCMKGZ5X5SYJCUAC","target":"record","payload":{"canonical_record":{"source":{"id":"1708.02478","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-08T13:27:13Z","cross_cats_sorted":[],"title_canon_sha256":"74ba6f8d5bba7d99a02a7b3321b66441f720c07a261b865e8dce71bb162c6912","abstract_canon_sha256":"5a14ea9932a971ff8be2bfe489191bb11bc3311648487a38bd82d9fb79b38ab0"},"schema_version":"1.0"},"canonical_sha256":"10541369ca30242628d9edfb2c24540086fbde419f92c518822d0e97b6ca5e16","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:32:25.518640Z","signature_b64":"st1pbkObvMF+cSbV80rCybhbtp7HavDIHcWTBOsgyZYE+/XyXrFLhXNgj5+XLY/m8GlQTFO87lpLyeXJ3driBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"10541369ca30242628d9edfb2c24540086fbde419f92c518822d0e97b6ca5e16","last_reissued_at":"2026-05-18T00:32:25.517860Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:32:25.517860Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1708.02478","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:32:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yeRcYy5Do9jcLjaHzJE3jeZr9SVhzspC+M7HbKfzhL3Fgth38KSBJg8e6VQMjMfieuUYC5D+dvDnyqH7fYw3Dg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T05:01:41.004451Z"},"content_sha256":"8fd4da8cb2fdfabb61a86f5c7c12c491d68c586549720f32831e8d664c2b66d5","schema_version":"1.0","event_id":"sha256:8fd4da8cb2fdfabb61a86f5c7c12c491d68c586549720f32831e8d664c2b66d5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:CBKBG2OKGASCMKGZ5X5SYJCUAC","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"From Deterministic to Generative: Multi-Modal Stochastic RNNs for Video Captioning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Alan Hanjalic, Heng Tao Shen, Jingkuan Song, Lianli Gao, Xuelong Li, Yuyu Guo","submitted_at":"2017-08-08T13:27:13Z","abstract_excerpt":"Video captioning in essential is a complex natural process, which is affected by various uncertainties stemming from video content, subjective judgment, etc. In this paper we build on the recent progress in using encoder-decoder framework for video captioning and address what we find to be a critical deficiency of the existing methods, that most of the decoders propagate deterministic hidden states. Such complex uncertainty cannot be modeled efficiently by the deterministic models. In this paper, we propose a generative approach, referred to as multi-modal stochastic RNNs networks (MS-RNN), wh"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.02478","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:32:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/ogn/D2aU8btnSQ8hbz1yCorHdDqTPGfGyPl1vcKi61wDRD0mLSAMfvbWnLRU1O0yASr5pwQGHAOMlp6wbqRAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T05:01:41.004823Z"},"content_sha256":"0757e2f41f733fc4ed43fee031446e29710edb3d65ee62a82a7c2a237a01bea9","schema_version":"1.0","event_id":"sha256:0757e2f41f733fc4ed43fee031446e29710edb3d65ee62a82a7c2a237a01bea9"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/bundle.json","state_url":"https://pith.science/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T05:01:41Z","links":{"resolver":"https://pith.science/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC","bundle":"https://pith.science/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/bundle.json","state":"https://pith.science/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CBKBG2OKGASCMKGZ5X5SYJCUAC/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:CBKBG2OKGASCMKGZ5X5SYJCUAC","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5a14ea9932a971ff8be2bfe489191bb11bc3311648487a38bd82d9fb79b38ab0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-08T13:27:13Z","title_canon_sha256":"74ba6f8d5bba7d99a02a7b3321b66441f720c07a261b865e8dce71bb162c6912"},"schema_version":"1.0","source":{"id":"1708.02478","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.02478","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"arxiv_version","alias_value":"1708.02478v2","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.02478","created_at":"2026-05-18T00:32:25Z"},{"alias_kind":"pith_short_12","alias_value":"CBKBG2OKGASC","created_at":"2026-05-18T12:31:10Z"},{"alias_kind":"pith_short_16","alias_value":"CBKBG2OKGASCMKGZ","created_at":"2026-05-18T12:31:10Z"},{"alias_kind":"pith_short_8","alias_value":"CBKBG2OK","created_at":"2026-05-18T12:31:10Z"}],"graph_snapshots":[{"event_id":"sha256:0757e2f41f733fc4ed43fee031446e29710edb3d65ee62a82a7c2a237a01bea9","target":"graph","created_at":"2026-05-18T00:32:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Video captioning in essential is a complex natural process, which is affected by various uncertainties stemming from video content, subjective judgment, etc. In this paper we build on the recent progress in using encoder-decoder framework for video captioning and address what we find to be a critical deficiency of the existing methods, that most of the decoders propagate deterministic hidden states. Such complex uncertainty cannot be modeled efficiently by the deterministic models. In this paper, we propose a generative approach, referred to as multi-modal stochastic RNNs networks (MS-RNN), wh","authors_text":"Alan Hanjalic, Heng Tao Shen, Jingkuan Song, Lianli Gao, Xuelong Li, Yuyu Guo","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-08T13:27:13Z","title":"From Deterministic to Generative: Multi-Modal Stochastic RNNs for Video Captioning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.02478","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8fd4da8cb2fdfabb61a86f5c7c12c491d68c586549720f32831e8d664c2b66d5","target":"record","created_at":"2026-05-18T00:32:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5a14ea9932a971ff8be2bfe489191bb11bc3311648487a38bd82d9fb79b38ab0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-08T13:27:13Z","title_canon_sha256":"74ba6f8d5bba7d99a02a7b3321b66441f720c07a261b865e8dce71bb162c6912"},"schema_version":"1.0","source":{"id":"1708.02478","kind":"arxiv","version":2}},"canonical_sha256":"10541369ca30242628d9edfb2c24540086fbde419f92c518822d0e97b6ca5e16","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"10541369ca30242628d9edfb2c24540086fbde419f92c518822d0e97b6ca5e16","first_computed_at":"2026-05-18T00:32:25.517860Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:32:25.517860Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"st1pbkObvMF+cSbV80rCybhbtp7HavDIHcWTBOsgyZYE+/XyXrFLhXNgj5+XLY/m8GlQTFO87lpLyeXJ3driBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:32:25.518640Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.02478","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8fd4da8cb2fdfabb61a86f5c7c12c491d68c586549720f32831e8d664c2b66d5","sha256:0757e2f41f733fc4ed43fee031446e29710edb3d65ee62a82a7c2a237a01bea9"],"state_sha256":"d0dc59f50d85c1acfa0866b06a947e07429581ea33fe88154d58c3ed589dd623"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YvSCiXAg+Fagnhv6/EOHhZnSakbN94SjrE5vP/Xspb/A5DpWzK53oGqbg1EKnqdvu5NjGTa0X9UZXz+8XG69Dw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T05:01:41.008077Z","bundle_sha256":"160327e556b5d27cb3a073b3a40bb5f25a0c7eec7de26a5d90b41a4d59aac245"}}