{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:67O7667FZH2TVZLYCNHKARVZ6D","short_pith_number":"pith:67O7667F","canonical_record":{"source":{"id":"1610.02947","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-10-10T15:03:15Z","cross_cats_sorted":[],"title_canon_sha256":"a8339f6f6cc94b9c75c4fd4d2d1f6cf5516cc0a43cfe71fd455e85db7cd690f5","abstract_canon_sha256":"c90de6856ac614a3cae2d517014e71003b9f3b8927dea75aa40f39419519dcd0"},"schema_version":"1.0"},"canonical_sha256":"f7ddff7be5c9f53ae578134ea046b9f0e8e7c72ab844ca87b48900e69afb248f","source":{"kind":"arxiv","id":"1610.02947","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.02947","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"arxiv_version","alias_value":"1610.02947v3","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.02947","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"pith_short_12","alias_value":"67O7667FZH2T","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_16","alias_value":"67O7667FZH2TVZLY","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_8","alias_value":"67O7667F","created_at":"2026-05-18T12:30:01Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:67O7667FZH2TVZLYCNHKARVZ6D","target":"record","payload":{"canonical_record":{"source":{"id":"1610.02947","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-10-10T15:03:15Z","cross_cats_sorted":[],"title_canon_sha256":"a8339f6f6cc94b9c75c4fd4d2d1f6cf5516cc0a43cfe71fd455e85db7cd690f5","abstract_canon_sha256":"c90de6856ac614a3cae2d517014e71003b9f3b8927dea75aa40f39419519dcd0"},"schema_version":"1.0"},"canonical_sha256":"f7ddff7be5c9f53ae578134ea046b9f0e8e7c72ab844ca87b48900e69afb248f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:39:40.034993Z","signature_b64":"1poqLAmf+h+p2a8lUQ0k5bAljlPgsc9/p25vHE8JiP+rIABvwgZzxpaOW2DQ1BnN4DbdjYcu4++sbR8D88UfBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f7ddff7be5c9f53ae578134ea046b9f0e8e7c72ab844ca87b48900e69afb248f","last_reissued_at":"2026-05-18T00:39:40.034468Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:39:40.034468Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1610.02947","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:40Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pjtLOK7XLwC93ZP+VpBHewtzpWZrCUPArlO5iolb0ajCSpt75pHberVZmBYXJpBB0VbtVlfBrTWFRJGuSRNeAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T11:13:43.783932Z"},"content_sha256":"57ec5a871375d93847c441d2c7ec0632f8b7e65fc2574efa7f46723dab9f56de","schema_version":"1.0","event_id":"sha256:57ec5a871375d93847c441d2c7ec0632f8b7e65fc2574efa7f46723dab9f56de"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:67O7667FZH2TVZLYCNHKARVZ6D","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"End-to-end Concept Word Detection for Video Captioning, Retrieval, and Question Answering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Gunhee Kim, Hyungjin Ko, Jongwook Choi, Youngjae Yu","submitted_at":"2016-10-10T15:03:15Z","abstract_excerpt":"We propose a high-level concept word detector that can be integrated with any video-to-language models. It takes a video as input and generates a list of concept words as useful semantic priors for language generation models. The proposed word detector has two important properties. First, it does not require any external knowledge sources for training. Second, the proposed word detector is trainable in an end-to-end manner jointly with any video-to-language models. To maximize the values of detected words, we also develop a semantic attention mechanism that selectively focuses on the detected "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.02947","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:39:40Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YBYRq5Exawc8IWrEsEymKHEtHHj7zzKmfEVbIMPVAiNgdPiS85PSosMaxmsLjKdMLXDXoDx++BGvrXFkgbnRBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T11:13:43.784283Z"},"content_sha256":"ae831ee0ace0241c41d67130f9210629d1d2a259a0febdb7dd5ec6fac769127a","schema_version":"1.0","event_id":"sha256:ae831ee0ace0241c41d67130f9210629d1d2a259a0febdb7dd5ec6fac769127a"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/67O7667FZH2TVZLYCNHKARVZ6D/bundle.json","state_url":"https://pith.science/pith/67O7667FZH2TVZLYCNHKARVZ6D/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/67O7667FZH2TVZLYCNHKARVZ6D/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T11:13:43Z","links":{"resolver":"https://pith.science/pith/67O7667FZH2TVZLYCNHKARVZ6D","bundle":"https://pith.science/pith/67O7667FZH2TVZLYCNHKARVZ6D/bundle.json","state":"https://pith.science/pith/67O7667FZH2TVZLYCNHKARVZ6D/state.json","well_known_bundle":"https://pith.science/.well-known/pith/67O7667FZH2TVZLYCNHKARVZ6D/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:67O7667FZH2TVZLYCNHKARVZ6D","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c90de6856ac614a3cae2d517014e71003b9f3b8927dea75aa40f39419519dcd0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-10-10T15:03:15Z","title_canon_sha256":"a8339f6f6cc94b9c75c4fd4d2d1f6cf5516cc0a43cfe71fd455e85db7cd690f5"},"schema_version":"1.0","source":{"id":"1610.02947","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.02947","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"arxiv_version","alias_value":"1610.02947v3","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.02947","created_at":"2026-05-18T00:39:40Z"},{"alias_kind":"pith_short_12","alias_value":"67O7667FZH2T","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_16","alias_value":"67O7667FZH2TVZLY","created_at":"2026-05-18T12:30:01Z"},{"alias_kind":"pith_short_8","alias_value":"67O7667F","created_at":"2026-05-18T12:30:01Z"}],"graph_snapshots":[{"event_id":"sha256:ae831ee0ace0241c41d67130f9210629d1d2a259a0febdb7dd5ec6fac769127a","target":"graph","created_at":"2026-05-18T00:39:40Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We propose a high-level concept word detector that can be integrated with any video-to-language models. It takes a video as input and generates a list of concept words as useful semantic priors for language generation models. The proposed word detector has two important properties. First, it does not require any external knowledge sources for training. Second, the proposed word detector is trainable in an end-to-end manner jointly with any video-to-language models. To maximize the values of detected words, we also develop a semantic attention mechanism that selectively focuses on the detected ","authors_text":"Gunhee Kim, Hyungjin Ko, Jongwook Choi, Youngjae Yu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-10-10T15:03:15Z","title":"End-to-end Concept Word Detection for Video Captioning, Retrieval, and Question Answering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.02947","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:57ec5a871375d93847c441d2c7ec0632f8b7e65fc2574efa7f46723dab9f56de","target":"record","created_at":"2026-05-18T00:39:40Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c90de6856ac614a3cae2d517014e71003b9f3b8927dea75aa40f39419519dcd0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-10-10T15:03:15Z","title_canon_sha256":"a8339f6f6cc94b9c75c4fd4d2d1f6cf5516cc0a43cfe71fd455e85db7cd690f5"},"schema_version":"1.0","source":{"id":"1610.02947","kind":"arxiv","version":3}},"canonical_sha256":"f7ddff7be5c9f53ae578134ea046b9f0e8e7c72ab844ca87b48900e69afb248f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f7ddff7be5c9f53ae578134ea046b9f0e8e7c72ab844ca87b48900e69afb248f","first_computed_at":"2026-05-18T00:39:40.034468Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:39:40.034468Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1poqLAmf+h+p2a8lUQ0k5bAljlPgsc9/p25vHE8JiP+rIABvwgZzxpaOW2DQ1BnN4DbdjYcu4++sbR8D88UfBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:39:40.034993Z","signed_message":"canonical_sha256_bytes"},"source_id":"1610.02947","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:57ec5a871375d93847c441d2c7ec0632f8b7e65fc2574efa7f46723dab9f56de","sha256:ae831ee0ace0241c41d67130f9210629d1d2a259a0febdb7dd5ec6fac769127a"],"state_sha256":"8b39a1be494173f32bcef22223d001fffa4f8e2c694d89c7c9c95a2d781102be"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"O8U8H0sgpnjCi6LXAyxo5jgVKzOLepsY5gc7fVIphS7WnI9qmNr7616R6lSHd/p0aQylmC5V9N3Yp/NgjznWBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T11:13:43.786381Z","bundle_sha256":"dbd2bdc1dce76fbeb7f1748be91787db5bcfdbaf3369a6276cf403737aed3de6"}}