{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:3HVYGLVOR7U7XVZKB5DG5AAVHA","short_pith_number":"pith:3HVYGLVO","canonical_record":{"source":{"id":"1809.08761","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-24T05:00:05Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"99ec91e694d16c8c2993ed680d8ae4d685963cecc8d5e2f6353118a7d53c3375","abstract_canon_sha256":"8a796d474d1e3f3779ce13ec9f75d6eac318df7b5b2a57bb5604eb4cd23994b8"},"schema_version":"1.0"},"canonical_sha256":"d9eb832eae8fe9fbd72a0f466e80153814a96cc206988d3dd2f0b21b68855f54","source":{"kind":"arxiv","id":"1809.08761","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.08761","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"arxiv_version","alias_value":"1809.08761v1","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.08761","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"pith_short_12","alias_value":"3HVYGLVOR7U7","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3HVYGLVOR7U7XVZK","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3HVYGLVO","created_at":"2026-05-18T12:32:02Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:3HVYGLVOR7U7XVZKB5DG5AAVHA","target":"record","payload":{"canonical_record":{"source":{"id":"1809.08761","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-24T05:00:05Z","cross_cats_sorted":["cs.CV"],"title_canon_sha256":"99ec91e694d16c8c2993ed680d8ae4d685963cecc8d5e2f6353118a7d53c3375","abstract_canon_sha256":"8a796d474d1e3f3779ce13ec9f75d6eac318df7b5b2a57bb5604eb4cd23994b8"},"schema_version":"1.0"},"canonical_sha256":"d9eb832eae8fe9fbd72a0f466e80153814a96cc206988d3dd2f0b21b68855f54","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:05:03.642686Z","signature_b64":"wBIcdH+xDX37yplq+odhIthlf7N5q4UTAk885B7gqthcgrSh//VmwixroUaKmFckZY0PRYfqB7Pa3SmC50fTCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d9eb832eae8fe9fbd72a0f466e80153814a96cc206988d3dd2f0b21b68855f54","last_reissued_at":"2026-05-18T00:05:03.642049Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:05:03.642049Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1809.08761","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"l0ZU03U0WeN150hobxEVbnDGM2fBo2r/jV16noNeUN8EcGVnOL7fDFoZIH+EnniAz3AXFKJjUyuX+LJ9OKSZCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T11:37:36.364036Z"},"content_sha256":"49f651b3b64bfcaee621e880a2d8eb4eec0018a956ab5c94097d0e79d789a660","schema_version":"1.0","event_id":"sha256:49f651b3b64bfcaee621e880a2d8eb4eec0018a956ab5c94097d0e79d789a660"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:3HVYGLVOR7U7XVZKB5DG5AAVHA","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Speaker Naming in Movies","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CV"],"primary_cat":"cs.CL","authors_text":"Jia Deng, Mahmoud Azab, Max Smith, Mingzhe Wang, Noriyuki Kojima, Rada Mihalcea","submitted_at":"2018-09-24T05:00:05Z","abstract_excerpt":"We propose a new model for speaker naming in movies that leverages visual, textual, and acoustic modalities in an unified optimization framework. To evaluate the performance of our model, we introduce a new dataset consisting of six episodes of the Big Bang Theory TV show and eighteen full movies covering different genres. Our experiments show that our multimodal model significantly outperforms several competitive baselines on the average weighted F-score metric. To demonstrate the effectiveness of our framework, we design an end-to-end memory network model that leverages our speaker naming mo"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.08761","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ij+fKil3KVayDSCxbMay069Z6FQQyu6m3e6XMhS7T0hXL4n1rZJODm/eEdLnBKK8mJl7dEYwTns2LNxtnqtgCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T11:37:36.364753Z"},"content_sha256":"a121d6acb9426f7abaf8fb633eda18a97b0787f31847d6d13793ce964facf11d","schema_version":"1.0","event_id":"sha256:a121d6acb9426f7abaf8fb633eda18a97b0787f31847d6d13793ce964facf11d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/bundle.json","state_url":"https://pith.science/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T11:37:36Z","links":{"resolver":"https://pith.science/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA","bundle":"https://pith.science/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/bundle.json","state":"https://pith.science/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3HVYGLVOR7U7XVZKB5DG5AAVHA/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:3HVYGLVOR7U7XVZKB5DG5AAVHA","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"8a796d474d1e3f3779ce13ec9f75d6eac318df7b5b2a57bb5604eb4cd23994b8","cross_cats_sorted":["cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-24T05:00:05Z","title_canon_sha256":"99ec91e694d16c8c2993ed680d8ae4d685963cecc8d5e2f6353118a7d53c3375"},"schema_version":"1.0","source":{"id":"1809.08761","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1809.08761","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"arxiv_version","alias_value":"1809.08761v1","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.08761","created_at":"2026-05-18T00:05:03Z"},{"alias_kind":"pith_short_12","alias_value":"3HVYGLVOR7U7","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_16","alias_value":"3HVYGLVOR7U7XVZK","created_at":"2026-05-18T12:32:02Z"},{"alias_kind":"pith_short_8","alias_value":"3HVYGLVO","created_at":"2026-05-18T12:32:02Z"}],"graph_snapshots":[{"event_id":"sha256:a121d6acb9426f7abaf8fb633eda18a97b0787f31847d6d13793ce964facf11d","target":"graph","created_at":"2026-05-18T00:05:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We propose a new model for speaker naming in movies that leverages visual, textual, and acoustic modalities in an unified optimization framework. To evaluate the performance of our model, we introduce a new dataset consisting of six episodes of the Big Bang Theory TV show and eighteen full movies covering different genres. Our experiments show that our multimodal model significantly outperforms several competitive baselines on the average weighted F-score metric. To demonstrate the effectiveness of our framework, we design an end-to-end memory network model that leverages our speaker naming mo","authors_text":"Jia Deng, Mahmoud Azab, Max Smith, Mingzhe Wang, Noriyuki Kojima, Rada Mihalcea","cross_cats":["cs.CV"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-24T05:00:05Z","title":"Speaker Naming in Movies"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.08761","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:49f651b3b64bfcaee621e880a2d8eb4eec0018a956ab5c94097d0e79d789a660","target":"record","created_at":"2026-05-18T00:05:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"8a796d474d1e3f3779ce13ec9f75d6eac318df7b5b2a57bb5604eb4cd23994b8","cross_cats_sorted":["cs.CV"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-09-24T05:00:05Z","title_canon_sha256":"99ec91e694d16c8c2993ed680d8ae4d685963cecc8d5e2f6353118a7d53c3375"},"schema_version":"1.0","source":{"id":"1809.08761","kind":"arxiv","version":1}},"canonical_sha256":"d9eb832eae8fe9fbd72a0f466e80153814a96cc206988d3dd2f0b21b68855f54","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d9eb832eae8fe9fbd72a0f466e80153814a96cc206988d3dd2f0b21b68855f54","first_computed_at":"2026-05-18T00:05:03.642049Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:03.642049Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wBIcdH+xDX37yplq+odhIthlf7N5q4UTAk885B7gqthcgrSh//VmwixroUaKmFckZY0PRYfqB7Pa3SmC50fTCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:03.642686Z","signed_message":"canonical_sha256_bytes"},"source_id":"1809.08761","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:49f651b3b64bfcaee621e880a2d8eb4eec0018a956ab5c94097d0e79d789a660","sha256:a121d6acb9426f7abaf8fb633eda18a97b0787f31847d6d13793ce964facf11d"],"state_sha256":"02d53a02abef9cd887d1fb654448052a9e3b7fbf9beefef728ac5e2c828dc240"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yS3Bba1I7On4QaQOxUKVad1OsmgRWC7eobY8vRutTrL29BtaaCsV5VTFLrxBuZwz7wmnECCclg7RpgVjJJVhCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T11:37:36.368785Z","bundle_sha256":"839387ef1f5a3189c9839f338faa783d4bd7b52e7bca353bb2d3df58e570c254"}}