{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:D53YU44R7OINXQXZSBE7R5PINM","short_pith_number":"pith:D53YU44R","canonical_record":{"source":{"id":"1907.03609","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-07-08T13:37:48Z","cross_cats_sorted":[],"title_canon_sha256":"1a323090ca160877236a0bab4bce883f7a2d6ac2dcbd831c15f827f5358c46f5","abstract_canon_sha256":"36fbcd941f75d1025373e9648443528c940c22ea882f258b859c57984675c1c8"},"schema_version":"1.0"},"canonical_sha256":"1f778a7391fb90dbc2f99049f8f5e86b1ac193201062f0dce24d69a47fbd18d6","source":{"kind":"arxiv","id":"1907.03609","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.03609","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"arxiv_version","alias_value":"1907.03609v1","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.03609","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"pith_short_12","alias_value":"D53YU44R7OIN","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_16","alias_value":"D53YU44R7OINXQXZ","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_8","alias_value":"D53YU44R","created_at":"2026-05-18T12:33:15Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:D53YU44R7OINXQXZSBE7R5PINM","target":"record","payload":{"canonical_record":{"source":{"id":"1907.03609","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-07-08T13:37:48Z","cross_cats_sorted":[],"title_canon_sha256":"1a323090ca160877236a0bab4bce883f7a2d6ac2dcbd831c15f827f5358c46f5","abstract_canon_sha256":"36fbcd941f75d1025373e9648443528c940c22ea882f258b859c57984675c1c8"},"schema_version":"1.0"},"canonical_sha256":"1f778a7391fb90dbc2f99049f8f5e86b1ac193201062f0dce24d69a47fbd18d6","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:14.199570Z","signature_b64":"k52p6M/V/jyGVGXR1kfBIXGicLC92IlFn9dBGEvUPU1HqR/yJhChqKJcbBdmxbZloQeInFv0SEhyzB792/5+Dw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1f778a7391fb90dbc2f99049f8f5e86b1ac193201062f0dce24d69a47fbd18d6","last_reissued_at":"2026-05-17T23:41:14.199075Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:14.199075Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1907.03609","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"tZ7aFyoAxGe7R2np1ClUcQfY+ZF/DVsu4LiqBZZhchsC26ZWOLz10qXbGsdCjmMcTWKHGSXJkAz7EtAKkV5bCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T10:44:31.359527Z"},"content_sha256":"22bd3d93a69b203764e69fb83b43005ccc8213dfe7fb6af8ff639bcf7a5b64fa","schema_version":"1.0","event_id":"sha256:22bd3d93a69b203764e69fb83b43005ccc8213dfe7fb6af8ff639bcf7a5b64fa"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:D53YU44R7OINXQXZSBE7R5PINM","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Variational Context: Exploiting Visual and Textual Context for Grounding Referring Expressions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Hanwang Zhang, Shih-Fu Chang, Yulei Niu, Zhiwu Lu","submitted_at":"2019-07-08T13:37:48Z","abstract_excerpt":"We focus on grounding (i.e., localizing or linking) referring expressions in images, e.g., ``largest elephant standing behind baby elephant''. This is a general yet challenging vision-language task since it does not only require the localization of objects, but also the multimodal comprehension of context -- visual attributes (e.g., ``largest'', ``baby'') and relationships (e.g., ``behind'') that help to distinguish the referent from other objects, especially those of the same category. Due to the exponential complexity involved in modeling the context associated with multiple image regions, e"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.03609","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:41:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QVb+MzFQYIxyADFMBLMlh7O+MBCzihRM+WSoy4Jbrh0ToQElyhFw9hUUXz1Me1BuBlyN92tM7SKPL0QkukBgCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T10:44:31.360223Z"},"content_sha256":"bb96c03ded586075f35c8d26fd7bbcf17b6df404665a1d7016186e01c48b3d6e","schema_version":"1.0","event_id":"sha256:bb96c03ded586075f35c8d26fd7bbcf17b6df404665a1d7016186e01c48b3d6e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/D53YU44R7OINXQXZSBE7R5PINM/bundle.json","state_url":"https://pith.science/pith/D53YU44R7OINXQXZSBE7R5PINM/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/D53YU44R7OINXQXZSBE7R5PINM/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T10:44:31Z","links":{"resolver":"https://pith.science/pith/D53YU44R7OINXQXZSBE7R5PINM","bundle":"https://pith.science/pith/D53YU44R7OINXQXZSBE7R5PINM/bundle.json","state":"https://pith.science/pith/D53YU44R7OINXQXZSBE7R5PINM/state.json","well_known_bundle":"https://pith.science/.well-known/pith/D53YU44R7OINXQXZSBE7R5PINM/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:D53YU44R7OINXQXZSBE7R5PINM","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"36fbcd941f75d1025373e9648443528c940c22ea882f258b859c57984675c1c8","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-07-08T13:37:48Z","title_canon_sha256":"1a323090ca160877236a0bab4bce883f7a2d6ac2dcbd831c15f827f5358c46f5"},"schema_version":"1.0","source":{"id":"1907.03609","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1907.03609","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"arxiv_version","alias_value":"1907.03609v1","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1907.03609","created_at":"2026-05-17T23:41:14Z"},{"alias_kind":"pith_short_12","alias_value":"D53YU44R7OIN","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_16","alias_value":"D53YU44R7OINXQXZ","created_at":"2026-05-18T12:33:15Z"},{"alias_kind":"pith_short_8","alias_value":"D53YU44R","created_at":"2026-05-18T12:33:15Z"}],"graph_snapshots":[{"event_id":"sha256:bb96c03ded586075f35c8d26fd7bbcf17b6df404665a1d7016186e01c48b3d6e","target":"graph","created_at":"2026-05-17T23:41:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We focus on grounding (i.e., localizing or linking) referring expressions in images, e.g., ``largest elephant standing behind baby elephant''. This is a general yet challenging vision-language task since it does not only require the localization of objects, but also the multimodal comprehension of context -- visual attributes (e.g., ``largest'', ``baby'') and relationships (e.g., ``behind'') that help to distinguish the referent from other objects, especially those of the same category. Due to the exponential complexity involved in modeling the context associated with multiple image regions, e","authors_text":"Hanwang Zhang, Shih-Fu Chang, Yulei Niu, Zhiwu Lu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-07-08T13:37:48Z","title":"Variational Context: Exploiting Visual and Textual Context for Grounding Referring Expressions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1907.03609","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:22bd3d93a69b203764e69fb83b43005ccc8213dfe7fb6af8ff639bcf7a5b64fa","target":"record","created_at":"2026-05-17T23:41:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"36fbcd941f75d1025373e9648443528c940c22ea882f258b859c57984675c1c8","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2019-07-08T13:37:48Z","title_canon_sha256":"1a323090ca160877236a0bab4bce883f7a2d6ac2dcbd831c15f827f5358c46f5"},"schema_version":"1.0","source":{"id":"1907.03609","kind":"arxiv","version":1}},"canonical_sha256":"1f778a7391fb90dbc2f99049f8f5e86b1ac193201062f0dce24d69a47fbd18d6","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1f778a7391fb90dbc2f99049f8f5e86b1ac193201062f0dce24d69a47fbd18d6","first_computed_at":"2026-05-17T23:41:14.199075Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:41:14.199075Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"k52p6M/V/jyGVGXR1kfBIXGicLC92IlFn9dBGEvUPU1HqR/yJhChqKJcbBdmxbZloQeInFv0SEhyzB792/5+Dw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:41:14.199570Z","signed_message":"canonical_sha256_bytes"},"source_id":"1907.03609","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:22bd3d93a69b203764e69fb83b43005ccc8213dfe7fb6af8ff639bcf7a5b64fa","sha256:bb96c03ded586075f35c8d26fd7bbcf17b6df404665a1d7016186e01c48b3d6e"],"state_sha256":"653311d06d1dd9aac62ae907581ac3aa6dc879999c4fe59eb4189508920bc21e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8jc1A7ko2bmPtHW3PUZ1Fk5yL4/WzC4hT326ZWu+zCcyZgBRFdD+wns9VokoQgst4hsJ2Maj6La0cnBWv+iACw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T10:44:31.363954Z","bundle_sha256":"70a6dbbbb3af9c7cfef6184a1859975214443146457e667b320d89c512e6932b"}}