{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:XO7DD3QZ74M5JARCCFIDZ3BUIL","short_pith_number":"pith:XO7DD3QZ","canonical_record":{"source":{"id":"1712.00609","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-12-02T14:14:50Z","cross_cats_sorted":[],"title_canon_sha256":"fb4bab9d25f4d43ab8c41117e7083bdcf7641dc220f1518044fa7a68c7bc6600","abstract_canon_sha256":"0dbb434ca607a73340e6c3ef77ca68a34d7b641cb18f12cfad52c0c11bb14116"},"schema_version":"1.0"},"canonical_sha256":"bbbe31ee19ff19d4822211503cec3442c16cfd8e75322b5567bc98ae425173c1","source":{"kind":"arxiv","id":"1712.00609","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.00609","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"arxiv_version","alias_value":"1712.00609v1","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.00609","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"pith_short_12","alias_value":"XO7DD3QZ74M5","created_at":"2026-05-18T12:31:56Z"},{"alias_kind":"pith_short_16","alias_value":"XO7DD3QZ74M5JARC","created_at":"2026-05-18T12:31:56Z"},{"alias_kind":"pith_short_8","alias_value":"XO7DD3QZ","created_at":"2026-05-18T12:31:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:XO7DD3QZ74M5JARCCFIDZ3BUIL","target":"record","payload":{"canonical_record":{"source":{"id":"1712.00609","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-12-02T14:14:50Z","cross_cats_sorted":[],"title_canon_sha256":"fb4bab9d25f4d43ab8c41117e7083bdcf7641dc220f1518044fa7a68c7bc6600","abstract_canon_sha256":"0dbb434ca607a73340e6c3ef77ca68a34d7b641cb18f12cfad52c0c11bb14116"},"schema_version":"1.0"},"canonical_sha256":"bbbe31ee19ff19d4822211503cec3442c16cfd8e75322b5567bc98ae425173c1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:29:04.652877Z","signature_b64":"TgU6ejzmsxw4+QACzppWsj/IOJT/cnrFahPLrxFsGuNvO7soU9a8jIyi1fm+GguVvgTDllfYgs829HDJQgF1AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bbbe31ee19ff19d4822211503cec3442c16cfd8e75322b5567bc98ae425173c1","last_reissued_at":"2026-05-18T00:29:04.652155Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:29:04.652155Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1712.00609","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Lcua3PvwBIWRZFKIEGKgnvotI5L+9K9HMeYSrp8j9gHrDei/X4iZbmiBu8sfKqn2VOosTKy6vD1HoqvoIVcvDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T07:34:10.811471Z"},"content_sha256":"7d18ff48ed55ff2d35ab06823b00f0d6e271ccb73d02296343b46c06a8c54c00","schema_version":"1.0","event_id":"sha256:7d18ff48ed55ff2d35ab06823b00f0d6e271ccb73d02296343b46c06a8c54c00"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:XO7DD3QZ74M5JARCCFIDZ3BUIL","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Improving Visually Grounded Sentence Representations with Self-Attention","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Kang Min Yoo, Sang-goo Lee, Youhyun Shin","submitted_at":"2017-12-02T14:14:50Z","abstract_excerpt":"Sentence representation models trained only on language could potentially suffer from the grounding problem. Recent work has shown promising results in improving the qualities of sentence representations by jointly training them with associated image features. However, the grounding capability is limited due to distant connection between input sentences and image features by the design of the architecture. In order to further close the gap, we propose applying self-attention mechanism to the sentence encoder to deepen the grounding effect. Our results on transfer tasks show that self-attentive"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.00609","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:29:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"f0wygI43EIBth7k/K2dDHhAA/G1F928ccgL17SIIXgCOmFjHm+r5s6llzBpTK0J2ADja/Fwe2V7H0S31PfrACQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T07:34:10.811830Z"},"content_sha256":"bb3ba8ec399df44e3528a026ab9897f158428bb75c8483b35859ce2131bf0708","schema_version":"1.0","event_id":"sha256:bb3ba8ec399df44e3528a026ab9897f158428bb75c8483b35859ce2131bf0708"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/bundle.json","state_url":"https://pith.science/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T07:34:10Z","links":{"resolver":"https://pith.science/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL","bundle":"https://pith.science/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/bundle.json","state":"https://pith.science/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XO7DD3QZ74M5JARCCFIDZ3BUIL/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:XO7DD3QZ74M5JARCCFIDZ3BUIL","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0dbb434ca607a73340e6c3ef77ca68a34d7b641cb18f12cfad52c0c11bb14116","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-12-02T14:14:50Z","title_canon_sha256":"fb4bab9d25f4d43ab8c41117e7083bdcf7641dc220f1518044fa7a68c7bc6600"},"schema_version":"1.0","source":{"id":"1712.00609","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.00609","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"arxiv_version","alias_value":"1712.00609v1","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.00609","created_at":"2026-05-18T00:29:04Z"},{"alias_kind":"pith_short_12","alias_value":"XO7DD3QZ74M5","created_at":"2026-05-18T12:31:56Z"},{"alias_kind":"pith_short_16","alias_value":"XO7DD3QZ74M5JARC","created_at":"2026-05-18T12:31:56Z"},{"alias_kind":"pith_short_8","alias_value":"XO7DD3QZ","created_at":"2026-05-18T12:31:56Z"}],"graph_snapshots":[{"event_id":"sha256:bb3ba8ec399df44e3528a026ab9897f158428bb75c8483b35859ce2131bf0708","target":"graph","created_at":"2026-05-18T00:29:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Sentence representation models trained only on language could potentially suffer from the grounding problem. Recent work has shown promising results in improving the qualities of sentence representations by jointly training them with associated image features. However, the grounding capability is limited due to distant connection between input sentences and image features by the design of the architecture. In order to further close the gap, we propose applying self-attention mechanism to the sentence encoder to deepen the grounding effect. Our results on transfer tasks show that self-attentive","authors_text":"Kang Min Yoo, Sang-goo Lee, Youhyun Shin","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-12-02T14:14:50Z","title":"Improving Visually Grounded Sentence Representations with Self-Attention"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.00609","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7d18ff48ed55ff2d35ab06823b00f0d6e271ccb73d02296343b46c06a8c54c00","target":"record","created_at":"2026-05-18T00:29:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0dbb434ca607a73340e6c3ef77ca68a34d7b641cb18f12cfad52c0c11bb14116","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2017-12-02T14:14:50Z","title_canon_sha256":"fb4bab9d25f4d43ab8c41117e7083bdcf7641dc220f1518044fa7a68c7bc6600"},"schema_version":"1.0","source":{"id":"1712.00609","kind":"arxiv","version":1}},"canonical_sha256":"bbbe31ee19ff19d4822211503cec3442c16cfd8e75322b5567bc98ae425173c1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bbbe31ee19ff19d4822211503cec3442c16cfd8e75322b5567bc98ae425173c1","first_computed_at":"2026-05-18T00:29:04.652155Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:29:04.652155Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"TgU6ejzmsxw4+QACzppWsj/IOJT/cnrFahPLrxFsGuNvO7soU9a8jIyi1fm+GguVvgTDllfYgs829HDJQgF1AA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:29:04.652877Z","signed_message":"canonical_sha256_bytes"},"source_id":"1712.00609","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7d18ff48ed55ff2d35ab06823b00f0d6e271ccb73d02296343b46c06a8c54c00","sha256:bb3ba8ec399df44e3528a026ab9897f158428bb75c8483b35859ce2131bf0708"],"state_sha256":"d3dd43eb98e7f0f0a5714f3dd98a4368ba53789877d5909199bf7a8a8e40748a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NlmpJqQ3CnkUWUMF3SSnWu5WDaLe1qzV2u4ps9lcAUK6UcccfuLWDJ0IdpHL4ljEnmPJS+EeImAOjXRRxf7RBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T07:34:10.814225Z","bundle_sha256":"afeef1ac4de4bc271f5ed791f4dab1c8c0e6bcbbc80ac53172c52218964662f1"}}