{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:T5FYZRKPNBEKH5JNQXLSSDSL2I","short_pith_number":"pith:T5FYZRKP","canonical_record":{"source":{"id":"1606.06108","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-06-20T13:28:35Z","cross_cats_sorted":[],"title_canon_sha256":"fa42ae6fdd5cb729b7203ae10b4362d319e2a9319dad46c6ee1e447b469a0eaa","abstract_canon_sha256":"f95b420e3f136447adb7915cac68de99a4265d869bc7641e87e779e1cba677a0"},"schema_version":"1.0"},"canonical_sha256":"9f4b8cc54f6848a3f52d85d7290e4bd214ae4d423f79c323b96aebcdb609f6d6","source":{"kind":"arxiv","id":"1606.06108","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.06108","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"arxiv_version","alias_value":"1606.06108v2","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.06108","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"pith_short_12","alias_value":"T5FYZRKPNBEK","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_16","alias_value":"T5FYZRKPNBEKH5JN","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_8","alias_value":"T5FYZRKP","created_at":"2026-05-18T12:30:44Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:T5FYZRKPNBEKH5JNQXLSSDSL2I","target":"record","payload":{"canonical_record":{"source":{"id":"1606.06108","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-06-20T13:28:35Z","cross_cats_sorted":[],"title_canon_sha256":"fa42ae6fdd5cb729b7203ae10b4362d319e2a9319dad46c6ee1e447b469a0eaa","abstract_canon_sha256":"f95b420e3f136447adb7915cac68de99a4265d869bc7641e87e779e1cba677a0"},"schema_version":"1.0"},"canonical_sha256":"9f4b8cc54f6848a3f52d85d7290e4bd214ae4d423f79c323b96aebcdb609f6d6","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:45:02.702456Z","signature_b64":"sFYk/8sA6X7KUKj+uPPyXNHsUguuHT4QFUOGxtL7WtYbHrMEmAGxLy+LPOwQPy7cIB7HKq1anT7hn//VTxBkCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9f4b8cc54f6848a3f52d85d7290e4bd214ae4d423f79c323b96aebcdb609f6d6","last_reissued_at":"2026-05-18T00:45:02.702088Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:45:02.702088Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1606.06108","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:45:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EIr1f2+seuWI3zvYyPFQU8wExnvK42LfExm+7zAjldeECvS7no93/tcE7wq10Os+RwbONp++9Sc8yOCGoPbEBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T04:00:39.371793Z"},"content_sha256":"b4536d7dfc2ed06a3e94dda58198ffdd790a1e2e963fd4ecc003e0296b973792","schema_version":"1.0","event_id":"sha256:b4536d7dfc2ed06a3e94dda58198ffdd790a1e2e963fd4ecc003e0296b973792"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:T5FYZRKPNBEKH5JNQXLSSDSL2I","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"DualNet: Domain-Invariant Network for Visual Question Answering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Andrew Shin, Kuniaki Saito, Tatsuya Harada, Yoshitaka Ushiku","submitted_at":"2016-06-20T13:28:35Z","abstract_excerpt":"Visual question answering (VQA) task not only bridges the gap between images and language, but also requires that specific contents within the image are understood as indicated by linguistic context of the question, in order to generate the accurate answers. Thus, it is critical to build an efficient embedding of images and texts. We implement DualNet, which fully takes advantage of discriminative power of both image and textual features by separately performing two operations. Building an ensemble of DualNet further boosts the performance. Contrary to common belief, our method proved effectiv"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.06108","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:45:02Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"UkviFWhjvJY5s2JUPupzD5blfzfayVhLqI6sVs8r4NDHuXqqoDt8dlbtxjHDXuwolnqq641x0dXaw6Vcgm9xBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T04:00:39.372140Z"},"content_sha256":"e2963a1fff68c1d82761191b7aa1860b756b7fb9a7dc03d9953f2d1c1f7cf51c","schema_version":"1.0","event_id":"sha256:e2963a1fff68c1d82761191b7aa1860b756b7fb9a7dc03d9953f2d1c1f7cf51c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/bundle.json","state_url":"https://pith.science/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T04:00:39Z","links":{"resolver":"https://pith.science/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I","bundle":"https://pith.science/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/bundle.json","state":"https://pith.science/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/state.json","well_known_bundle":"https://pith.science/.well-known/pith/T5FYZRKPNBEKH5JNQXLSSDSL2I/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:T5FYZRKPNBEKH5JNQXLSSDSL2I","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f95b420e3f136447adb7915cac68de99a4265d869bc7641e87e779e1cba677a0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-06-20T13:28:35Z","title_canon_sha256":"fa42ae6fdd5cb729b7203ae10b4362d319e2a9319dad46c6ee1e447b469a0eaa"},"schema_version":"1.0","source":{"id":"1606.06108","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1606.06108","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"arxiv_version","alias_value":"1606.06108v2","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1606.06108","created_at":"2026-05-18T00:45:02Z"},{"alias_kind":"pith_short_12","alias_value":"T5FYZRKPNBEK","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_16","alias_value":"T5FYZRKPNBEKH5JN","created_at":"2026-05-18T12:30:44Z"},{"alias_kind":"pith_short_8","alias_value":"T5FYZRKP","created_at":"2026-05-18T12:30:44Z"}],"graph_snapshots":[{"event_id":"sha256:e2963a1fff68c1d82761191b7aa1860b756b7fb9a7dc03d9953f2d1c1f7cf51c","target":"graph","created_at":"2026-05-18T00:45:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Visual question answering (VQA) task not only bridges the gap between images and language, but also requires that specific contents within the image are understood as indicated by linguistic context of the question, in order to generate the accurate answers. Thus, it is critical to build an efficient embedding of images and texts. We implement DualNet, which fully takes advantage of discriminative power of both image and textual features by separately performing two operations. Building an ensemble of DualNet further boosts the performance. Contrary to common belief, our method proved effectiv","authors_text":"Andrew Shin, Kuniaki Saito, Tatsuya Harada, Yoshitaka Ushiku","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-06-20T13:28:35Z","title":"DualNet: Domain-Invariant Network for Visual Question Answering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1606.06108","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b4536d7dfc2ed06a3e94dda58198ffdd790a1e2e963fd4ecc003e0296b973792","target":"record","created_at":"2026-05-18T00:45:02Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f95b420e3f136447adb7915cac68de99a4265d869bc7641e87e779e1cba677a0","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-06-20T13:28:35Z","title_canon_sha256":"fa42ae6fdd5cb729b7203ae10b4362d319e2a9319dad46c6ee1e447b469a0eaa"},"schema_version":"1.0","source":{"id":"1606.06108","kind":"arxiv","version":2}},"canonical_sha256":"9f4b8cc54f6848a3f52d85d7290e4bd214ae4d423f79c323b96aebcdb609f6d6","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9f4b8cc54f6848a3f52d85d7290e4bd214ae4d423f79c323b96aebcdb609f6d6","first_computed_at":"2026-05-18T00:45:02.702088Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:45:02.702088Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"sFYk/8sA6X7KUKj+uPPyXNHsUguuHT4QFUOGxtL7WtYbHrMEmAGxLy+LPOwQPy7cIB7HKq1anT7hn//VTxBkCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:45:02.702456Z","signed_message":"canonical_sha256_bytes"},"source_id":"1606.06108","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b4536d7dfc2ed06a3e94dda58198ffdd790a1e2e963fd4ecc003e0296b973792","sha256:e2963a1fff68c1d82761191b7aa1860b756b7fb9a7dc03d9953f2d1c1f7cf51c"],"state_sha256":"451a48e2315579538876242ec862a9825c27f87ae2cc98b28b1f333f00627cf2"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"J9yFIV2JjzmWmqG1C4vUyfdxI3ixgYj/nFX9E6IBsmj0N+Rv+CJT1EAw19DGSbJBl7vbuiq/mMNz6kRRwFlzBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T04:00:39.374234Z","bundle_sha256":"bc9bb49faa13d53ecdde38962b42a99b34e1799e240b6bf823c3813eca3050fc"}}