{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:QXUIY7F4ZNQ3LGICOAVIQX2FYN","short_pith_number":"pith:QXUIY7F4","schema_version":"1.0","canonical_sha256":"85e88c7cbccb61b59902702a885f45c3592b3dece0a57b0b545c3778d0cb5854","source":{"kind":"arxiv","id":"1604.01485","version":1},"attestation_state":"computed","paper":{"title":"A Focused Dynamic Attention Model for Visual Question Answering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.NE"],"primary_cat":"cs.CV","authors_text":"Ilija Ilievski, Jiashi Feng, Shuicheng Yan","submitted_at":"2016-04-06T05:16:10Z","abstract_excerpt":"Visual Question and Answering (VQA) problems are attracting increasing interest from multiple research disciplines. Solving VQA problems requires techniques from both computer vision for understanding the visual contents of a presented image or video, as well as the ones from natural language processing for understanding semantics of the question and generating the answers. Regarding visual content modeling, most of existing VQA methods adopt the strategy of extracting global features from the image or video, which inevitably fails in capturing fine-grained information such as spatial configur"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1604.01485","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-04-06T05:16:10Z","cross_cats_sorted":["cs.CL","cs.NE"],"title_canon_sha256":"70efb1fe1ed186132388e311b8dbfcbb15d688d22ebcedcdd18e0e8b87ea51f8","abstract_canon_sha256":"cff3152fc88acbbe7328a59a247b3488c68a459fbd9e709a5279e592f165360d"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:17:36.283792Z","signature_b64":"J/3Rn7Nmqi652YRdTfoEHu+N+8MM1BrB6k32sBe0xKIyqq4PMFGQkkSMoTJDlWy1A/XIOFV8er70P8GmWuXtBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"85e88c7cbccb61b59902702a885f45c3592b3dece0a57b0b545c3778d0cb5854","last_reissued_at":"2026-05-18T01:17:36.283110Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:17:36.283110Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"A Focused Dynamic Attention Model for Visual Question Answering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.NE"],"primary_cat":"cs.CV","authors_text":"Ilija Ilievski, Jiashi Feng, Shuicheng Yan","submitted_at":"2016-04-06T05:16:10Z","abstract_excerpt":"Visual Question and Answering (VQA) problems are attracting increasing interest from multiple research disciplines. Solving VQA problems requires techniques from both computer vision for understanding the visual contents of a presented image or video, as well as the ones from natural language processing for understanding semantics of the question and generating the answers. Regarding visual content modeling, most of existing VQA methods adopt the strategy of extracting global features from the image or video, which inevitably fails in capturing fine-grained information such as spatial configur"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.01485","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1604.01485","created_at":"2026-05-18T01:17:36.283221+00:00"},{"alias_kind":"arxiv_version","alias_value":"1604.01485v1","created_at":"2026-05-18T01:17:36.283221+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.01485","created_at":"2026-05-18T01:17:36.283221+00:00"},{"alias_kind":"pith_short_12","alias_value":"QXUIY7F4ZNQ3","created_at":"2026-05-18T12:30:41.710351+00:00"},{"alias_kind":"pith_short_16","alias_value":"QXUIY7F4ZNQ3LGIC","created_at":"2026-05-18T12:30:41.710351+00:00"},{"alias_kind":"pith_short_8","alias_value":"QXUIY7F4","created_at":"2026-05-18T12:30:41.710351+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN","json":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN.json","graph_json":"https://pith.science/api/pith-number/QXUIY7F4ZNQ3LGICOAVIQX2FYN/graph.json","events_json":"https://pith.science/api/pith-number/QXUIY7F4ZNQ3LGICOAVIQX2FYN/events.json","paper":"https://pith.science/paper/QXUIY7F4"},"agent_actions":{"view_html":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN","download_json":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN.json","view_paper":"https://pith.science/paper/QXUIY7F4","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1604.01485&json=true","fetch_graph":"https://pith.science/api/pith-number/QXUIY7F4ZNQ3LGICOAVIQX2FYN/graph.json","fetch_events":"https://pith.science/api/pith-number/QXUIY7F4ZNQ3LGICOAVIQX2FYN/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN/action/timestamp_anchor","attest_storage":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN/action/storage_attestation","attest_author":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN/action/author_attestation","sign_citation":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN/action/citation_signature","submit_replication":"https://pith.science/pith/QXUIY7F4ZNQ3LGICOAVIQX2FYN/action/replication_record"}},"created_at":"2026-05-18T01:17:36.283221+00:00","updated_at":"2026-05-18T01:17:36.283221+00:00"}