{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:7TF5S2ENCXT5A24OT46PRH6FJL","short_pith_number":"pith:7TF5S2EN","schema_version":"1.0","canonical_sha256":"fccbd9688d15e7d06b8e9f3cf89fc54ade487ca7384b5c953e44d119ea44209a","source":{"kind":"arxiv","id":"1711.06330","version":2},"attestation_state":"computed","paper":{"title":"Attend and Interact: Higher-Order Object Interactions for Video Understanding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Asim Kadav, Chih-Yao Ma, Ghassan AlRegib, Hans Peter Graf, Iain Melvin, Zsolt Kira","submitted_at":"2017-11-16T22:14:52Z","abstract_excerpt":"Human actions often involve complex interactions across several inter-related objects in the scene. However, existing approaches to fine-grained video understanding or visual relationship detection often rely on single object representation or pairwise object relationships. Furthermore, learning interactions across multiple objects in hundreds of frames for video is computationally infeasible and performance may suffer since a large combinatorial space has to be modeled. In this paper, we propose to efficiently learn higher-order interactions between arbitrary subgroups of objects for fine-gra"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1711.06330","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-11-16T22:14:52Z","cross_cats_sorted":[],"title_canon_sha256":"17800f887f7943db60fc012f8093a3764e5747fa5311edb51b6922426e0e98d2","abstract_canon_sha256":"a2131514f9706dee8b4db6dcf84ddeca75d0e60fc7e2eb18cf3c460cae7f18c3"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:20:30.000008Z","signature_b64":"vZaaui1x5ss72E/u4wWlQfRgKONGPSM5btaw2m6uD/IPkNPf3AMVMBv4TrAbgmAc3hs/i53Q3fVEiysnrbGYDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fccbd9688d15e7d06b8e9f3cf89fc54ade487ca7384b5c953e44d119ea44209a","last_reissued_at":"2026-05-18T00:20:29.999627Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:20:29.999627Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Attend and Interact: Higher-Order Object Interactions for Video Understanding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Asim Kadav, Chih-Yao Ma, Ghassan AlRegib, Hans Peter Graf, Iain Melvin, Zsolt Kira","submitted_at":"2017-11-16T22:14:52Z","abstract_excerpt":"Human actions often involve complex interactions across several inter-related objects in the scene. However, existing approaches to fine-grained video understanding or visual relationship detection often rely on single object representation or pairwise object relationships. Furthermore, learning interactions across multiple objects in hundreds of frames for video is computationally infeasible and performance may suffer since a large combinatorial space has to be modeled. In this paper, we propose to efficiently learn higher-order interactions between arbitrary subgroups of objects for fine-gra"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1711.06330","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1711.06330","created_at":"2026-05-18T00:20:29.999694+00:00"},{"alias_kind":"arxiv_version","alias_value":"1711.06330v2","created_at":"2026-05-18T00:20:29.999694+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1711.06330","created_at":"2026-05-18T00:20:29.999694+00:00"},{"alias_kind":"pith_short_12","alias_value":"7TF5S2ENCXT5","created_at":"2026-05-18T12:31:05.417338+00:00"},{"alias_kind":"pith_short_16","alias_value":"7TF5S2ENCXT5A24O","created_at":"2026-05-18T12:31:05.417338+00:00"},{"alias_kind":"pith_short_8","alias_value":"7TF5S2EN","created_at":"2026-05-18T12:31:05.417338+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL","json":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL.json","graph_json":"https://pith.science/api/pith-number/7TF5S2ENCXT5A24OT46PRH6FJL/graph.json","events_json":"https://pith.science/api/pith-number/7TF5S2ENCXT5A24OT46PRH6FJL/events.json","paper":"https://pith.science/paper/7TF5S2EN"},"agent_actions":{"view_html":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL","download_json":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL.json","view_paper":"https://pith.science/paper/7TF5S2EN","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1711.06330&json=true","fetch_graph":"https://pith.science/api/pith-number/7TF5S2ENCXT5A24OT46PRH6FJL/graph.json","fetch_events":"https://pith.science/api/pith-number/7TF5S2ENCXT5A24OT46PRH6FJL/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL/action/timestamp_anchor","attest_storage":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL/action/storage_attestation","attest_author":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL/action/author_attestation","sign_citation":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL/action/citation_signature","submit_replication":"https://pith.science/pith/7TF5S2ENCXT5A24OT46PRH6FJL/action/replication_record"}},"created_at":"2026-05-18T00:20:29.999694+00:00","updated_at":"2026-05-18T00:20:29.999694+00:00"}