{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:MHKVTQM5LPBDD56S6CHWUPDUWT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ed88aa5f8b92c269cd91cd7d6e1fac608f010b5ee53df0709dab5b30dc123c7e","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-03T11:53:57Z","title_canon_sha256":"3f3c30dd7829980db2c759892c5fc3abed5b44047e5d584b9e87a0679d372adf"},"schema_version":"1.0","source":{"id":"2606.04773","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.04773","created_at":"2026-06-04T01:09:29Z"},{"alias_kind":"arxiv_version","alias_value":"2606.04773v1","created_at":"2026-06-04T01:09:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.04773","created_at":"2026-06-04T01:09:29Z"},{"alias_kind":"pith_short_12","alias_value":"MHKVTQM5LPBD","created_at":"2026-06-04T01:09:29Z"},{"alias_kind":"pith_short_16","alias_value":"MHKVTQM5LPBDD56S","created_at":"2026-06-04T01:09:29Z"},{"alias_kind":"pith_short_8","alias_value":"MHKVTQM5","created_at":"2026-06-04T01:09:29Z"}],"graph_snapshots":[{"event_id":"sha256:038dd292fdfb4e39e9f9330d3113020e6b23c13232a8ae1b30a0d8e96f000011","target":"graph","created_at":"2026-06-04T01:09:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.04773/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reliable evaluation of human motion understanding is fundamental to advancing embodied AI, robotics, and animation. However, existing benchmarks suffer from coarse semantic granularity, undifferentiated difficulty, limited annotation quality, and pervasive answer ambiguity, leaving them unable to diagnose where current models fail. To bridge this gap, we introduce NextMotionQA, a comprehensive benchmark that leverages vision-language models (VLMs) for semi-automated, expert-verified dataset. NextMotionQA features three complementary tasks: multiple-choice question answering, video captioning, ","authors_text":"Andreas Geiger, Chuqiao Li, Gerard Pons-Moll, Xianghui Xie, Yong Cao","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-03T11:53:57Z","title":"NextMotionQA: Benchmarking and Judging Human Motion Understanding with Vision-Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.04773","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9cfac5111f882d28d66de51543ba92e98905f7d0d018e4c325ca52d31d5ea71b","target":"record","created_at":"2026-06-04T01:09:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ed88aa5f8b92c269cd91cd7d6e1fac608f010b5ee53df0709dab5b30dc123c7e","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-06-03T11:53:57Z","title_canon_sha256":"3f3c30dd7829980db2c759892c5fc3abed5b44047e5d584b9e87a0679d372adf"},"schema_version":"1.0","source":{"id":"2606.04773","kind":"arxiv","version":1}},"canonical_sha256":"61d559c19d5bc231f7d2f08f6a3c74b4c8c21d90b5c3700b3ad320b74f2968f3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"61d559c19d5bc231f7d2f08f6a3c74b4c8c21d90b5c3700b3ad320b74f2968f3","first_computed_at":"2026-06-04T01:09:29.491386Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-04T01:09:29.491386Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"b2oqasYObJf0MydkCNu52FdPDcNB31HqhGtWlOR713Gv+4/IgdvMzvoGSfP2fvbARm+pDN4M7EILLk+shho5Bg==","signature_status":"signed_v1","signed_at":"2026-06-04T01:09:29.491881Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.04773","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9cfac5111f882d28d66de51543ba92e98905f7d0d018e4c325ca52d31d5ea71b","sha256:038dd292fdfb4e39e9f9330d3113020e6b23c13232a8ae1b30a0d8e96f000011"],"state_sha256":"7eee16b03ced2b1bb6bf63c0f097c523c27383164433313d622c09cea3905520"}