{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:OULZ3PQLSKDAVQNERTQXV626GZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ceadcbfe397879f5ffeede537f1583cfb8adc2fbc4e35985d4723c0cc080f4e9","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:57Z","title_canon_sha256":"1ca61be3528a3e9c8af97ab86261df7e92b860e0b8005f33d334bdebe250b622"},"schema_version":"1.0","source":{"id":"2605.14462","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.14462","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"arxiv_version","alias_value":"2605.14462v1","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14462","created_at":"2026-05-17T23:39:06Z"},{"alias_kind":"pith_short_12","alias_value":"OULZ3PQLSKDA","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"OULZ3PQLSKDAVQNE","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"OULZ3PQL","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:965603174a4d0f258f3f0a8304d1fa37107eff03e80c2c1f560e2fa5b17b01c1","target":"graph","created_at":"2026-05-17T23:39:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Across benchmark and in-the-wild videos, HA-HOI improves human-object alignment, contact consistency, temporal stability, and simulation readiness over prior monocular HOI reconstruction methods."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That accurate human motion recovered from monocular video can serve as a reliable interaction anchor whose kinematic trajectory, when projected into physics simulation, produces stable contacts and functional manipulation without additional constraints or post-processing."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"HA-HOI produces physically plausible 4D HOI animations from monocular videos by anchoring object reconstruction to human motion and refining the result in a physics-based humanoid-object simulator."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"HA-HOI recovers 4D human-object interactions from monocular videos that remain stable under physics simulation."}],"snapshot_sha256":"c5c7f52e41c48fd048a144edf80124b98d3437f88d02a82c39528575e2ac668a"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"70fe5a8d7661199c1f495fdc2d135338e5e31f1ff341aec8201eb16bdad97d63"},"paper":{"abstract_excerpt":"Recovering 4D human-object interaction (HOI) from monocular video is a key step toward scalable 3D content creation, embodied AI, and simulation-based learning. Recent methods can reconstruct temporally coherent human and object trajectories, but these trajectories often remain visual artifacts while failing to preserve stable contact, functional manipulation, or physical plausibility when used as reference motions for humanoid-object simulation. This reveals a fundamental interaction gap: HOI reconstruction should not stop at tracking a human and an object, but should recover the relation tha","authors_text":"Chengfeng Zhao, Chi-Keung Tang, Yuan Liu, Yubo Zhao, Yujin Chai, Yunao Dong, Zijiao Zeng","cross_cats":[],"headline":"HA-HOI recovers 4D human-object interactions from monocular videos that remain stable under physics simulation.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:57Z","title":"Real2Sim in HOI: Toward Physically Plausible HOI Reconstruction from Monocular Videos"},"references":{"count":15,"internal_anchors":3,"resolved_work":15,"sample":[{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":1,"title":"arXiv preprint arXiv:2507.21045 (2025) 1, 3","work_id":"d1dfd87a-04ea-454f-810f-0e3484b07ed5","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":2,"title":"//arxiv.org/abs/2212.06870","work_id":"aae2e7fc-c8d3-49a0-89aa-229fca9e29cc","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":3,"title":"arXiv preprint arXiv:2509.07920 (2025)","work_id":"8fc3503e-7edd-4db3-83ad-7cc1839ce064","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":4,"title":"Unish: Unify- ing scene and human reconstruction in a feed-forward pass","work_id":"680c4d44-7039-44d4-a3ad-db7b781e308e","year":null},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":5,"title":"Track4world: Feedforward world-centric dense 3d tracking of all pixels.arXiv preprint arXiv:2603.02573,","work_id":"237ea51d-002d-48f3-aa30-23c8bc3fed03","year":null}],"snapshot_sha256":"347e7a5804d3667762662583aed7e590d8534e83f70f784711203847cbe8c14f"},"source":{"id":"2605.14462","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-15T02:40:43.037392Z","id":"72d8df62-7c14-475a-ba48-c1a7ecb73d21","model_set":{"reader":"grok-4.3"},"one_line_summary":"HA-HOI produces physically plausible 4D HOI animations from monocular videos by anchoring object reconstruction to human motion and refining the result in a physics-based humanoid-object simulator.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"HA-HOI recovers 4D human-object interactions from monocular videos that remain stable under physics simulation.","strongest_claim":"Across benchmark and in-the-wild videos, HA-HOI improves human-object alignment, contact consistency, temporal stability, and simulation readiness over prior monocular HOI reconstruction methods.","weakest_assumption":"That accurate human motion recovered from monocular video can serve as a reliable interaction anchor whose kinematic trajectory, when projected into physics simulation, produces stable contacts and functional manipulation without additional constraints or post-processing."}},"verdict_id":"72d8df62-7c14-475a-ba48-c1a7ecb73d21"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:898322ff5e0bad72903f6bb28477386eb6afd099ec45426472c77427713ea7f8","target":"record","created_at":"2026-05-17T23:39:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ceadcbfe397879f5ffeede537f1583cfb8adc2fbc4e35985d4723c0cc080f4e9","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T06:56:57Z","title_canon_sha256":"1ca61be3528a3e9c8af97ab86261df7e92b860e0b8005f33d334bdebe250b622"},"schema_version":"1.0","source":{"id":"2605.14462","kind":"arxiv","version":1}},"canonical_sha256":"75179dbe0b92860ac1a48ce17afb5e364caadd7c2eec2119bf13b1017c0a5080","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"75179dbe0b92860ac1a48ce17afb5e364caadd7c2eec2119bf13b1017c0a5080","first_computed_at":"2026-05-17T23:39:06.766204Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:39:06.766204Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"k/c/txUcTRGXwY+D8SnOyOgP9q8/kJQX4RLFuKvUD3FNFb14XQhMtM6kxvss77TSHOwEXsJzo8b5X8vg9ea+DA==","signature_status":"signed_v1","signed_at":"2026-05-17T23:39:06.766861Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.14462","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:898322ff5e0bad72903f6bb28477386eb6afd099ec45426472c77427713ea7f8","sha256:965603174a4d0f258f3f0a8304d1fa37107eff03e80c2c1f560e2fa5b17b01c1"],"state_sha256":"b47583922315ee09e4bf19c4927b9a07f1324489a0da28049547ffff0c4b799e"}