{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:M5XYYPEJLZNHUOANE4A5NGOW37","short_pith_number":"pith:M5XYYPEJ","schema_version":"1.0","canonical_sha256":"676f8c3c895e5a7a380d2701d699d6dff818f1b5533d4a3b4b96f865a8e70561","source":{"kind":"arxiv","id":"2605.18956","version":1},"attestation_state":"computed","paper":{"title":"MotionMERGE: A Multi-granular Framework for Human Motion Editing, Reasoning, Generation, and Explanation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bizhu Wu, Jianfeng Ren, Jinheng Xie, Linlin Shen, Rong Qu, Ruibin Bai, Wenting Chen, Zhe Kong","submitted_at":"2026-05-18T18:00:04Z","abstract_excerpt":"Recent motion-language models unify tasks like comprehension and generation but operate at a coarse granularity, lacking fine-grained understanding and nuanced control over body parts needed for animation or interaction. This stems from fundamental issues in both the model and the data, in which the model can't focus on motion's localized pattern, and the training data lacks fine-grained supervision. To tackle this, we propose MotionMERGE, a unified framework that bridges the granularity gap. First, we pioneer the study of fine-grained languageguided motion control, including detailed understa"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.18956","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-18T18:00:04Z","cross_cats_sorted":[],"title_canon_sha256":"26e3628999a4995af6ce882a3ca401397c26dfb0b990bda958c63cac67bae040","abstract_canon_sha256":"6cb7b566c985bcbd1f3d0b351c56bfcb25fded40d2939c2f422a079f87557c01"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:38.465128Z","signature_b64":"dTkY4j2FYzA1aVXJHPFTlGI/8/P61sMPOXYsSfrdn4PENmekl7gTCCc7ff0V+LFL9XhVe+HLUYr0OOtBASzcDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"676f8c3c895e5a7a380d2701d699d6dff818f1b5533d4a3b4b96f865a8e70561","last_reissued_at":"2026-05-20T00:06:38.464362Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:38.464362Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"MotionMERGE: A Multi-granular Framework for Human Motion Editing, Reasoning, Generation, and Explanation","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bizhu Wu, Jianfeng Ren, Jinheng Xie, Linlin Shen, Rong Qu, Ruibin Bai, Wenting Chen, Zhe Kong","submitted_at":"2026-05-18T18:00:04Z","abstract_excerpt":"Recent motion-language models unify tasks like comprehension and generation but operate at a coarse granularity, lacking fine-grained understanding and nuanced control over body parts needed for animation or interaction. This stems from fundamental issues in both the model and the data, in which the model can't focus on motion's localized pattern, and the training data lacks fine-grained supervision. To tackle this, we propose MotionMERGE, a unified framework that bridges the granularity gap. First, we pioneer the study of fine-grained languageguided motion control, including detailed understa"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18956","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18956/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.18956","created_at":"2026-05-20T00:06:38.464472+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.18956v1","created_at":"2026-05-20T00:06:38.464472+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18956","created_at":"2026-05-20T00:06:38.464472+00:00"},{"alias_kind":"pith_short_12","alias_value":"M5XYYPEJLZNH","created_at":"2026-05-20T00:06:38.464472+00:00"},{"alias_kind":"pith_short_16","alias_value":"M5XYYPEJLZNHUOAN","created_at":"2026-05-20T00:06:38.464472+00:00"},{"alias_kind":"pith_short_8","alias_value":"M5XYYPEJ","created_at":"2026-05-20T00:06:38.464472+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37","json":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37.json","graph_json":"https://pith.science/api/pith-number/M5XYYPEJLZNHUOANE4A5NGOW37/graph.json","events_json":"https://pith.science/api/pith-number/M5XYYPEJLZNHUOANE4A5NGOW37/events.json","paper":"https://pith.science/paper/M5XYYPEJ"},"agent_actions":{"view_html":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37","download_json":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37.json","view_paper":"https://pith.science/paper/M5XYYPEJ","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.18956&json=true","fetch_graph":"https://pith.science/api/pith-number/M5XYYPEJLZNHUOANE4A5NGOW37/graph.json","fetch_events":"https://pith.science/api/pith-number/M5XYYPEJLZNHUOANE4A5NGOW37/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37/action/timestamp_anchor","attest_storage":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37/action/storage_attestation","attest_author":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37/action/author_attestation","sign_citation":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37/action/citation_signature","submit_replication":"https://pith.science/pith/M5XYYPEJLZNHUOANE4A5NGOW37/action/replication_record"}},"created_at":"2026-05-20T00:06:38.464472+00:00","updated_at":"2026-05-20T00:06:38.464472+00:00"}