{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:5JVWW2JHOWF4473VCMTK3YPTWS","short_pith_number":"pith:5JVWW2JH","canonical_record":{"source":{"id":"2605.05765","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T06:58:34Z","cross_cats_sorted":[],"title_canon_sha256":"cea5e84d506d4c570fcbb21e7c5bad7bc53bae3d04451a329018fb5ff0190c01","abstract_canon_sha256":"4bbaf9a8e2276ecc29bb9287d89b655a81a46c982e19d565f9ccd8aaf6576779"},"schema_version":"1.0"},"canonical_sha256":"ea6b6b6927758bce7f751326ade1f3b4845cc052d3955a50f1645695b86ac0a2","source":{"kind":"arxiv","id":"2605.05765","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.05765","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"arxiv_version","alias_value":"2605.05765v2","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.05765","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_12","alias_value":"5JVWW2JHOWF4","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_16","alias_value":"5JVWW2JHOWF4473V","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_8","alias_value":"5JVWW2JH","created_at":"2026-05-22T01:04:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:5JVWW2JHOWF4473VCMTK3YPTWS","target":"record","payload":{"canonical_record":{"source":{"id":"2605.05765","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T06:58:34Z","cross_cats_sorted":[],"title_canon_sha256":"cea5e84d506d4c570fcbb21e7c5bad7bc53bae3d04451a329018fb5ff0190c01","abstract_canon_sha256":"4bbaf9a8e2276ecc29bb9287d89b655a81a46c982e19d565f9ccd8aaf6576779"},"schema_version":"1.0"},"canonical_sha256":"ea6b6b6927758bce7f751326ade1f3b4845cc052d3955a50f1645695b86ac0a2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T01:04:04.870525Z","signature_b64":"7vCd+otwXCZjtnApJHR4BuVTNBNVVXtMOLWzZ127NVFuaIfV3SItvjToRNgbnH89IS2LND6CJZDKGUY3RfXwBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ea6b6b6927758bce7f751326ade1f3b4845cc052d3955a50f1645695b86ac0a2","last_reissued_at":"2026-05-22T01:04:04.869926Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T01:04:04.869926Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.05765","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ktdrpZ2bVRAMB7wEAl/TnOSe8jRM88ymNrwdqzJrfw0PpPyCctbPzSkpaby6lWmEyq44ES8+uItwvt4d1wU/Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T04:42:27.499481Z"},"content_sha256":"0cd477d3d1a4d103724224e74ed032ec616bacfb2bb80e5768838e5f346e3d20","schema_version":"1.0","event_id":"sha256:0cd477d3d1a4d103724224e74ed032ec616bacfb2bb80e5768838e5f346e3d20"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:5JVWW2JHOWF4473VCMTK3YPTWS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"X-OmniClaw Technical Report: A Unified Mobile Agent for Multimodal Understanding and Interaction","license":"http://creativecommons.org/licenses/by/4.0/","headline":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness.","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Binqiang Pan, Chao Li, Haobo Ji, Haonan Lu, Peng Liu, Qi Qi, Qiuxia Hou, Qi Wu, Quanlong Zheng, Ru Zhen, Xiaoming Ren, Yang Song, Yanhao Zhang, Zhenyi Liao","submitted_at":"2026-05-07T06:58:34Z","abstract_excerpt":"Inspired by the development of OpenClaw, there is a growing demand for mobile-based personal agents capable of handling complex and intuitive interactions. In this technical report, we introduce X-OmniClaw, a unified mobile agent designed for multimodal understanding and interaction in the Android ecosystem. This unified architecture of perception, memory, and action enables the agent to handle complex mobile tasks with high contextual awareness. Specifically, Omni Perception provides a unified multimodal ingress pipeline that integrates UI states, real-world visual contexts, and speech inputs"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"Demonstrations across diverse scenarios show that X-OmniClaw effectively enhances interaction efficiency and task reliability, providing a practical architectural blueprint for the next generation of mobile-native personal assistants.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That the described Omni Perception, Memory, and Action components will integrate and perform robustly in real-world conditions, as the abstract provides no quantitative metrics, baselines, or implementation details to support the effectiveness claims.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"X-OmniClaw presents a unified architecture for Android mobile agents using Omni Perception, Memory, and Action modules to enable efficient multimodal task handling and personalized interactions.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"64c7dbb4182a9521d9aac47b754cf04560c99eb01b31d71d6a101f7f08b47b7e"},"source":{"id":"2605.05765","kind":"arxiv","version":2},"verdict":{"id":"bb1488a4-6bca-4d29-bb51-a98b7acc9929","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-08T14:49:12.379064Z","strongest_claim":"Demonstrations across diverse scenarios show that X-OmniClaw effectively enhances interaction efficiency and task reliability, providing a practical architectural blueprint for the next generation of mobile-native personal assistants.","one_line_summary":"X-OmniClaw presents a unified architecture for Android mobile agents using Omni Perception, Memory, and Action modules to enable efficient multimodal task handling and personalized interactions.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That the described Omni Perception, Memory, and Action components will integrate and perform robustly in real-world conditions, as the abstract provides no quantitative metrics, baselines, or implementation details to support the effectiveness claims.","pith_extraction_headline":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.05765/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-20T13:42:04.668327Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"ai_meta_artifact","ran_at":"2026-05-20T09:35:28.198235Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_title_agreement","ran_at":"2026-05-19T20:01:19.479952Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_compliance","ran_at":"2026-05-19T13:17:10.180706Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"47645ac63926ee5ea29dd8db59a6959ac587f0edf80defc389f46c7a3b3cce3f"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"bb1488a4-6bca-4d29-bb51-a98b7acc9929"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-22T01:04:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yQZtRCRpErh9THAAUqeNVRmphaVh1AOrnTG1LgF3lQ2pPlM3TWr+XYpkSZHvtCATaXVhlhSCRGRS5fHjULjeBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T04:42:27.500558Z"},"content_sha256":"b02fe38b99e6b88b1ca2ab190b0f29fa9027e5167b3ef341190fb34a9d0fef65","schema_version":"1.0","event_id":"sha256:b02fe38b99e6b88b1ca2ab190b0f29fa9027e5167b3ef341190fb34a9d0fef65"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5JVWW2JHOWF4473VCMTK3YPTWS/bundle.json","state_url":"https://pith.science/pith/5JVWW2JHOWF4473VCMTK3YPTWS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5JVWW2JHOWF4473VCMTK3YPTWS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T04:42:27Z","links":{"resolver":"https://pith.science/pith/5JVWW2JHOWF4473VCMTK3YPTWS","bundle":"https://pith.science/pith/5JVWW2JHOWF4473VCMTK3YPTWS/bundle.json","state":"https://pith.science/pith/5JVWW2JHOWF4473VCMTK3YPTWS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5JVWW2JHOWF4473VCMTK3YPTWS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:5JVWW2JHOWF4473VCMTK3YPTWS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"4bbaf9a8e2276ecc29bb9287d89b655a81a46c982e19d565f9ccd8aaf6576779","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T06:58:34Z","title_canon_sha256":"cea5e84d506d4c570fcbb21e7c5bad7bc53bae3d04451a329018fb5ff0190c01"},"schema_version":"1.0","source":{"id":"2605.05765","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.05765","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"arxiv_version","alias_value":"2605.05765v2","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.05765","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_12","alias_value":"5JVWW2JHOWF4","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_16","alias_value":"5JVWW2JHOWF4473V","created_at":"2026-05-22T01:04:04Z"},{"alias_kind":"pith_short_8","alias_value":"5JVWW2JH","created_at":"2026-05-22T01:04:04Z"}],"graph_snapshots":[{"event_id":"sha256:b02fe38b99e6b88b1ca2ab190b0f29fa9027e5167b3ef341190fb34a9d0fef65","target":"graph","created_at":"2026-05-22T01:04:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"Demonstrations across diverse scenarios show that X-OmniClaw effectively enhances interaction efficiency and task reliability, providing a practical architectural blueprint for the next generation of mobile-native personal assistants."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That the described Omni Perception, Memory, and Action components will integrate and perform robustly in real-world conditions, as the abstract provides no quantitative metrics, baselines, or implementation details to support the effectiveness claims."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"X-OmniClaw presents a unified architecture for Android mobile agents using Omni Perception, Memory, and Action modules to enable efficient multimodal task handling and personalized interactions."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness."}],"snapshot_sha256":"64c7dbb4182a9521d9aac47b754cf04560c99eb01b31d71d6a101f7f08b47b7e"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-20T13:42:04.668327Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-20T09:35:28.198235Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_title_agreement","ran_at":"2026-05-19T20:01:19.479952Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T13:17:10.180706Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.05765/integrity.json","findings":[],"snapshot_sha256":"47645ac63926ee5ea29dd8db59a6959ac587f0edf80defc389f46c7a3b3cce3f","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Inspired by the development of OpenClaw, there is a growing demand for mobile-based personal agents capable of handling complex and intuitive interactions. In this technical report, we introduce X-OmniClaw, a unified mobile agent designed for multimodal understanding and interaction in the Android ecosystem. This unified architecture of perception, memory, and action enables the agent to handle complex mobile tasks with high contextual awareness. Specifically, Omni Perception provides a unified multimodal ingress pipeline that integrates UI states, real-world visual contexts, and speech inputs","authors_text":"Binqiang Pan, Chao Li, Haobo Ji, Haonan Lu, Peng Liu, Qi Qi, Qiuxia Hou, Qi Wu, Quanlong Zheng, Ru Zhen, Xiaoming Ren, Yang Song, Yanhao Zhang, Zhenyi Liao","cross_cats":[],"headline":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T06:58:34Z","title":"X-OmniClaw Technical Report: A Unified Mobile Agent for Multimodal Understanding and Interaction"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.05765","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-08T14:49:12.379064Z","id":"bb1488a4-6bca-4d29-bb51-a98b7acc9929","model_set":{"reader":"grok-4.3"},"one_line_summary":"X-OmniClaw presents a unified architecture for Android mobile agents using Omni Perception, Memory, and Action modules to enable efficient multimodal task handling and personalized interactions.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"X-OmniClaw presents a unified architecture for mobile agents that combines multimodal perception, memory, and action to handle complex Android tasks with greater context awareness.","strongest_claim":"Demonstrations across diverse scenarios show that X-OmniClaw effectively enhances interaction efficiency and task reliability, providing a practical architectural blueprint for the next generation of mobile-native personal assistants.","weakest_assumption":"That the described Omni Perception, Memory, and Action components will integrate and perform robustly in real-world conditions, as the abstract provides no quantitative metrics, baselines, or implementation details to support the effectiveness claims."}},"verdict_id":"bb1488a4-6bca-4d29-bb51-a98b7acc9929"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0cd477d3d1a4d103724224e74ed032ec616bacfb2bb80e5768838e5f346e3d20","target":"record","created_at":"2026-05-22T01:04:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"4bbaf9a8e2276ecc29bb9287d89b655a81a46c982e19d565f9ccd8aaf6576779","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T06:58:34Z","title_canon_sha256":"cea5e84d506d4c570fcbb21e7c5bad7bc53bae3d04451a329018fb5ff0190c01"},"schema_version":"1.0","source":{"id":"2605.05765","kind":"arxiv","version":2}},"canonical_sha256":"ea6b6b6927758bce7f751326ade1f3b4845cc052d3955a50f1645695b86ac0a2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ea6b6b6927758bce7f751326ade1f3b4845cc052d3955a50f1645695b86ac0a2","first_computed_at":"2026-05-22T01:04:04.869926Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-22T01:04:04.869926Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"7vCd+otwXCZjtnApJHR4BuVTNBNVVXtMOLWzZ127NVFuaIfV3SItvjToRNgbnH89IS2LND6CJZDKGUY3RfXwBA==","signature_status":"signed_v1","signed_at":"2026-05-22T01:04:04.870525Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.05765","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0cd477d3d1a4d103724224e74ed032ec616bacfb2bb80e5768838e5f346e3d20","sha256:b02fe38b99e6b88b1ca2ab190b0f29fa9027e5167b3ef341190fb34a9d0fef65"],"state_sha256":"2b9ac5f67047c42b791c860aa47fd83fd82f9707127c6f3ae107f6132225aec3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"7TeDiYh2RDa2etGeeYvO4R6lBOLgw2s20/IuO+lPOxEzeUjBxU95ypAKd8XKYx69Bfh/0NvdZRYmpL2t6t0HBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T04:42:27.507210Z","bundle_sha256":"b66272fbc494d6cced03927675ac44c1cae489af6817e1fdbf5889b12e14a6c1"}}