{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:JCLACOT4H752THHZGZBPH56C7M","short_pith_number":"pith:JCLACOT4","canonical_record":{"source":{"id":"2605.25624","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-25T09:28:03Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c5f0704cd886df5c67682dc6f04f432d30c3d53ab148f00d420db97724115254","abstract_canon_sha256":"1127a300440b722ae726d336e5aef77fe1ab87d56c49e00e4bd12d0dda027442"},"schema_version":"1.0"},"canonical_sha256":"4896013a7c3ffba99cf93642f3f7c2fb1da7d8a2f4c806767987ec27b4300166","source":{"kind":"arxiv","id":"2605.25624","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.25624","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"arxiv_version","alias_value":"2605.25624v1","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.25624","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_12","alias_value":"JCLACOT4H752","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_16","alias_value":"JCLACOT4H752THHZ","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_8","alias_value":"JCLACOT4","created_at":"2026-05-26T02:04:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:JCLACOT4H752THHZGZBPH56C7M","target":"record","payload":{"canonical_record":{"source":{"id":"2605.25624","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-25T09:28:03Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c5f0704cd886df5c67682dc6f04f432d30c3d53ab148f00d420db97724115254","abstract_canon_sha256":"1127a300440b722ae726d336e5aef77fe1ab87d56c49e00e4bd12d0dda027442"},"schema_version":"1.0"},"canonical_sha256":"4896013a7c3ffba99cf93642f3f7c2fb1da7d8a2f4c806767987ec27b4300166","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-26T02:04:47.037900Z","signature_b64":"N0B1PBMWovUlyamJ77qtbyOzdrBpM0/R5Pa0sMXQaWha+RNHHu+HZdSzSpUNzOrizZ78iVryC5uAtQhUop9CBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4896013a7c3ffba99cf93642f3f7c2fb1da7d8a2f4c806767987ec27b4300166","last_reissued_at":"2026-05-26T02:04:47.037161Z","signature_status":"signed_v1","first_computed_at":"2026-05-26T02:04:47.037161Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.25624","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JgNoeqLGEWQkSSKMgiKXYLlFO0E5GxW0pn3hCafAlFdZlVl3Jhg2wsWIM2zvWkYQTdH0i1Q85nM8hGS/CdqvBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T17:37:43.101002Z"},"content_sha256":"a24e1f6e094267c94a9c9e52334b4972d854828de2a01020f0b32d4b8eba6fab","schema_version":"1.0","event_id":"sha256:a24e1f6e094267c94a9c9e52334b4972d854828de2a01020f0b32d4b8eba6fab"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:JCLACOT4H752THHZGZBPH56C7M","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"CUA-Gym: Scaling Verifiable Training Environments and Tasks for Computer-Use Agents","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.AI","authors_text":"Bowen Wang, Dayiheng Liu, Dunjie Lu, HaiQuan Wang, Hao Hu, Junli Wang, Junyang Lin, Que Shen, Shixuan Liu, Shuai Bai, Tao Yu, Tianbao Xie, Tianyi Bai, Zhipeng Zhang","submitted_at":"2026-05-25T09:28:03Z","abstract_excerpt":"Reinforcement learning with verifiable rewards (RLVR) has driven breakthroughs in domains such as math, tool-use, and software engineering, yet its extension to computer-use agents (CUAs) has been bottlenecked by the scarcity of scalable training data with deterministic rewards. Constructing such data for CUAs requires consistent task instruction, executable environment, and verifiable reward. However, hand-curated benchmarks achieve high reward fidelity but cover few applications and LLM-as-judge-based datasets scale broadly but lack reliable verification. We present CUA-Gym, a scalable pipel"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.25624","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.25624/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-26T02:04:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qNdGNHy6u2YhV8WuRkDQa5EJFbRedk0TcFz5m8Fbuk/JypuUFG9s5D7BmSFPxAlD33tfvsX6/wGj1RLEuIGRAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T17:37:43.101645Z"},"content_sha256":"cccf7390ae4deb5d3bdddeede04c674bd0d4b50743bed3a80c621eb59c036c27","schema_version":"1.0","event_id":"sha256:cccf7390ae4deb5d3bdddeede04c674bd0d4b50743bed3a80c621eb59c036c27"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/JCLACOT4H752THHZGZBPH56C7M/bundle.json","state_url":"https://pith.science/pith/JCLACOT4H752THHZGZBPH56C7M/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/JCLACOT4H752THHZGZBPH56C7M/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T17:37:43Z","links":{"resolver":"https://pith.science/pith/JCLACOT4H752THHZGZBPH56C7M","bundle":"https://pith.science/pith/JCLACOT4H752THHZGZBPH56C7M/bundle.json","state":"https://pith.science/pith/JCLACOT4H752THHZGZBPH56C7M/state.json","well_known_bundle":"https://pith.science/.well-known/pith/JCLACOT4H752THHZGZBPH56C7M/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:JCLACOT4H752THHZGZBPH56C7M","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"1127a300440b722ae726d336e5aef77fe1ab87d56c49e00e4bd12d0dda027442","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-25T09:28:03Z","title_canon_sha256":"c5f0704cd886df5c67682dc6f04f432d30c3d53ab148f00d420db97724115254"},"schema_version":"1.0","source":{"id":"2605.25624","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.25624","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"arxiv_version","alias_value":"2605.25624v1","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.25624","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_12","alias_value":"JCLACOT4H752","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_16","alias_value":"JCLACOT4H752THHZ","created_at":"2026-05-26T02:04:47Z"},{"alias_kind":"pith_short_8","alias_value":"JCLACOT4","created_at":"2026-05-26T02:04:47Z"}],"graph_snapshots":[{"event_id":"sha256:cccf7390ae4deb5d3bdddeede04c674bd0d4b50743bed3a80c621eb59c036c27","target":"graph","created_at":"2026-05-26T02:04:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.25624/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement learning with verifiable rewards (RLVR) has driven breakthroughs in domains such as math, tool-use, and software engineering, yet its extension to computer-use agents (CUAs) has been bottlenecked by the scarcity of scalable training data with deterministic rewards. Constructing such data for CUAs requires consistent task instruction, executable environment, and verifiable reward. However, hand-curated benchmarks achieve high reward fidelity but cover few applications and LLM-as-judge-based datasets scale broadly but lack reliable verification. We present CUA-Gym, a scalable pipel","authors_text":"Bowen Wang, Dayiheng Liu, Dunjie Lu, HaiQuan Wang, Hao Hu, Junli Wang, Junyang Lin, Que Shen, Shixuan Liu, Shuai Bai, Tao Yu, Tianbao Xie, Tianyi Bai, Zhipeng Zhang","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-25T09:28:03Z","title":"CUA-Gym: Scaling Verifiable Training Environments and Tasks for Computer-Use Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.25624","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:a24e1f6e094267c94a9c9e52334b4972d854828de2a01020f0b32d4b8eba6fab","target":"record","created_at":"2026-05-26T02:04:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"1127a300440b722ae726d336e5aef77fe1ab87d56c49e00e4bd12d0dda027442","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2026-05-25T09:28:03Z","title_canon_sha256":"c5f0704cd886df5c67682dc6f04f432d30c3d53ab148f00d420db97724115254"},"schema_version":"1.0","source":{"id":"2605.25624","kind":"arxiv","version":1}},"canonical_sha256":"4896013a7c3ffba99cf93642f3f7c2fb1da7d8a2f4c806767987ec27b4300166","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4896013a7c3ffba99cf93642f3f7c2fb1da7d8a2f4c806767987ec27b4300166","first_computed_at":"2026-05-26T02:04:47.037161Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-26T02:04:47.037161Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"N0B1PBMWovUlyamJ77qtbyOzdrBpM0/R5Pa0sMXQaWha+RNHHu+HZdSzSpUNzOrizZ78iVryC5uAtQhUop9CBA==","signature_status":"signed_v1","signed_at":"2026-05-26T02:04:47.037900Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.25624","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:a24e1f6e094267c94a9c9e52334b4972d854828de2a01020f0b32d4b8eba6fab","sha256:cccf7390ae4deb5d3bdddeede04c674bd0d4b50743bed3a80c621eb59c036c27"],"state_sha256":"140db352bf6f112052460e6617350f3f7078b9c58e88a4f92f2f84dc08a9dfe0"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cIuHxXE7IpI+pFDo6nC/fYRyRcd85Wm4FSlaIFOMk0FdF+w5ZZEnDrbuKtK8cpnpT0BafXvFZy55rf1E0BrKDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T17:37:43.104440Z","bundle_sha256":"80cd0b311370747aab9b5bb9f9c8aca60e46fb406e111ce838644890b6bd1a02"}}