{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:XLKJ3NP4TRXGEWXHKI7OEJHVY4","short_pith_number":"pith:XLKJ3NP4","canonical_record":{"source":{"id":"2512.18552","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2025-12-21T00:49:40Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"title_canon_sha256":"2075bcfa013e9ea8e5c19b2285d607e970a905fc175e9a65d90d4db8863330e2","abstract_canon_sha256":"9c186bd863f52f12a752a65743e0de1a1b6edbc37e0f1ed6f8d9e43b55a0533f"},"schema_version":"1.0"},"canonical_sha256":"bad49db5fc9c6e625ae7523ee224f5c72818c50fb6145fb0aea3c6147c2c424a","source":{"kind":"arxiv","id":"2512.18552","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.18552","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"arxiv_version","alias_value":"2512.18552v2","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.18552","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_12","alias_value":"XLKJ3NP4TRXG","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_16","alias_value":"XLKJ3NP4TRXGEWXH","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_8","alias_value":"XLKJ3NP4","created_at":"2026-05-20T01:04:30Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:XLKJ3NP4TRXGEWXHKI7OEJHVY4","target":"record","payload":{"canonical_record":{"source":{"id":"2512.18552","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2025-12-21T00:49:40Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"title_canon_sha256":"2075bcfa013e9ea8e5c19b2285d607e970a905fc175e9a65d90d4db8863330e2","abstract_canon_sha256":"9c186bd863f52f12a752a65743e0de1a1b6edbc37e0f1ed6f8d9e43b55a0533f"},"schema_version":"1.0"},"canonical_sha256":"bad49db5fc9c6e625ae7523ee224f5c72818c50fb6145fb0aea3c6147c2c424a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:04:30.349970Z","signature_b64":"LYYzHvDG2AyI5lNqfWFfPE6KUxaSdEHfIc9G/G6bWmzNChDXly4HLXJlVt2dqspTfFzb9KzW+k/DcEe+UMYZAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"bad49db5fc9c6e625ae7523ee224f5c72818c50fb6145fb0aea3c6147c2c424a","last_reissued_at":"2026-05-20T01:04:30.349222Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:04:30.349222Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2512.18552","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:04:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YbYRK+AXnP3fvnt7uDa1THScMOcphDgGFHsMPysCOEzVROhtZ+bxMVfkuh8AG2FkLQB0UjuNPr1sPyzgBjRcBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T15:42:17.932036Z"},"content_sha256":"b088f4037619593799aa6bd891b2a9895b404f01f9c35f9440f175c28009e57f","schema_version":"1.0","event_id":"sha256:b088f4037619593799aa6bd891b2a9895b404f01f9c35f9440f175c28009e57f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:XLKJ3NP4TRXGEWXHKI7OEJHVY4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Toward Training Superintelligent Software Agents through Self-Play SWE-RL","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.LG"],"primary_cat":"cs.SE","authors_text":"Daniel Fried, David Zhang, Emily McMilin, Gabriel Synnaeve, Jonas Gehring, Lingming Zhang, Sida Wang, Yuxiang Wei, Zhiqing Sun","submitted_at":"2025-12-21T00:49:40Z","abstract_excerpt":"While current software agents powered by large language models (LLMs) and agentic reinforcement learning (RL) can boost programmer productivity, their training data (e.g., GitHub issues and pull requests) and environments (e.g., pass-to-pass and fail-to-pass tests) heavily depend on human knowledge or curation, posing a fundamental barrier to superintelligence. In this paper, we present Self-play SWE-RL (SSR), a first step toward training paradigms for superintelligent software agents. Our approach takes minimal data assumptions, only requiring access to sandboxed repositories with source code"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.18552","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2512.18552/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:04:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6wsBokL01JvEiOKjQo8vFF+gEFc+BpjwaH6Q/sGCjes1EeZ/X/77LK1IxIlCzkAkPaS9smDLtAzdD5uSwC3yBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T15:42:17.932839Z"},"content_sha256":"063c78fef6b3541866cfebb96200b6bc0a9911dde8e0d248ece36b22d9f2de01","schema_version":"1.0","event_id":"sha256:063c78fef6b3541866cfebb96200b6bc0a9911dde8e0d248ece36b22d9f2de01"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/bundle.json","state_url":"https://pith.science/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-09T15:42:17Z","links":{"resolver":"https://pith.science/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4","bundle":"https://pith.science/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/bundle.json","state":"https://pith.science/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XLKJ3NP4TRXGEWXHKI7OEJHVY4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:XLKJ3NP4TRXGEWXHKI7OEJHVY4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9c186bd863f52f12a752a65743e0de1a1b6edbc37e0f1ed6f8d9e43b55a0533f","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2025-12-21T00:49:40Z","title_canon_sha256":"2075bcfa013e9ea8e5c19b2285d607e970a905fc175e9a65d90d4db8863330e2"},"schema_version":"1.0","source":{"id":"2512.18552","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2512.18552","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"arxiv_version","alias_value":"2512.18552v2","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2512.18552","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_12","alias_value":"XLKJ3NP4TRXG","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_16","alias_value":"XLKJ3NP4TRXGEWXH","created_at":"2026-05-20T01:04:30Z"},{"alias_kind":"pith_short_8","alias_value":"XLKJ3NP4","created_at":"2026-05-20T01:04:30Z"}],"graph_snapshots":[{"event_id":"sha256:063c78fef6b3541866cfebb96200b6bc0a9911dde8e0d248ece36b22d9f2de01","target":"graph","created_at":"2026-05-20T01:04:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2512.18552/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While current software agents powered by large language models (LLMs) and agentic reinforcement learning (RL) can boost programmer productivity, their training data (e.g., GitHub issues and pull requests) and environments (e.g., pass-to-pass and fail-to-pass tests) heavily depend on human knowledge or curation, posing a fundamental barrier to superintelligence. In this paper, we present Self-play SWE-RL (SSR), a first step toward training paradigms for superintelligent software agents. Our approach takes minimal data assumptions, only requiring access to sandboxed repositories with source code","authors_text":"Daniel Fried, David Zhang, Emily McMilin, Gabriel Synnaeve, Jonas Gehring, Lingming Zhang, Sida Wang, Yuxiang Wei, Zhiqing Sun","cross_cats":["cs.AI","cs.CL","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2025-12-21T00:49:40Z","title":"Toward Training Superintelligent Software Agents through Self-Play SWE-RL"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2512.18552","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b088f4037619593799aa6bd891b2a9895b404f01f9c35f9440f175c28009e57f","target":"record","created_at":"2026-05-20T01:04:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9c186bd863f52f12a752a65743e0de1a1b6edbc37e0f1ed6f8d9e43b55a0533f","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2025-12-21T00:49:40Z","title_canon_sha256":"2075bcfa013e9ea8e5c19b2285d607e970a905fc175e9a65d90d4db8863330e2"},"schema_version":"1.0","source":{"id":"2512.18552","kind":"arxiv","version":2}},"canonical_sha256":"bad49db5fc9c6e625ae7523ee224f5c72818c50fb6145fb0aea3c6147c2c424a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"bad49db5fc9c6e625ae7523ee224f5c72818c50fb6145fb0aea3c6147c2c424a","first_computed_at":"2026-05-20T01:04:30.349222Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:04:30.349222Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LYYzHvDG2AyI5lNqfWFfPE6KUxaSdEHfIc9G/G6bWmzNChDXly4HLXJlVt2dqspTfFzb9KzW+k/DcEe+UMYZAA==","signature_status":"signed_v1","signed_at":"2026-05-20T01:04:30.349970Z","signed_message":"canonical_sha256_bytes"},"source_id":"2512.18552","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b088f4037619593799aa6bd891b2a9895b404f01f9c35f9440f175c28009e57f","sha256:063c78fef6b3541866cfebb96200b6bc0a9911dde8e0d248ece36b22d9f2de01"],"state_sha256":"deaef8dffb6df9e5537b51b502148129b93e5c1e36411c4a367f6e5910f2105d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RErzLW6y3WTghVNEMFFAfjabYTLRrgTfc2oaqacWoFX68t2bf8gE/2lfTnowUu+1EsDmRcFn3d5eL48AhEyuCA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-09T15:42:17.937185Z","bundle_sha256":"ec248d5d98639d6782e509ef56c299168bfa24cdb1b947ea341c33efddc5bb26"}}