{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:LY736NPXLG55XUYV7TR7BKNNE6","short_pith_number":"pith:LY736NPX","canonical_record":{"source":{"id":"2602.02262","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-02-02T16:04:10Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"6bbdc03b04b020026f1cd704bc5ccd52f032b77d2147c5c101239042da72b07e","abstract_canon_sha256":"d3984692fa7ee044e3182aa21d274ff5d610c13a622c9584740bc6534c490b37"},"schema_version":"1.0"},"canonical_sha256":"5e3fbf35f759bbdbd315fce3f0a9ad27a2a2b68562009686e5b4be8c26644562","source":{"kind":"arxiv","id":"2602.02262","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.02262","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2602.02262v3","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.02262","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"LY736NPXLG55","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"LY736NPXLG55XUYV","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"LY736NPX","created_at":"2026-05-20T00:05:41Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:LY736NPXLG55XUYV7TR7BKNNE6","target":"record","payload":{"canonical_record":{"source":{"id":"2602.02262","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-02-02T16:04:10Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"6bbdc03b04b020026f1cd704bc5ccd52f032b77d2147c5c101239042da72b07e","abstract_canon_sha256":"d3984692fa7ee044e3182aa21d274ff5d610c13a622c9584740bc6534c490b37"},"schema_version":"1.0"},"canonical_sha256":"5e3fbf35f759bbdbd315fce3f0a9ad27a2a2b68562009686e5b4be8c26644562","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:05:41.371665Z","signature_b64":"Hspl44KHGnnbybQxPS9OrMou2OPHPrxEnefQekEp9PyvDR7EFtQh7ZcOlRuQsjKtn7rMxJ3bAJL6e+sMfVxQBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"5e3fbf35f759bbdbd315fce3f0a9ad27a2a2b68562009686e5b4be8c26644562","last_reissued_at":"2026-05-20T00:05:41.371124Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:05:41.371124Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2602.02262","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2Okt+zR+1uyKSFifxOb5NxN2/02EwKaaZovIAGCQNmRCOH2vE4skzZmu6CQA0Wu+Ce7RdhC/gfUAIemsjaMCDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T04:36:00.381965Z"},"content_sha256":"f3932bdf17af73506f9921d1e5d2a7891ad85231dfe7616cedcbea992f0cd956","schema_version":"1.0","event_id":"sha256:f3932bdf17af73506f9921d1e5d2a7891ad85231dfe7616cedcbea992f0cd956"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:LY736NPXLG55XUYV7TR7BKNNE6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"OmniCode: A Benchmark for Evaluating Software Engineering Agents","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.SE","authors_text":"Atharv Sonwane, Carter Larsen, Claas Beger, Debjit Dhar, Eng-Shen Tu, Gloria Geng, Guohao Chen, Kevin Ellis, Rachel Chen, Ronit Pattanayak, Saikat Dutta, Simon Alford, Tuan Anh Dang, Wei-Chung Lu","submitted_at":"2026-02-02T16:04:10Z","abstract_excerpt":"LLM-powered coding agents are redefining how real-world software is developed. To drive the research towards better coding agents, we require challenging benchmarks that can rigorously evaluate the ability of such agents to perform various software engineering tasks. However, popular coding benchmarks such as HumanEval and SWE-Bench focus on narrowly scoped tasks such as competition programming and patch generation. In reality, software engineers have to handle a broader set of tasks for real-world software development. To address this gap, we propose OmniCode, a novel software engineering ben"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.02262","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2602.02262/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:05:41Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0yzXKqGg2aI7tUXWeSjZk5a1VgWzewBG4fxEyYLw+sf3r9va12cGKfJA0kcj/Vs47CVQf6cL10JHbqsxwrk+CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T04:36:00.382406Z"},"content_sha256":"75799c20ad5805428efcae6fe7516c02d63a03cfc5129f51aa886eb6d3beeb8c","schema_version":"1.0","event_id":"sha256:75799c20ad5805428efcae6fe7516c02d63a03cfc5129f51aa886eb6d3beeb8c"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/LY736NPXLG55XUYV7TR7BKNNE6/bundle.json","state_url":"https://pith.science/pith/LY736NPXLG55XUYV7TR7BKNNE6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/LY736NPXLG55XUYV7TR7BKNNE6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T04:36:00Z","links":{"resolver":"https://pith.science/pith/LY736NPXLG55XUYV7TR7BKNNE6","bundle":"https://pith.science/pith/LY736NPXLG55XUYV7TR7BKNNE6/bundle.json","state":"https://pith.science/pith/LY736NPXLG55XUYV7TR7BKNNE6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/LY736NPXLG55XUYV7TR7BKNNE6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:LY736NPXLG55XUYV7TR7BKNNE6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d3984692fa7ee044e3182aa21d274ff5d610c13a622c9584740bc6534c490b37","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-02-02T16:04:10Z","title_canon_sha256":"6bbdc03b04b020026f1cd704bc5ccd52f032b77d2147c5c101239042da72b07e"},"schema_version":"1.0","source":{"id":"2602.02262","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2602.02262","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"arxiv_version","alias_value":"2602.02262v3","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2602.02262","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_12","alias_value":"LY736NPXLG55","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_16","alias_value":"LY736NPXLG55XUYV","created_at":"2026-05-20T00:05:41Z"},{"alias_kind":"pith_short_8","alias_value":"LY736NPX","created_at":"2026-05-20T00:05:41Z"}],"graph_snapshots":[{"event_id":"sha256:75799c20ad5805428efcae6fe7516c02d63a03cfc5129f51aa886eb6d3beeb8c","target":"graph","created_at":"2026-05-20T00:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2602.02262/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM-powered coding agents are redefining how real-world software is developed. To drive the research towards better coding agents, we require challenging benchmarks that can rigorously evaluate the ability of such agents to perform various software engineering tasks. However, popular coding benchmarks such as HumanEval and SWE-Bench focus on narrowly scoped tasks such as competition programming and patch generation. In reality, software engineers have to handle a broader set of tasks for real-world software development. To address this gap, we propose OmniCode, a novel software engineering ben","authors_text":"Atharv Sonwane, Carter Larsen, Claas Beger, Debjit Dhar, Eng-Shen Tu, Gloria Geng, Guohao Chen, Kevin Ellis, Rachel Chen, Ronit Pattanayak, Saikat Dutta, Simon Alford, Tuan Anh Dang, Wei-Chung Lu","cross_cats":["cs.AI","cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-02-02T16:04:10Z","title":"OmniCode: A Benchmark for Evaluating Software Engineering Agents"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2602.02262","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f3932bdf17af73506f9921d1e5d2a7891ad85231dfe7616cedcbea992f0cd956","target":"record","created_at":"2026-05-20T00:05:41Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d3984692fa7ee044e3182aa21d274ff5d610c13a622c9584740bc6534c490b37","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-02-02T16:04:10Z","title_canon_sha256":"6bbdc03b04b020026f1cd704bc5ccd52f032b77d2147c5c101239042da72b07e"},"schema_version":"1.0","source":{"id":"2602.02262","kind":"arxiv","version":3}},"canonical_sha256":"5e3fbf35f759bbdbd315fce3f0a9ad27a2a2b68562009686e5b4be8c26644562","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5e3fbf35f759bbdbd315fce3f0a9ad27a2a2b68562009686e5b4be8c26644562","first_computed_at":"2026-05-20T00:05:41.371124Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:05:41.371124Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Hspl44KHGnnbybQxPS9OrMou2OPHPrxEnefQekEp9PyvDR7EFtQh7ZcOlRuQsjKtn7rMxJ3bAJL6e+sMfVxQBA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:05:41.371665Z","signed_message":"canonical_sha256_bytes"},"source_id":"2602.02262","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f3932bdf17af73506f9921d1e5d2a7891ad85231dfe7616cedcbea992f0cd956","sha256:75799c20ad5805428efcae6fe7516c02d63a03cfc5129f51aa886eb6d3beeb8c"],"state_sha256":"9f7d75bc8f88db63a42a413ac2b4e64c420e6753a3a4d5c7f5f4b8c420991d5c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1WLIUD4gfDAlsGTREBMXiWtnJnmOXmH4wFddwrjza9geV2YKhQiAlyzhVid6u4n10v7jJUNorU0bxkZ67XEhDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T04:36:00.384615Z","bundle_sha256":"3dd8f018d7600edcb2696975d11161e8e360d3a991ade12c5ff1efa28d8d3a1d"}}