{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:UBQOGPCSBNJ4HFRNH6ZHJRCV3G","short_pith_number":"pith:UBQOGPCS","canonical_record":{"source":{"id":"2605.30021","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-28T14:42:18Z","cross_cats_sorted":[],"title_canon_sha256":"7df04e27c52069bd86cb330aee33482dbedadc58b1b4eb88213a4cb490733620","abstract_canon_sha256":"3fc4574d0e32588d319133b859eb73af4d5945e0faee90ff23c97dcadf856251"},"schema_version":"1.0"},"canonical_sha256":"a060e33c520b53c3962d3fb274c455d9aae2d0647bfe3d790dc2718b30847dba","source":{"kind":"arxiv","id":"2605.30021","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.30021","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"arxiv_version","alias_value":"2605.30021v1","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30021","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_12","alias_value":"UBQOGPCSBNJ4","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_16","alias_value":"UBQOGPCSBNJ4HFRN","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_8","alias_value":"UBQOGPCS","created_at":"2026-05-29T02:06:07Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:UBQOGPCSBNJ4HFRNH6ZHJRCV3G","target":"record","payload":{"canonical_record":{"source":{"id":"2605.30021","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-28T14:42:18Z","cross_cats_sorted":[],"title_canon_sha256":"7df04e27c52069bd86cb330aee33482dbedadc58b1b4eb88213a4cb490733620","abstract_canon_sha256":"3fc4574d0e32588d319133b859eb73af4d5945e0faee90ff23c97dcadf856251"},"schema_version":"1.0"},"canonical_sha256":"a060e33c520b53c3962d3fb274c455d9aae2d0647bfe3d790dc2718b30847dba","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-29T02:06:07.339081Z","signature_b64":"BD9KbjT5sR7wSNn+esWzhoYpppweOmbCcAKCcMIAXoTE/mnSwo9YcvPUxjhKdRJl+nKZopRKBgHAzY4rG5ADCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a060e33c520b53c3962d3fb274c455d9aae2d0647bfe3d790dc2718b30847dba","last_reissued_at":"2026-05-29T02:06:07.338494Z","signature_status":"signed_v1","first_computed_at":"2026-05-29T02:06:07.338494Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.30021","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T02:06:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"XREVb4r68xXGXK6Nh+sOEQzd5ApNeDxWb6V5R46Zx8BC4YoFjX9qjzA5MtbGfy9DNpLbNFuQDKfy4jsM6ZWgCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T20:01:48.131432Z"},"content_sha256":"df48ba5d30b0fceacdade4407be0de6f7abcf1867113f93610e71fb018efeab6","schema_version":"1.0","event_id":"sha256:df48ba5d30b0fceacdade4407be0de6f7abcf1867113f93610e71fb018efeab6"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:UBQOGPCSBNJ4HFRNH6ZHJRCV3G","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Recovering Diversity Without Losing Alignment: A DPO Recipe for Post-Trained LLMs","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Mohit Iyyer, Vinay Samuel, Yapei Chang","submitted_at":"2026-05-28T14:42:18Z","abstract_excerpt":"Many open-ended instructions have multiple valid answers that users can benefit from seeing, but post-training often narrows an LLM's output space toward a small set of canonical responses. We introduce REDIPO, an offline DPO data-construction pipeline for recovering distinct valid answer modes while preserving the alignment benefits of the instruct model. For each prompt, REDIPO samples responses from both base and instruct models, rewrites base-model responses with the instruct model, filters candidates for safety and instruction-following quality, and builds preference pairs that favor marg"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30021","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.30021/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-29T02:06:07Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9EHFs5e53IXFbNaue0Lua54UIxixyUWDRqzVMK6LZFSg3r+Ez5iNFyGXy7L92CMsPTyyXTt6MZoINZ2bZ1R2BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T20:01:48.131819Z"},"content_sha256":"4098659cbcc606d7832327093f51e5df24ef668964f029e96fc368afc249b1d8","schema_version":"1.0","event_id":"sha256:4098659cbcc606d7832327093f51e5df24ef668964f029e96fc368afc249b1d8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/bundle.json","state_url":"https://pith.science/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T20:01:48Z","links":{"resolver":"https://pith.science/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G","bundle":"https://pith.science/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/bundle.json","state":"https://pith.science/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UBQOGPCSBNJ4HFRNH6ZHJRCV3G/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:UBQOGPCSBNJ4HFRNH6ZHJRCV3G","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3fc4574d0e32588d319133b859eb73af4d5945e0faee90ff23c97dcadf856251","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-28T14:42:18Z","title_canon_sha256":"7df04e27c52069bd86cb330aee33482dbedadc58b1b4eb88213a4cb490733620"},"schema_version":"1.0","source":{"id":"2605.30021","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.30021","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"arxiv_version","alias_value":"2605.30021v1","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.30021","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_12","alias_value":"UBQOGPCSBNJ4","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_16","alias_value":"UBQOGPCSBNJ4HFRN","created_at":"2026-05-29T02:06:07Z"},{"alias_kind":"pith_short_8","alias_value":"UBQOGPCS","created_at":"2026-05-29T02:06:07Z"}],"graph_snapshots":[{"event_id":"sha256:4098659cbcc606d7832327093f51e5df24ef668964f029e96fc368afc249b1d8","target":"graph","created_at":"2026-05-29T02:06:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.30021/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Many open-ended instructions have multiple valid answers that users can benefit from seeing, but post-training often narrows an LLM's output space toward a small set of canonical responses. We introduce REDIPO, an offline DPO data-construction pipeline for recovering distinct valid answer modes while preserving the alignment benefits of the instruct model. For each prompt, REDIPO samples responses from both base and instruct models, rewrites base-model responses with the instruct model, filters candidates for safety and instruction-following quality, and builds preference pairs that favor marg","authors_text":"Mohit Iyyer, Vinay Samuel, Yapei Chang","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-28T14:42:18Z","title":"Recovering Diversity Without Losing Alignment: A DPO Recipe for Post-Trained LLMs"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.30021","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:df48ba5d30b0fceacdade4407be0de6f7abcf1867113f93610e71fb018efeab6","target":"record","created_at":"2026-05-29T02:06:07Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3fc4574d0e32588d319133b859eb73af4d5945e0faee90ff23c97dcadf856251","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CL","submitted_at":"2026-05-28T14:42:18Z","title_canon_sha256":"7df04e27c52069bd86cb330aee33482dbedadc58b1b4eb88213a4cb490733620"},"schema_version":"1.0","source":{"id":"2605.30021","kind":"arxiv","version":1}},"canonical_sha256":"a060e33c520b53c3962d3fb274c455d9aae2d0647bfe3d790dc2718b30847dba","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a060e33c520b53c3962d3fb274c455d9aae2d0647bfe3d790dc2718b30847dba","first_computed_at":"2026-05-29T02:06:07.338494Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-29T02:06:07.338494Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"BD9KbjT5sR7wSNn+esWzhoYpppweOmbCcAKCcMIAXoTE/mnSwo9YcvPUxjhKdRJl+nKZopRKBgHAzY4rG5ADCw==","signature_status":"signed_v1","signed_at":"2026-05-29T02:06:07.339081Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.30021","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:df48ba5d30b0fceacdade4407be0de6f7abcf1867113f93610e71fb018efeab6","sha256:4098659cbcc606d7832327093f51e5df24ef668964f029e96fc368afc249b1d8"],"state_sha256":"cd692225e855e78e1729cede8ca96b30fe6ce996a06931714a60fc07d187b899"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"V07Rio1Esm1ThMSn3eHAtLdep50GowxMv2/ctqozYEm1JILuffwYMaDmHXXaX6QVE3EHpbK/7zME2rCEhS34Ag==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T20:01:48.133953Z","bundle_sha256":"bf68e96fdae38e88481c0894578fce42b3154e83817e3a9f818919be281f995d"}}