{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:PRJTBIUV3327TF7JSOWHYKX5IO","short_pith_number":"pith:PRJTBIUV","canonical_record":{"source":{"id":"2511.12796","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2025-11-16T21:55:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"d76681166c3f1369424d641f875aa27c43a21fd1429c766a7e8d43a414087bcf","abstract_canon_sha256":"d6c6b234bf71feedca04ee177823cfead8fa851e05201be8b34675c694c0098a"},"schema_version":"1.0"},"canonical_sha256":"7c5330a295def5f997e993ac7c2afd43af2a9c85c0acafc68058d3718aa2491f","source":{"kind":"arxiv","id":"2511.12796","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.12796","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"arxiv_version","alias_value":"2511.12796v2","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.12796","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_12","alias_value":"PRJTBIUV3327","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_16","alias_value":"PRJTBIUV3327TF7J","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_8","alias_value":"PRJTBIUV","created_at":"2026-06-24T01:14:59Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:PRJTBIUV3327TF7JSOWHYKX5IO","target":"record","payload":{"canonical_record":{"source":{"id":"2511.12796","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2025-11-16T21:55:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"d76681166c3f1369424d641f875aa27c43a21fd1429c766a7e8d43a414087bcf","abstract_canon_sha256":"d6c6b234bf71feedca04ee177823cfead8fa851e05201be8b34675c694c0098a"},"schema_version":"1.0"},"canonical_sha256":"7c5330a295def5f997e993ac7c2afd43af2a9c85c0acafc68058d3718aa2491f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-24T01:14:59.426119Z","signature_b64":"bZgHQdYKhH200BJk9vdRqjYAOVIQCr0vg1yp1Fbs+vLXVul9FFumyAPHXTjtWV8Qmh34nfjMHP/5pZUL8Wj8BA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7c5330a295def5f997e993ac7c2afd43af2a9c85c0acafc68058d3718aa2491f","last_reissued_at":"2026-06-24T01:14:59.425620Z","signature_status":"signed_v1","first_computed_at":"2026-06-24T01:14:59.425620Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2511.12796","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:14:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FfQYZqfYiMV/TZdZuTvzLic3YGdHpmequ5zTJPOZbRBGaot+0GdD3j4S4XufdwwawaL/DTwIx+7pwbPrDXNgDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T11:18:31.194217Z"},"content_sha256":"5766b27509de56b29a11ddc689f438c7001ee7d10ee708e6562da366974b3173","schema_version":"1.0","event_id":"sha256:5766b27509de56b29a11ddc689f438c7001ee7d10ee708e6562da366974b3173"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:PRJTBIUV3327TF7JSOWHYKX5IO","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Maximizing the efficiency of human feedback in AI alignment: a comparative analysis","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.HC","authors_text":"Andreas Chouliaras, Dimitris Chatzopoulos","submitted_at":"2025-11-16T21:55:59Z","abstract_excerpt":"Reinforcement Learning from Human Feedback (RLHF) relies on preference modeling to align machine learning systems with human values, yet the popular approach of random pair sampling with Bradley-Terry modeling is statistically limited and inefficient under constrained annotation budgets. In this work, we explore alternative sampling and evaluation strategies for preference inference in RLHF, drawing inspiration from areas such as game theory, statistics, and social choice theory. Our best-performing method, Swiss InfoGain, employs a Swiss tournament system with a proxy mutual-information-gain "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.12796","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2511.12796/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:14:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+vLFVeKTaVNpS9zJIz10Vt42W6SsODRar0iywWGvIUUHPSM7MAMighS5RbEZ9DlUQslwa7FcBVoHcOb3/S9SDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T11:18:31.194607Z"},"content_sha256":"3638ad8ef1def60fe2428224cde0ac853d6699be83bebdd0d5150a2b3ad42b11","schema_version":"1.0","event_id":"sha256:3638ad8ef1def60fe2428224cde0ac853d6699be83bebdd0d5150a2b3ad42b11"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/PRJTBIUV3327TF7JSOWHYKX5IO/bundle.json","state_url":"https://pith.science/pith/PRJTBIUV3327TF7JSOWHYKX5IO/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/PRJTBIUV3327TF7JSOWHYKX5IO/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T11:18:31Z","links":{"resolver":"https://pith.science/pith/PRJTBIUV3327TF7JSOWHYKX5IO","bundle":"https://pith.science/pith/PRJTBIUV3327TF7JSOWHYKX5IO/bundle.json","state":"https://pith.science/pith/PRJTBIUV3327TF7JSOWHYKX5IO/state.json","well_known_bundle":"https://pith.science/.well-known/pith/PRJTBIUV3327TF7JSOWHYKX5IO/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:PRJTBIUV3327TF7JSOWHYKX5IO","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d6c6b234bf71feedca04ee177823cfead8fa851e05201be8b34675c694c0098a","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2025-11-16T21:55:59Z","title_canon_sha256":"d76681166c3f1369424d641f875aa27c43a21fd1429c766a7e8d43a414087bcf"},"schema_version":"1.0","source":{"id":"2511.12796","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.12796","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"arxiv_version","alias_value":"2511.12796v2","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.12796","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_12","alias_value":"PRJTBIUV3327","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_16","alias_value":"PRJTBIUV3327TF7J","created_at":"2026-06-24T01:14:59Z"},{"alias_kind":"pith_short_8","alias_value":"PRJTBIUV","created_at":"2026-06-24T01:14:59Z"}],"graph_snapshots":[{"event_id":"sha256:3638ad8ef1def60fe2428224cde0ac853d6699be83bebdd0d5150a2b3ad42b11","target":"graph","created_at":"2026-06-24T01:14:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2511.12796/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement Learning from Human Feedback (RLHF) relies on preference modeling to align machine learning systems with human values, yet the popular approach of random pair sampling with Bradley-Terry modeling is statistically limited and inefficient under constrained annotation budgets. In this work, we explore alternative sampling and evaluation strategies for preference inference in RLHF, drawing inspiration from areas such as game theory, statistics, and social choice theory. Our best-performing method, Swiss InfoGain, employs a Swiss tournament system with a proxy mutual-information-gain ","authors_text":"Andreas Chouliaras, Dimitris Chatzopoulos","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2025-11-16T21:55:59Z","title":"Maximizing the efficiency of human feedback in AI alignment: a comparative analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.12796","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5766b27509de56b29a11ddc689f438c7001ee7d10ee708e6562da366974b3173","target":"record","created_at":"2026-06-24T01:14:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d6c6b234bf71feedca04ee177823cfead8fa851e05201be8b34675c694c0098a","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.HC","submitted_at":"2025-11-16T21:55:59Z","title_canon_sha256":"d76681166c3f1369424d641f875aa27c43a21fd1429c766a7e8d43a414087bcf"},"schema_version":"1.0","source":{"id":"2511.12796","kind":"arxiv","version":2}},"canonical_sha256":"7c5330a295def5f997e993ac7c2afd43af2a9c85c0acafc68058d3718aa2491f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"7c5330a295def5f997e993ac7c2afd43af2a9c85c0acafc68058d3718aa2491f","first_computed_at":"2026-06-24T01:14:59.425620Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-24T01:14:59.425620Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"bZgHQdYKhH200BJk9vdRqjYAOVIQCr0vg1yp1Fbs+vLXVul9FFumyAPHXTjtWV8Qmh34nfjMHP/5pZUL8Wj8BA==","signature_status":"signed_v1","signed_at":"2026-06-24T01:14:59.426119Z","signed_message":"canonical_sha256_bytes"},"source_id":"2511.12796","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5766b27509de56b29a11ddc689f438c7001ee7d10ee708e6562da366974b3173","sha256:3638ad8ef1def60fe2428224cde0ac853d6699be83bebdd0d5150a2b3ad42b11"],"state_sha256":"cba1575ae50baaff4da8847bb3f69912e9b3cc0237e9df61512cff5494a33938"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"y4bCBok+7INxrarECYlBVjNC7v0ReVAtik2Gft4VYhFYTNEqcC5CLD15QAT5FhFXQaa0gXVO7xAg3OnR/eyUCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T11:18:31.196648Z","bundle_sha256":"554a414d76064e9d2e982f2a185d9d14c7ff609cebb38d6e73a0cdf55b12b02f"}}