{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:B4ENL7AW45INWTHHG5SZR3DETG","short_pith_number":"pith:B4ENL7AW","canonical_record":{"source":{"id":"2606.24622","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T14:20:42Z","cross_cats_sorted":["cs.HC"],"title_canon_sha256":"10ba1db44bbd9e48a8282276874eee0a972ec620940a43997109ee54501da249","abstract_canon_sha256":"86ea992d604ef0f90edb2083eb4add0916f01a3b52ab9a94387af35f6223b12d"},"schema_version":"1.0"},"canonical_sha256":"0f08d5fc16e750db4ce7376598ec6499a440a5a05b133fc3a9eb36e474116f82","source":{"kind":"arxiv","id":"2606.24622","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24622","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24622v1","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24622","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_12","alias_value":"B4ENL7AW45IN","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_16","alias_value":"B4ENL7AW45INWTHH","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_8","alias_value":"B4ENL7AW","created_at":"2026-06-24T01:15:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:B4ENL7AW45INWTHHG5SZR3DETG","target":"record","payload":{"canonical_record":{"source":{"id":"2606.24622","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T14:20:42Z","cross_cats_sorted":["cs.HC"],"title_canon_sha256":"10ba1db44bbd9e48a8282276874eee0a972ec620940a43997109ee54501da249","abstract_canon_sha256":"86ea992d604ef0f90edb2083eb4add0916f01a3b52ab9a94387af35f6223b12d"},"schema_version":"1.0"},"canonical_sha256":"0f08d5fc16e750db4ce7376598ec6499a440a5a05b133fc3a9eb36e474116f82","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-24T01:15:37.380066Z","signature_b64":"Cyei1rB7mhVZAu2WECj7JJfBp2azrPZgXOi0PzK6zY+IorWnX6M1xxHqbIbtWe2rSFp7c3PGXCvQwb6vRYA6Cg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0f08d5fc16e750db4ce7376598ec6499a440a5a05b133fc3a9eb36e474116f82","last_reissued_at":"2026-06-24T01:15:37.379744Z","signature_status":"signed_v1","first_computed_at":"2026-06-24T01:15:37.379744Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.24622","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pCXWm94UigePcopT4FrVpxy4qlnyh2jOHbUUr2sBeor4Qf2kRcoLrO17oU4J0a4gSALXyeD7rrENOrZKugegCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T10:14:33.163090Z"},"content_sha256":"40161ffabe795ae05faecaf4cb1189ecca683076e382bf605ed62e43f8caf493","schema_version":"1.0","event_id":"sha256:40161ffabe795ae05faecaf4cb1189ecca683076e382bf605ed62e43f8caf493"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:B4ENL7AW45INWTHHG5SZR3DETG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Themis: An explainable AI-enabled framework for Reinforcement Learning with Human Feedback","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.HC"],"primary_cat":"cs.AI","authors_text":"Andreas Chouliaras, Dimitris Chatzpoulos, Luke Connolly","submitted_at":"2026-06-23T14:20:42Z","abstract_excerpt":"Training safe Reinforcement Learning (RL) systems is inherently challenging, with no guarantee of avoiding unwanted behaviors. The most effective defenses against this are (i) transparency through explainability and (ii) alignment via human feedback. While both show promising results, no publicly available framework currently combines them. To address this, we introduce Themis, an XAI-enabled testing and evaluation framework for Reinforcement Learning from Human Feedback. Themis supports over 200 widely used environments and is easily configurable for experiments in RL, transparency, and align"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24622","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.24622/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-24T01:15:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BiE9CeT1z0PGpCY2ZjPIakl1E1x62gXLNW3TkurxKnx1IgrEY8Z1y9J7ybAkeeUW9WVr5JHR8NJwo6+WBt6NBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T10:14:33.163472Z"},"content_sha256":"13d0a3d2bc5ba3ce9b25c782a5bf23a25ae581d2ee6c16756b704d33d5b5ad5f","schema_version":"1.0","event_id":"sha256:13d0a3d2bc5ba3ce9b25c782a5bf23a25ae581d2ee6c16756b704d33d5b5ad5f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/B4ENL7AW45INWTHHG5SZR3DETG/bundle.json","state_url":"https://pith.science/pith/B4ENL7AW45INWTHHG5SZR3DETG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/B4ENL7AW45INWTHHG5SZR3DETG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T10:14:33Z","links":{"resolver":"https://pith.science/pith/B4ENL7AW45INWTHHG5SZR3DETG","bundle":"https://pith.science/pith/B4ENL7AW45INWTHHG5SZR3DETG/bundle.json","state":"https://pith.science/pith/B4ENL7AW45INWTHHG5SZR3DETG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/B4ENL7AW45INWTHHG5SZR3DETG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:B4ENL7AW45INWTHHG5SZR3DETG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"86ea992d604ef0f90edb2083eb4add0916f01a3b52ab9a94387af35f6223b12d","cross_cats_sorted":["cs.HC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T14:20:42Z","title_canon_sha256":"10ba1db44bbd9e48a8282276874eee0a972ec620940a43997109ee54501da249"},"schema_version":"1.0","source":{"id":"2606.24622","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24622","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24622v1","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24622","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_12","alias_value":"B4ENL7AW45IN","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_16","alias_value":"B4ENL7AW45INWTHH","created_at":"2026-06-24T01:15:37Z"},{"alias_kind":"pith_short_8","alias_value":"B4ENL7AW","created_at":"2026-06-24T01:15:37Z"}],"graph_snapshots":[{"event_id":"sha256:13d0a3d2bc5ba3ce9b25c782a5bf23a25ae581d2ee6c16756b704d33d5b5ad5f","target":"graph","created_at":"2026-06-24T01:15:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.24622/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Training safe Reinforcement Learning (RL) systems is inherently challenging, with no guarantee of avoiding unwanted behaviors. The most effective defenses against this are (i) transparency through explainability and (ii) alignment via human feedback. While both show promising results, no publicly available framework currently combines them. To address this, we introduce Themis, an XAI-enabled testing and evaluation framework for Reinforcement Learning from Human Feedback. Themis supports over 200 widely used environments and is easily configurable for experiments in RL, transparency, and align","authors_text":"Andreas Chouliaras, Dimitris Chatzpoulos, Luke Connolly","cross_cats":["cs.HC"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T14:20:42Z","title":"Themis: An explainable AI-enabled framework for Reinforcement Learning with Human Feedback"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24622","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:40161ffabe795ae05faecaf4cb1189ecca683076e382bf605ed62e43f8caf493","target":"record","created_at":"2026-06-24T01:15:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"86ea992d604ef0f90edb2083eb4add0916f01a3b52ab9a94387af35f6223b12d","cross_cats_sorted":["cs.HC"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-06-23T14:20:42Z","title_canon_sha256":"10ba1db44bbd9e48a8282276874eee0a972ec620940a43997109ee54501da249"},"schema_version":"1.0","source":{"id":"2606.24622","kind":"arxiv","version":1}},"canonical_sha256":"0f08d5fc16e750db4ce7376598ec6499a440a5a05b133fc3a9eb36e474116f82","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0f08d5fc16e750db4ce7376598ec6499a440a5a05b133fc3a9eb36e474116f82","first_computed_at":"2026-06-24T01:15:37.379744Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-24T01:15:37.379744Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Cyei1rB7mhVZAu2WECj7JJfBp2azrPZgXOi0PzK6zY+IorWnX6M1xxHqbIbtWe2rSFp7c3PGXCvQwb6vRYA6Cg==","signature_status":"signed_v1","signed_at":"2026-06-24T01:15:37.380066Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.24622","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:40161ffabe795ae05faecaf4cb1189ecca683076e382bf605ed62e43f8caf493","sha256:13d0a3d2bc5ba3ce9b25c782a5bf23a25ae581d2ee6c16756b704d33d5b5ad5f"],"state_sha256":"0656fdec6d0110b927e9e993a78963fc2e6c15f9dc5e29785f1af121b80fd59b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"I5hL1kFNoTRuL5V68+7JrkFwL9/4zgYUMxxi7u2l/BxpvlIfnb6oHrJ4zk7raePdG6CwPSoS92kcNEtI+y/4Dw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T10:14:33.165376Z","bundle_sha256":"d10ca2f99497e36c03f72dbdeed6e00cc27e9e97b7d97bb7ff6100032919f163"}}