{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:WI2BOOJOLFKAINU4DBC2PHW5CQ","short_pith_number":"pith:WI2BOOJO","canonical_record":{"source":{"id":"2606.24990","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T14:42:46Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"83503304e5e3d6894cc65275cb076f5d5e19cc6c4bd08a9642d97e7c11f38ea0","abstract_canon_sha256":"f1e773bed58a86555287f63581f45703a490244d3f21a61b98afc2b894a6ca6e"},"schema_version":"1.0"},"canonical_sha256":"b23417392e595404369c1845a79edd143846c1e8febe26fd887ba41daf3f102e","source":{"kind":"arxiv","id":"2606.24990","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24990","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24990v1","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24990","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"WI2BOOJOLFKA","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"WI2BOOJOLFKAINU4","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"WI2BOOJO","created_at":"2026-06-25T00:17:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:WI2BOOJOLFKAINU4DBC2PHW5CQ","target":"record","payload":{"canonical_record":{"source":{"id":"2606.24990","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T14:42:46Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"83503304e5e3d6894cc65275cb076f5d5e19cc6c4bd08a9642d97e7c11f38ea0","abstract_canon_sha256":"f1e773bed58a86555287f63581f45703a490244d3f21a61b98afc2b894a6ca6e"},"schema_version":"1.0"},"canonical_sha256":"b23417392e595404369c1845a79edd143846c1e8febe26fd887ba41daf3f102e","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-25T00:17:47.683301Z","signature_b64":"igC7sMZey9O/Da2wV9NhlLHDjxJBQNgwWB7CWdFEeZr27FkpX3CrsFR7uvjKZM3otI4AXplRFR3LvarVBvNLCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b23417392e595404369c1845a79edd143846c1e8febe26fd887ba41daf3f102e","last_reissued_at":"2026-06-25T00:17:47.682909Z","signature_status":"signed_v1","first_computed_at":"2026-06-25T00:17:47.682909Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.24990","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T00:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Ragn5AESjdL+iwQ+/+Z5Xc6PleXGvDFbFlV3RGt9EowIByDLlOTRIXXBtLug3ufrE9OycTRmNEyeAk+R+qqEBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T17:24:06.924437Z"},"content_sha256":"19910b2472aaf987bfd0d2bedaf9a7554ad56896ec233b97e2a337858ba08fae","schema_version":"1.0","event_id":"sha256:19910b2472aaf987bfd0d2bedaf9a7554ad56896ec233b97e2a337858ba08fae"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:WI2BOOJOLFKAINU4DBC2PHW5CQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Uncertainty-aware reinforcement learning for chemical language models","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Borja Medina, Jon Paul Janet","submitted_at":"2026-06-23T14:42:46Z","abstract_excerpt":"Reinforcement Learning (RL) has become a powerful paradigm for de novo molecular design, enabling Chemical Language Models (CLMs) to navigate and explore the chemical space while optimizing specific desired properties. However, the existing RL frameworks treat all scoring functions as deterministic oracles, neglecting the inherent uncertainty attached to the predictions of the different molecular properties. This can lead to the exploration of highly-uncertain regions of the chemical space, focusing on the generation of highly scored molecules which are poorly supported by the training data. T"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24990","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.24990/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-25T00:17:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9XX5GAG2UylgcUOMNsJTXYr4Q2LpD3Kcmce9NvTq7F3MPjTYtup/cIMMYIVhJdYjA3AlmFScY+W0saFd0N/NCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T17:24:06.924810Z"},"content_sha256":"9764b1ea35d01ba24b2a8f1e333544321bd084c737016bd3fd8b013316e46bb2","schema_version":"1.0","event_id":"sha256:9764b1ea35d01ba24b2a8f1e333544321bd084c737016bd3fd8b013316e46bb2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/bundle.json","state_url":"https://pith.science/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T17:24:06Z","links":{"resolver":"https://pith.science/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ","bundle":"https://pith.science/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/bundle.json","state":"https://pith.science/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/WI2BOOJOLFKAINU4DBC2PHW5CQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:WI2BOOJOLFKAINU4DBC2PHW5CQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f1e773bed58a86555287f63581f45703a490244d3f21a61b98afc2b894a6ca6e","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T14:42:46Z","title_canon_sha256":"83503304e5e3d6894cc65275cb076f5d5e19cc6c4bd08a9642d97e7c11f38ea0"},"schema_version":"1.0","source":{"id":"2606.24990","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.24990","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.24990v1","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24990","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_12","alias_value":"WI2BOOJOLFKA","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_16","alias_value":"WI2BOOJOLFKAINU4","created_at":"2026-06-25T00:17:47Z"},{"alias_kind":"pith_short_8","alias_value":"WI2BOOJO","created_at":"2026-06-25T00:17:47Z"}],"graph_snapshots":[{"event_id":"sha256:9764b1ea35d01ba24b2a8f1e333544321bd084c737016bd3fd8b013316e46bb2","target":"graph","created_at":"2026-06-25T00:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.24990/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Reinforcement Learning (RL) has become a powerful paradigm for de novo molecular design, enabling Chemical Language Models (CLMs) to navigate and explore the chemical space while optimizing specific desired properties. However, the existing RL frameworks treat all scoring functions as deterministic oracles, neglecting the inherent uncertainty attached to the predictions of the different molecular properties. This can lead to the exploration of highly-uncertain regions of the chemical space, focusing on the generation of highly scored molecules which are poorly supported by the training data. T","authors_text":"Borja Medina, Jon Paul Janet","cross_cats":["cs.AI"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T14:42:46Z","title":"Uncertainty-aware reinforcement learning for chemical language models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24990","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:19910b2472aaf987bfd0d2bedaf9a7554ad56896ec233b97e2a337858ba08fae","target":"record","created_at":"2026-06-25T00:17:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f1e773bed58a86555287f63581f45703a490244d3f21a61b98afc2b894a6ca6e","cross_cats_sorted":["cs.AI"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T14:42:46Z","title_canon_sha256":"83503304e5e3d6894cc65275cb076f5d5e19cc6c4bd08a9642d97e7c11f38ea0"},"schema_version":"1.0","source":{"id":"2606.24990","kind":"arxiv","version":1}},"canonical_sha256":"b23417392e595404369c1845a79edd143846c1e8febe26fd887ba41daf3f102e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b23417392e595404369c1845a79edd143846c1e8febe26fd887ba41daf3f102e","first_computed_at":"2026-06-25T00:17:47.682909Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-25T00:17:47.682909Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"igC7sMZey9O/Da2wV9NhlLHDjxJBQNgwWB7CWdFEeZr27FkpX3CrsFR7uvjKZM3otI4AXplRFR3LvarVBvNLCg==","signature_status":"signed_v1","signed_at":"2026-06-25T00:17:47.683301Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.24990","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:19910b2472aaf987bfd0d2bedaf9a7554ad56896ec233b97e2a337858ba08fae","sha256:9764b1ea35d01ba24b2a8f1e333544321bd084c737016bd3fd8b013316e46bb2"],"state_sha256":"f9888216e5ec1c42ec41fcf1cc79e055522288f7500e8e3948f70f28b61dbc57"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"in0C/FXvCPtzBOan1glSXc574SVKwTWyMBPRe15Dv0sFe9gRfM4lHy7Nkh/lMsUF2II8SD+2YVcNh2MJXw3bBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T17:24:06.926796Z","bundle_sha256":"1b55ff81ff64370f3ff745d5719d04f9a0ee235eb7991736d2a9a4437018a392"}}