{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:XFQWT2RUKVYSPY7QE7FGBMC6GX","short_pith_number":"pith:XFQWT2RU","canonical_record":{"source":{"id":"2606.06746","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-04T21:59:47Z","cross_cats_sorted":[],"title_canon_sha256":"eaf52ffc352ebbcffb97668a369d7c1d6f46fc10fd7a983c6b45e2444481caca","abstract_canon_sha256":"0e70e3f2d6a2a27e5e2398f3d3789133f8ab34058d3744ec57322e02c903c4f8"},"schema_version":"1.0"},"canonical_sha256":"b96169ea34557127e3f027ca60b05e35dc6c6137f652de7e47e029323207d34d","source":{"kind":"arxiv","id":"2606.06746","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06746","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06746v1","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06746","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_12","alias_value":"XFQWT2RUKVYS","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_16","alias_value":"XFQWT2RUKVYSPY7Q","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_8","alias_value":"XFQWT2RU","created_at":"2026-06-08T01:04:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:XFQWT2RUKVYSPY7QE7FGBMC6GX","target":"record","payload":{"canonical_record":{"source":{"id":"2606.06746","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-04T21:59:47Z","cross_cats_sorted":[],"title_canon_sha256":"eaf52ffc352ebbcffb97668a369d7c1d6f46fc10fd7a983c6b45e2444481caca","abstract_canon_sha256":"0e70e3f2d6a2a27e5e2398f3d3789133f8ab34058d3744ec57322e02c903c4f8"},"schema_version":"1.0"},"canonical_sha256":"b96169ea34557127e3f027ca60b05e35dc6c6137f652de7e47e029323207d34d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-08T01:04:25.830760Z","signature_b64":"7GyPO+XiVQatTbCm8rtutYTiXpqgFhP0xt0ZBQ0uBcy7RoOjeDEw6vbyCGhJLPEkCwWcZRAZY+rQoClNGmRCCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b96169ea34557127e3f027ca60b05e35dc6c6137f652de7e47e029323207d34d","last_reissued_at":"2026-06-08T01:04:25.829947Z","signature_status":"signed_v1","first_computed_at":"2026-06-08T01:04:25.829947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.06746","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SuZTFm2MioIecFID7wjB8+0JluFpaaZDocwZdKfP0JbTr0TXkqP4P5rUuGY8HpWye4jtamASfUn6yZIjT+WPBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T21:00:33.265402Z"},"content_sha256":"751a5a570115142f7d599d41d54fafc0041e3e08f8cc752e64794c96e575e8f3","schema_version":"1.0","event_id":"sha256:751a5a570115142f7d599d41d54fafc0041e3e08f8cc752e64794c96e575e8f3"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:XFQWT2RUKVYSPY7QE7FGBMC6GX","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Performance Variation in Deep Reinforcement Learning","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"A. Rupam Mahmood, Haruto Tanaka","submitted_at":"2026-06-04T21:59:47Z","abstract_excerpt":"Deep reinforcement learning (RL) algorithms often suffer from low run-to-run robustness, manifesting as significant performance variation across independent runs of identically configured agents. Although this issue poses a spectrum of challenges across research and practice, relatively few studies develop methods to evaluate it; RL research instead often reports uncertainty in the estimated mean performance. In this paper, we outline the limitations of conventional uncertainty and variation estimates, particularly their misalignment with purpose and the risk of underreporting. We then propose"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06746","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.06746/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:25Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yXiaMj7HB11xKn3riQ9VgbB0fEGiQfu4Wkp9QZmFAhJ2vD8hfRxrgJi71G4bfgR1lCARRFkeX5fJnsvzuo5FDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T21:00:33.265771Z"},"content_sha256":"48acd1a0578696cdf0a07ff3435e09a33772a28151096a64c263793af389f338","schema_version":"1.0","event_id":"sha256:48acd1a0578696cdf0a07ff3435e09a33772a28151096a64c263793af389f338"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/bundle.json","state_url":"https://pith.science/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T21:00:33Z","links":{"resolver":"https://pith.science/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX","bundle":"https://pith.science/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/bundle.json","state":"https://pith.science/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/state.json","well_known_bundle":"https://pith.science/.well-known/pith/XFQWT2RUKVYSPY7QE7FGBMC6GX/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:XFQWT2RUKVYSPY7QE7FGBMC6GX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0e70e3f2d6a2a27e5e2398f3d3789133f8ab34058d3744ec57322e02c903c4f8","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-04T21:59:47Z","title_canon_sha256":"eaf52ffc352ebbcffb97668a369d7c1d6f46fc10fd7a983c6b45e2444481caca"},"schema_version":"1.0","source":{"id":"2606.06746","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06746","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06746v1","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06746","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_12","alias_value":"XFQWT2RUKVYS","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_16","alias_value":"XFQWT2RUKVYSPY7Q","created_at":"2026-06-08T01:04:25Z"},{"alias_kind":"pith_short_8","alias_value":"XFQWT2RU","created_at":"2026-06-08T01:04:25Z"}],"graph_snapshots":[{"event_id":"sha256:48acd1a0578696cdf0a07ff3435e09a33772a28151096a64c263793af389f338","target":"graph","created_at":"2026-06-08T01:04:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.06746/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Deep reinforcement learning (RL) algorithms often suffer from low run-to-run robustness, manifesting as significant performance variation across independent runs of identically configured agents. Although this issue poses a spectrum of challenges across research and practice, relatively few studies develop methods to evaluate it; RL research instead often reports uncertainty in the estimated mean performance. In this paper, we outline the limitations of conventional uncertainty and variation estimates, particularly their misalignment with purpose and the risk of underreporting. We then propose","authors_text":"A. Rupam Mahmood, Haruto Tanaka","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-04T21:59:47Z","title":"Performance Variation in Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06746","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:751a5a570115142f7d599d41d54fafc0041e3e08f8cc752e64794c96e575e8f3","target":"record","created_at":"2026-06-08T01:04:25Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0e70e3f2d6a2a27e5e2398f3d3789133f8ab34058d3744ec57322e02c903c4f8","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-04T21:59:47Z","title_canon_sha256":"eaf52ffc352ebbcffb97668a369d7c1d6f46fc10fd7a983c6b45e2444481caca"},"schema_version":"1.0","source":{"id":"2606.06746","kind":"arxiv","version":1}},"canonical_sha256":"b96169ea34557127e3f027ca60b05e35dc6c6137f652de7e47e029323207d34d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"b96169ea34557127e3f027ca60b05e35dc6c6137f652de7e47e029323207d34d","first_computed_at":"2026-06-08T01:04:25.829947Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-08T01:04:25.829947Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"7GyPO+XiVQatTbCm8rtutYTiXpqgFhP0xt0ZBQ0uBcy7RoOjeDEw6vbyCGhJLPEkCwWcZRAZY+rQoClNGmRCCg==","signature_status":"signed_v1","signed_at":"2026-06-08T01:04:25.830760Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.06746","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:751a5a570115142f7d599d41d54fafc0041e3e08f8cc752e64794c96e575e8f3","sha256:48acd1a0578696cdf0a07ff3435e09a33772a28151096a64c263793af389f338"],"state_sha256":"7d22193308cea21f916723750c793e4e7e72b96948898e2637f75f3d547a338e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"a2q0ORIQAVthmKY6PUWsBiom+HQUh6o4KrhRcSCA3zh7rj2z+oYBDmUw3iL2+c/zHg+CObndfA55o5as/EaXCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T21:00:33.267831Z","bundle_sha256":"89bab5521476f01d93ffef0bbc2e141e8cadac20cf0b66687c5d49c4f2c11e8e"}}