{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:2TYZRMI4LJES2TOM66E2WZEMLQ","short_pith_number":"pith:2TYZRMI4","canonical_record":{"source":{"id":"2606.22922","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527","abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a"},"schema_version":"1.0"},"canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","source":{"kind":"arxiv","id":"2606.22922","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"arxiv_version","alias_value":"2606.22922v1","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_12","alias_value":"2TYZRMI4LJES","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_16","alias_value":"2TYZRMI4LJES2TOM","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_8","alias_value":"2TYZRMI4","created_at":"2026-06-23T03:14:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:2TYZRMI4LJES2TOM66E2WZEMLQ","target":"record","payload":{"canonical_record":{"source":{"id":"2606.22922","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527","abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a"},"schema_version":"1.0"},"canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-23T03:14:04.291182Z","signature_b64":"1+CRVG4lZJRHsNVztNbd/V3KBQ1+v51tauidjS/zPeLgx2wW/NDPqB2C8qx9Z2pNec4BHVaRaLSAHwgBIZhuCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","last_reissued_at":"2026-06-23T03:14:04.290719Z","signature_status":"signed_v1","first_computed_at":"2026-06-23T03:14:04.290719Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.22922","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-23T03:14:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v7X2iZ3AopD4psQKeq6UFqPx/SWV6NfbSBKBr/4Ctp4c9EFGJ2WW6hQiYfm2CfWVPLtNVRJrbgNNlqo1nb+dCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T15:31:33.016750Z"},"content_sha256":"0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a","schema_version":"1.0","event_id":"sha256:0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:2TYZRMI4LJES2TOM66E2WZEMLQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Hierarchical Reinforcement Learning for Sparse-Reward Search in Commutative Algebra","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.AI","math.AC","math.CO"],"primary_cat":"cs.LG","authors_text":"Ali Shehper, Coco Huang, David Eisenbud, Davide Passaro, Giorgi Butbaia, Hailong Dao, Lucas Fagan, Michele Tarquini, Paul Orland, Sergei Gukov","submitted_at":"2026-06-22T07:02:08Z","abstract_excerpt":"Applying machine learning techniques to solving long-standing mathematical conjectures can be particularly challenging due to their extreme reward sparsity. As an illustrative example, we consider Kalai's algebraic Hirsch conjecture and recast the construction of its counterexamples as a sparse-reward reinforcement learning problem on graphs. We propose a constrained options-based HRL framework with an equivariant graph neural network policy, which allows us to learn useful temporal abstractions for this task. We evaluate our approach over a wide range of degrees and demonstrate that it consis"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.22922","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.22922/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-23T03:14:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"jFn9CgcTw3NxB+mTddYgF9V1PrlNw4RXHFm6IAET/F6sLYywFWQwiHeWtIISdOITCs+sbyx1JSMiBsMxjWEkDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-26T15:31:33.017139Z"},"content_sha256":"0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f","schema_version":"1.0","event_id":"sha256:0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/bundle.json","state_url":"https://pith.science/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-26T15:31:33Z","links":{"resolver":"https://pith.science/pith/2TYZRMI4LJES2TOM66E2WZEMLQ","bundle":"https://pith.science/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/bundle.json","state":"https://pith.science/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2TYZRMI4LJES2TOM66E2WZEMLQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2TYZRMI4LJES2TOM66E2WZEMLQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527"},"schema_version":"1.0","source":{"id":"2606.22922","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"arxiv_version","alias_value":"2606.22922v1","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_12","alias_value":"2TYZRMI4LJES","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_16","alias_value":"2TYZRMI4LJES2TOM","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_8","alias_value":"2TYZRMI4","created_at":"2026-06-23T03:14:04Z"}],"graph_snapshots":[{"event_id":"sha256:0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f","target":"graph","created_at":"2026-06-23T03:14:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.22922/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Applying machine learning techniques to solving long-standing mathematical conjectures can be particularly challenging due to their extreme reward sparsity. As an illustrative example, we consider Kalai's algebraic Hirsch conjecture and recast the construction of its counterexamples as a sparse-reward reinforcement learning problem on graphs. We propose a constrained options-based HRL framework with an equivariant graph neural network policy, which allows us to learn useful temporal abstractions for this task. We evaluate our approach over a wide range of degrees and demonstrate that it consis","authors_text":"Ali Shehper, Coco Huang, David Eisenbud, Davide Passaro, Giorgi Butbaia, Hailong Dao, Lucas Fagan, Michele Tarquini, Paul Orland, Sergei Gukov","cross_cats":["cs.AI","math.AC","math.CO"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title":"Hierarchical Reinforcement Learning for Sparse-Reward Search in Commutative Algebra"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.22922","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a","target":"record","created_at":"2026-06-23T03:14:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527"},"schema_version":"1.0","source":{"id":"2606.22922","kind":"arxiv","version":1}},"canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","first_computed_at":"2026-06-23T03:14:04.290719Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-23T03:14:04.290719Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1+CRVG4lZJRHsNVztNbd/V3KBQ1+v51tauidjS/zPeLgx2wW/NDPqB2C8qx9Z2pNec4BHVaRaLSAHwgBIZhuCA==","signature_status":"signed_v1","signed_at":"2026-06-23T03:14:04.291182Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.22922","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a","sha256:0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f"],"state_sha256":"0bbeef6c62cbac78c011301000691cf0bec83ac3fcc63c9dd1366de68b7b42d6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ikcoDQ42D1+Lu3aoxCVAACdbReBI1t1p6DOjaiwOaA4xKt9cgZbiL3TLQDri7A+t8L1QU2jlHVFDxd4cGK6SCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-26T15:31:33.019196Z","bundle_sha256":"cebd8df257f775cf145e18135ac2bcb48fb7bcf955e550fa479882a1c380aa61"}}