{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2TYZRMI4LJES2TOM66E2WZEMLQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527"},"schema_version":"1.0","source":{"id":"2606.22922","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"arxiv_version","alias_value":"2606.22922v1","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.22922","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_12","alias_value":"2TYZRMI4LJES","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_16","alias_value":"2TYZRMI4LJES2TOM","created_at":"2026-06-23T03:14:04Z"},{"alias_kind":"pith_short_8","alias_value":"2TYZRMI4","created_at":"2026-06-23T03:14:04Z"}],"graph_snapshots":[{"event_id":"sha256:0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f","target":"graph","created_at":"2026-06-23T03:14:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.22922/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Applying machine learning techniques to solving long-standing mathematical conjectures can be particularly challenging due to their extreme reward sparsity. As an illustrative example, we consider Kalai's algebraic Hirsch conjecture and recast the construction of its counterexamples as a sparse-reward reinforcement learning problem on graphs. We propose a constrained options-based HRL framework with an equivariant graph neural network policy, which allows us to learn useful temporal abstractions for this task. We evaluate our approach over a wide range of degrees and demonstrate that it consis","authors_text":"Ali Shehper, Coco Huang, David Eisenbud, Davide Passaro, Giorgi Butbaia, Hailong Dao, Lucas Fagan, Michele Tarquini, Paul Orland, Sergei Gukov","cross_cats":["cs.AI","math.AC","math.CO"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title":"Hierarchical Reinforcement Learning for Sparse-Reward Search in Commutative Algebra"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.22922","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a","target":"record","created_at":"2026-06-23T03:14:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7acb910b535db5d4a674f91d3966a22f1c404ba1a549cd672ddb48f687d5fb0a","cross_cats_sorted":["cs.AI","math.AC","math.CO"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-22T07:02:08Z","title_canon_sha256":"ba4820b5c63984cdfeae2607c62bd1b3aff53a9788e82a681ba43cd47d48f527"},"schema_version":"1.0","source":{"id":"2606.22922","kind":"arxiv","version":1}},"canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d4f198b11c5a492d4dccf789ab648c5c03c98422034478bbe5bbe3dce2dd7744","first_computed_at":"2026-06-23T03:14:04.290719Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-23T03:14:04.290719Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"1+CRVG4lZJRHsNVztNbd/V3KBQ1+v51tauidjS/zPeLgx2wW/NDPqB2C8qx9Z2pNec4BHVaRaLSAHwgBIZhuCA==","signature_status":"signed_v1","signed_at":"2026-06-23T03:14:04.291182Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.22922","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0b6a7d405e96b99c456464a0b7a72ad7e4304132d5dd9c2ae2dc111c9a7c365a","sha256:0813f085f5e5629c52a3326a7d9a2b62012622b8b76660035be344783e0d171f"],"state_sha256":"0bbeef6c62cbac78c011301000691cf0bec83ac3fcc63c9dd1366de68b7b42d6"}