{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:GU5RAH4LDPH4GSHPQ7QBFKEW74","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"25b30e670af14d96a0fadfddaaa2092caa2cfac327173a5ddaeb6a2142d2149a","cross_cats_sorted":["cs.LG","cs.LO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-19T10:05:43Z","title_canon_sha256":"5ed9d935f4c7e8f3135a93ce1b665bbfc643e474c5e3387d02178bdfad4e97e9"},"schema_version":"1.0","source":{"id":"1805.07563","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.07563","created_at":"2026-05-18T00:15:33Z"},{"alias_kind":"arxiv_version","alias_value":"1805.07563v1","created_at":"2026-05-18T00:15:33Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.07563","created_at":"2026-05-18T00:15:33Z"},{"alias_kind":"pith_short_12","alias_value":"GU5RAH4LDPH4","created_at":"2026-05-18T12:32:25Z"},{"alias_kind":"pith_short_16","alias_value":"GU5RAH4LDPH4GSHP","created_at":"2026-05-18T12:32:25Z"},{"alias_kind":"pith_short_8","alias_value":"GU5RAH4L","created_at":"2026-05-18T12:32:25Z"}],"graph_snapshots":[{"event_id":"sha256:3b8c33399ac3bf38088f80f2dab4d3ca36422fc9ea09c9d05e8a5571a3d97432","target":"graph","created_at":"2026-05-18T00:15:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We introduce a theorem proving algorithm that uses practically no domain heuristics for guiding its connection-style proof search. Instead, it runs many Monte-Carlo simulations guided by reinforcement learning from previous proof attempts. We produce several versions of the prover, parameterized by different learning and guiding algorithms. The strongest version of the system is trained on a large corpus of mathematical problems and evaluated on previously unseen problems. The trained system solves within the same number of inferences over 40% more problems than a baseline prover, which is an ","authors_text":"Cezary Kaliszyk, Henryk Michalewski, Josef Urban, Mirek Ol\\v{s}\\'ak","cross_cats":["cs.LG","cs.LO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-19T10:05:43Z","title":"Reinforcement Learning of Theorem Proving"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.07563","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:49baf9418a323a426cf3bf4574710abf771711b1425718fd564b61094fedb1f8","target":"record","created_at":"2026-05-18T00:15:33Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"25b30e670af14d96a0fadfddaaa2092caa2cfac327173a5ddaeb6a2142d2149a","cross_cats_sorted":["cs.LG","cs.LO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-19T10:05:43Z","title_canon_sha256":"5ed9d935f4c7e8f3135a93ce1b665bbfc643e474c5e3387d02178bdfad4e97e9"},"schema_version":"1.0","source":{"id":"1805.07563","kind":"arxiv","version":1}},"canonical_sha256":"353b101f8b1bcfc348ef87e012a896ff115e5e67f3f8ed2c0af7eccd49d12bea","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"353b101f8b1bcfc348ef87e012a896ff115e5e67f3f8ed2c0af7eccd49d12bea","first_computed_at":"2026-05-18T00:15:33.242269Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:33.242269Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"s3fsRnI8T2h8N8Y1eCcTV+nEUfXHo/YTmhZxUm/eANIWOkn+dzqd62YzsLobJ8Thq8RiBLMGkpIrnF3EH6IdAg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:33.242917Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.07563","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:49baf9418a323a426cf3bf4574710abf771711b1425718fd564b61094fedb1f8","sha256:3b8c33399ac3bf38088f80f2dab4d3ca36422fc9ea09c9d05e8a5571a3d97432"],"state_sha256":"addb40b6bd85504477f2e53bbb5686a3abc2da0f47a00b85708bd799055413db"}