{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2017:GPM27EDEJQ7INYP6OGDOPU45BP","short_pith_number":"pith:GPM27EDE","schema_version":"1.0","canonical_sha256":"33d9af90644c3e86e1fe7186e7d39d0bfd83809bf16f14c204b4c215740e9127","source":{"kind":"arxiv","id":"1708.04987","version":4},"attestation_state":"computed","paper":{"title":"ANI-1: A data set of 20M off-equilibrium DFT calculations for organic molecules","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","physics.data-an"],"primary_cat":"physics.chem-ph","authors_text":"Adrian E. Roitberg, Justin S. Smith, Olexandr Isayev","submitted_at":"2017-08-16T17:26:49Z","abstract_excerpt":"One of the grand challenges in modern theoretical chemistry is designing and implementing approximations that expedite ab initio methods without loss of accuracy. Machine learning (ML), in particular neural networks, are emerging as a powerful approach to constructing various forms of transferable atomistic potentials. They have been successfully applied in a variety of applications in chemistry, biology, catalysis, and solid-state physics. However, these models are heavily dependent on the quality and quantity of data used in their fitting. Fitting highly flexible ML potentials comes at a cos"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1708.04987","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"physics.chem-ph","submitted_at":"2017-08-16T17:26:49Z","cross_cats_sorted":["cs.LG","physics.data-an"],"title_canon_sha256":"b9a3c1d9a4f8056c13e24f5331d424dd20a9f094b39232fdfda887ad64227187","abstract_canon_sha256":"81912fdb4c9f266089637b8856a9dc97fbbd61a5732bbcb8664625cbb73d10e0"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:26:29.293752Z","signature_b64":"jiTPg/yEt1q+qH9rlqr7nDrwQj8/AKJeWqUpLz5MOySaTdP8OflkCe93/bftNimP8IXj4P9lmOyO03PnxO7ACw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"33d9af90644c3e86e1fe7186e7d39d0bfd83809bf16f14c204b4c215740e9127","last_reissued_at":"2026-05-18T00:26:29.292138Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:26:29.292138Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"ANI-1: A data set of 20M off-equilibrium DFT calculations for organic molecules","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","physics.data-an"],"primary_cat":"physics.chem-ph","authors_text":"Adrian E. Roitberg, Justin S. Smith, Olexandr Isayev","submitted_at":"2017-08-16T17:26:49Z","abstract_excerpt":"One of the grand challenges in modern theoretical chemistry is designing and implementing approximations that expedite ab initio methods without loss of accuracy. Machine learning (ML), in particular neural networks, are emerging as a powerful approach to constructing various forms of transferable atomistic potentials. They have been successfully applied in a variety of applications in chemistry, biology, catalysis, and solid-state physics. However, these models are heavily dependent on the quality and quantity of data used in their fitting. Fitting highly flexible ML potentials comes at a cos"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.04987","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1708.04987","created_at":"2026-05-18T00:26:29.292265+00:00"},{"alias_kind":"arxiv_version","alias_value":"1708.04987v4","created_at":"2026-05-18T00:26:29.292265+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.04987","created_at":"2026-05-18T00:26:29.292265+00:00"},{"alias_kind":"pith_short_12","alias_value":"GPM27EDEJQ7I","created_at":"2026-05-18T12:31:18.294218+00:00"},{"alias_kind":"pith_short_16","alias_value":"GPM27EDEJQ7INYP6","created_at":"2026-05-18T12:31:18.294218+00:00"},{"alias_kind":"pith_short_8","alias_value":"GPM27EDE","created_at":"2026-05-18T12:31:18.294218+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":1,"internal_anchor_count":0,"sample":[{"citing_arxiv_id":"2604.28064","citing_title":"3D Reconstruction Techniques in the Manufacturing Domain: Applications, Research Opportunities and Use Cases","ref_index":155,"is_internal_anchor":false}]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP","json":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP.json","graph_json":"https://pith.science/api/pith-number/GPM27EDEJQ7INYP6OGDOPU45BP/graph.json","events_json":"https://pith.science/api/pith-number/GPM27EDEJQ7INYP6OGDOPU45BP/events.json","paper":"https://pith.science/paper/GPM27EDE"},"agent_actions":{"view_html":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP","download_json":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP.json","view_paper":"https://pith.science/paper/GPM27EDE","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1708.04987&json=true","fetch_graph":"https://pith.science/api/pith-number/GPM27EDEJQ7INYP6OGDOPU45BP/graph.json","fetch_events":"https://pith.science/api/pith-number/GPM27EDEJQ7INYP6OGDOPU45BP/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP/action/timestamp_anchor","attest_storage":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP/action/storage_attestation","attest_author":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP/action/author_attestation","sign_citation":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP/action/citation_signature","submit_replication":"https://pith.science/pith/GPM27EDEJQ7INYP6OGDOPU45BP/action/replication_record"}},"created_at":"2026-05-18T00:26:29.292265+00:00","updated_at":"2026-05-18T00:26:29.292265+00:00"}