{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:6PW4FQDNMBYT23ABGHXXHZVHJE","short_pith_number":"pith:6PW4FQDN","canonical_record":{"source":{"id":"1712.02034","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-12-06T04:29:28Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"title_canon_sha256":"3b67952769a84b491ae86930d5769121f4d1852c3ec38aecc39a2873eb832739","abstract_canon_sha256":"c4c7891fda7a799e0e3d8f6da90fcebcb645deaf5fa5b91d34895f9d7ee82a3d"},"schema_version":"1.0"},"canonical_sha256":"f3edc2c06d60713d6c0131ef73e6a7490be01ae512166204cc42aabf07fa5ee4","source":{"kind":"arxiv","id":"1712.02034","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.02034","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"arxiv_version","alias_value":"1712.02034v2","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.02034","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"pith_short_12","alias_value":"6PW4FQDNMBYT","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_16","alias_value":"6PW4FQDNMBYT23AB","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_8","alias_value":"6PW4FQDN","created_at":"2026-05-18T12:31:03Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:6PW4FQDNMBYT23ABGHXXHZVHJE","target":"record","payload":{"canonical_record":{"source":{"id":"1712.02034","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-12-06T04:29:28Z","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"title_canon_sha256":"3b67952769a84b491ae86930d5769121f4d1852c3ec38aecc39a2873eb832739","abstract_canon_sha256":"c4c7891fda7a799e0e3d8f6da90fcebcb645deaf5fa5b91d34895f9d7ee82a3d"},"schema_version":"1.0"},"canonical_sha256":"f3edc2c06d60713d6c0131ef73e6a7490be01ae512166204cc42aabf07fa5ee4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:08:03.219095Z","signature_b64":"d+MJYb8H7ROlRu958VLGE7GTWbrOno4PgyCgGiV3MnRvh9HggCNAMsf3CW1XFDGIJCYPqrzv54BYX1okq/jiAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f3edc2c06d60713d6c0131ef73e6a7490be01ae512166204cc42aabf07fa5ee4","last_reissued_at":"2026-05-18T00:08:03.218606Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:08:03.218606Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1712.02034","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:08:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JwQAJKQrQRhsDi5rQ275wUztGL3AkgPbyCsWHaobkM2sLTq/HADc6cl7jQ/0OETWYdpa/VMHVxhMgIPfPP2qAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T22:17:24.739909Z"},"content_sha256":"36489bfb0ace77285d3511aeefb39f729ffef3d5fa1883d640c3e9bc31025739","schema_version":"1.0","event_id":"sha256:36489bfb0ace77285d3511aeefb39f729ffef3d5fa1883d640c3e9bc31025739"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:6PW4FQDNMBYT23ABGHXXHZVHJE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"SMILES2Vec: An Interpretable General-Purpose Deep Neural Network for Predicting Chemical Properties","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.CL","cs.LG"],"primary_cat":"stat.ML","authors_text":"Abhinav Vishnu, Charles Siegel, Garrett B. Goh, Nathan O. Hodas","submitted_at":"2017-12-06T04:29:28Z","abstract_excerpt":"Chemical databases store information in text representations, and the SMILES format is a universal standard used in many cheminformatics software. Encoded in each SMILES string is structural information that can be used to predict complex chemical properties. In this work, we develop SMILES2vec, a deep RNN that automatically learns features from SMILES to predict chemical properties, without the need for additional explicit feature engineering. Using Bayesian optimization methods to tune the network architecture, we show that an optimized SMILES2vec model can serve as a general-purpose neural "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.02034","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:08:03Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ccR0pQevyyZ2Vydgio9b2P52FQ6CAbDFUhD1ma4nMMJD50pecRTEIs2mxcWBV+lBtLzfJicDnbmFk9b14CS7DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T22:17:24.740544Z"},"content_sha256":"34be63fa7209a02743cddfa0b29c9ec7be3a25cf33b77a275354926d0c149362","schema_version":"1.0","event_id":"sha256:34be63fa7209a02743cddfa0b29c9ec7be3a25cf33b77a275354926d0c149362"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/bundle.json","state_url":"https://pith.science/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T22:17:24Z","links":{"resolver":"https://pith.science/pith/6PW4FQDNMBYT23ABGHXXHZVHJE","bundle":"https://pith.science/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/bundle.json","state":"https://pith.science/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/6PW4FQDNMBYT23ABGHXXHZVHJE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:6PW4FQDNMBYT23ABGHXXHZVHJE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"c4c7891fda7a799e0e3d8f6da90fcebcb645deaf5fa5b91d34895f9d7ee82a3d","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-12-06T04:29:28Z","title_canon_sha256":"3b67952769a84b491ae86930d5769121f4d1852c3ec38aecc39a2873eb832739"},"schema_version":"1.0","source":{"id":"1712.02034","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1712.02034","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"arxiv_version","alias_value":"1712.02034v2","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1712.02034","created_at":"2026-05-18T00:08:03Z"},{"alias_kind":"pith_short_12","alias_value":"6PW4FQDNMBYT","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_16","alias_value":"6PW4FQDNMBYT23AB","created_at":"2026-05-18T12:31:03Z"},{"alias_kind":"pith_short_8","alias_value":"6PW4FQDN","created_at":"2026-05-18T12:31:03Z"}],"graph_snapshots":[{"event_id":"sha256:34be63fa7209a02743cddfa0b29c9ec7be3a25cf33b77a275354926d0c149362","target":"graph","created_at":"2026-05-18T00:08:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Chemical databases store information in text representations, and the SMILES format is a universal standard used in many cheminformatics software. Encoded in each SMILES string is structural information that can be used to predict complex chemical properties. In this work, we develop SMILES2vec, a deep RNN that automatically learns features from SMILES to predict chemical properties, without the need for additional explicit feature engineering. Using Bayesian optimization methods to tune the network architecture, we show that an optimized SMILES2vec model can serve as a general-purpose neural ","authors_text":"Abhinav Vishnu, Charles Siegel, Garrett B. Goh, Nathan O. Hodas","cross_cats":["cs.AI","cs.CL","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-12-06T04:29:28Z","title":"SMILES2Vec: An Interpretable General-Purpose Deep Neural Network for Predicting Chemical Properties"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1712.02034","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:36489bfb0ace77285d3511aeefb39f729ffef3d5fa1883d640c3e9bc31025739","target":"record","created_at":"2026-05-18T00:08:03Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"c4c7891fda7a799e0e3d8f6da90fcebcb645deaf5fa5b91d34895f9d7ee82a3d","cross_cats_sorted":["cs.AI","cs.CL","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2017-12-06T04:29:28Z","title_canon_sha256":"3b67952769a84b491ae86930d5769121f4d1852c3ec38aecc39a2873eb832739"},"schema_version":"1.0","source":{"id":"1712.02034","kind":"arxiv","version":2}},"canonical_sha256":"f3edc2c06d60713d6c0131ef73e6a7490be01ae512166204cc42aabf07fa5ee4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"f3edc2c06d60713d6c0131ef73e6a7490be01ae512166204cc42aabf07fa5ee4","first_computed_at":"2026-05-18T00:08:03.218606Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:08:03.218606Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"d+MJYb8H7ROlRu958VLGE7GTWbrOno4PgyCgGiV3MnRvh9HggCNAMsf3CW1XFDGIJCYPqrzv54BYX1okq/jiAg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:08:03.219095Z","signed_message":"canonical_sha256_bytes"},"source_id":"1712.02034","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:36489bfb0ace77285d3511aeefb39f729ffef3d5fa1883d640c3e9bc31025739","sha256:34be63fa7209a02743cddfa0b29c9ec7be3a25cf33b77a275354926d0c149362"],"state_sha256":"e7ec02105b3b339c7dce5c86386069dbae2216215a5c744f8d798af6cb80e754"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sQpuCvd9SUYvG+sAWRkab9zZNkFpmIPfu6TwIeHtEIJru/9rZy9VJJCUf5gDsU9nEvxLqUJR+vSIFQj9TaENBg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T22:17:24.743272Z","bundle_sha256":"5293565ca15491cdb2b81e1de6eacc5c3a0319c4b6b31834b4a7434e73956bea"}}