{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2019:YKG2GZMKBPHKDGREQLC6LKGGYS","short_pith_number":"pith:YKG2GZMK","canonical_record":{"source":{"id":"1903.00458","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-03-01T18:39:00Z","cross_cats_sorted":[],"title_canon_sha256":"2d2e3a16040351971e6c4f2b147e350bd6d97c3750e07f6dbe9b71d8f3dc0950","abstract_canon_sha256":"b450e0221d401098e64e7abea0c12746d140721ad161b7a6f8cf564769c3daaa"},"schema_version":"1.0"},"canonical_sha256":"c28da3658a0bcea19a2482c5e5a8c6c4abcafd2f0f01041c209d0bcfcdb921b2","source":{"kind":"arxiv","id":"1903.00458","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.00458","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"arxiv_version","alias_value":"1903.00458v1","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.00458","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"pith_short_12","alias_value":"YKG2GZMKBPHK","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_16","alias_value":"YKG2GZMKBPHKDGRE","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_8","alias_value":"YKG2GZMK","created_at":"2026-05-18T12:33:33Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2019:YKG2GZMKBPHKDGREQLC6LKGGYS","target":"record","payload":{"canonical_record":{"source":{"id":"1903.00458","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-03-01T18:39:00Z","cross_cats_sorted":[],"title_canon_sha256":"2d2e3a16040351971e6c4f2b147e350bd6d97c3750e07f6dbe9b71d8f3dc0950","abstract_canon_sha256":"b450e0221d401098e64e7abea0c12746d140721ad161b7a6f8cf564769c3daaa"},"schema_version":"1.0"},"canonical_sha256":"c28da3658a0bcea19a2482c5e5a8c6c4abcafd2f0f01041c209d0bcfcdb921b2","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:52:19.604377Z","signature_b64":"Sex/EXiLM5raX95kZmJpXvU9KXLVkhv62eEI+XcpBLk7/SNSr+9yWUCqsuI4xxszefG5VxbcWJdcjyWfkSeMBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c28da3658a0bcea19a2482c5e5a8c6c4abcafd2f0f01041c209d0bcfcdb921b2","last_reissued_at":"2026-05-17T23:52:19.603791Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:52:19.603791Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1903.00458","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:52:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3kexpjGGTXbiSje65LrUmVBu3lUAy6aYrOVxCLC7cUpoHAXuwbT1CRPeU1Krdj6UUKTJ7o+daoW/jM5PbE6OBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T19:42:46.698074Z"},"content_sha256":"3c77e6424bb44786cf94950c97ce6bff7b34179bc9e22e69b0669696e64dfe9a","schema_version":"1.0","event_id":"sha256:3c77e6424bb44786cf94950c97ce6bff7b34179bc9e22e69b0669696e64dfe9a"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2019:YKG2GZMKBPHKDGREQLC6LKGGYS","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"How to Hallucinate Functional Proteins","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"q-bio.QM","authors_text":"Hector Garcia Martin, Zak Costello","submitted_at":"2019-03-01T18:39:00Z","abstract_excerpt":"Here we present a novel approach to protein design and phenotypic inference using a generative model for protein sequences. BioSeqVAE, a variational autoencoder variant, can hallucinate syntactically valid protein sequences that are likely to fold and function. BioSeqVAE is trained on the entire known protein sequence space and learns to generate valid examples of protein sequences in an unsupervised manner. The model is validated by showing that its latent feature space is useful and that it accurately reconstructs sequences. Its usefulness is demonstrated with a selection of relevant downstr"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.00458","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:52:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9my1F9M8GWBFetH7pNj483659Oj6ZzN+y7MQqqsBY7Z+okdRkyGtYT7XedxbilcLe7ferxIeJ8aignvbAJwKAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-04T19:42:46.698465Z"},"content_sha256":"4a62696aa462904737c770dc49071d572217ccb70cf17d7b86a92abf019e8908","schema_version":"1.0","event_id":"sha256:4a62696aa462904737c770dc49071d572217ccb70cf17d7b86a92abf019e8908"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/bundle.json","state_url":"https://pith.science/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-04T19:42:46Z","links":{"resolver":"https://pith.science/pith/YKG2GZMKBPHKDGREQLC6LKGGYS","bundle":"https://pith.science/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/bundle.json","state":"https://pith.science/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YKG2GZMKBPHKDGREQLC6LKGGYS/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2019:YKG2GZMKBPHKDGREQLC6LKGGYS","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"b450e0221d401098e64e7abea0c12746d140721ad161b7a6f8cf564769c3daaa","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-03-01T18:39:00Z","title_canon_sha256":"2d2e3a16040351971e6c4f2b147e350bd6d97c3750e07f6dbe9b71d8f3dc0950"},"schema_version":"1.0","source":{"id":"1903.00458","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1903.00458","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"arxiv_version","alias_value":"1903.00458v1","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1903.00458","created_at":"2026-05-17T23:52:19Z"},{"alias_kind":"pith_short_12","alias_value":"YKG2GZMKBPHK","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_16","alias_value":"YKG2GZMKBPHKDGRE","created_at":"2026-05-18T12:33:33Z"},{"alias_kind":"pith_short_8","alias_value":"YKG2GZMK","created_at":"2026-05-18T12:33:33Z"}],"graph_snapshots":[{"event_id":"sha256:4a62696aa462904737c770dc49071d572217ccb70cf17d7b86a92abf019e8908","target":"graph","created_at":"2026-05-17T23:52:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Here we present a novel approach to protein design and phenotypic inference using a generative model for protein sequences. BioSeqVAE, a variational autoencoder variant, can hallucinate syntactically valid protein sequences that are likely to fold and function. BioSeqVAE is trained on the entire known protein sequence space and learns to generate valid examples of protein sequences in an unsupervised manner. The model is validated by showing that its latent feature space is useful and that it accurately reconstructs sequences. Its usefulness is demonstrated with a selection of relevant downstr","authors_text":"Hector Garcia Martin, Zak Costello","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-03-01T18:39:00Z","title":"How to Hallucinate Functional Proteins"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1903.00458","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3c77e6424bb44786cf94950c97ce6bff7b34179bc9e22e69b0669696e64dfe9a","target":"record","created_at":"2026-05-17T23:52:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"b450e0221d401098e64e7abea0c12746d140721ad161b7a6f8cf564769c3daaa","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"q-bio.QM","submitted_at":"2019-03-01T18:39:00Z","title_canon_sha256":"2d2e3a16040351971e6c4f2b147e350bd6d97c3750e07f6dbe9b71d8f3dc0950"},"schema_version":"1.0","source":{"id":"1903.00458","kind":"arxiv","version":1}},"canonical_sha256":"c28da3658a0bcea19a2482c5e5a8c6c4abcafd2f0f01041c209d0bcfcdb921b2","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c28da3658a0bcea19a2482c5e5a8c6c4abcafd2f0f01041c209d0bcfcdb921b2","first_computed_at":"2026-05-17T23:52:19.603791Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:52:19.603791Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"Sex/EXiLM5raX95kZmJpXvU9KXLVkhv62eEI+XcpBLk7/SNSr+9yWUCqsuI4xxszefG5VxbcWJdcjyWfkSeMBg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:52:19.604377Z","signed_message":"canonical_sha256_bytes"},"source_id":"1903.00458","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3c77e6424bb44786cf94950c97ce6bff7b34179bc9e22e69b0669696e64dfe9a","sha256:4a62696aa462904737c770dc49071d572217ccb70cf17d7b86a92abf019e8908"],"state_sha256":"a3f274add445760b915d58a1f5da949264f902046693cdda8088fea4a1992ccf"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"lfdEEgd69SNjkP6/7flD39Ie7pmsJDwO7xUBGS2kxGQcUDweh3AJKFyIs0DG3chNZUAI4Rnguj8Ye9HC8+gCCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-04T19:42:46.700364Z","bundle_sha256":"b36fd2eec089dccd8805ef7a584eb09da96426dc72fe4e9774f09955229667bf"}}