{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:7MG3EZHZSP4R3RXPGKOQJUPFBE","short_pith_number":"pith:7MG3EZHZ","canonical_record":{"source":{"id":"1811.11958","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-29T04:26:07Z","cross_cats_sorted":[],"title_canon_sha256":"093d0aaa8b10d33d8712f027509e3e0b937a2e38bbcb0b0a7b82f663f4a74595","abstract_canon_sha256":"329b415c4ec49e996f19f188317c567e182536eaf7dccbe5216ac313badb52cc"},"schema_version":"1.0"},"canonical_sha256":"fb0db264f993f91dc6ef329d04d1e5092d5ac6c07df79c6183cc5a656ca1c688","source":{"kind":"arxiv","id":"1811.11958","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.11958","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"arxiv_version","alias_value":"1811.11958v1","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.11958","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"pith_short_12","alias_value":"7MG3EZHZSP4R","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7MG3EZHZSP4R3RXP","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7MG3EZHZ","created_at":"2026-05-18T12:32:11Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:7MG3EZHZSP4R3RXPGKOQJUPFBE","target":"record","payload":{"canonical_record":{"source":{"id":"1811.11958","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-29T04:26:07Z","cross_cats_sorted":[],"title_canon_sha256":"093d0aaa8b10d33d8712f027509e3e0b937a2e38bbcb0b0a7b82f663f4a74595","abstract_canon_sha256":"329b415c4ec49e996f19f188317c567e182536eaf7dccbe5216ac313badb52cc"},"schema_version":"1.0"},"canonical_sha256":"fb0db264f993f91dc6ef329d04d1e5092d5ac6c07df79c6183cc5a656ca1c688","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:59:34.973531Z","signature_b64":"oYITvqn80L4FgqZCaQBfyBGvSliwCmZroBTUVbMZwO18oEkplEvqrU0JQqIdWboXph5ecQwYxwXasIFSFiFKBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fb0db264f993f91dc6ef329d04d1e5092d5ac6c07df79c6183cc5a656ca1c688","last_reissued_at":"2026-05-17T23:59:34.972849Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:59:34.972849Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.11958","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"24cAfz8mPHbkS5AbZop4Oan6GihU+7v6T6x6QMNngTWRseq58KKWqPuZlUbM8GIZXfRjLClA8zFRMUQTRH76CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T02:10:36.658338Z"},"content_sha256":"0486adbfd5e381d9120fb5bd473c934e450f79b20209c14f17c3d54d0f073772","schema_version":"1.0","event_id":"sha256:0486adbfd5e381d9120fb5bd473c934e450f79b20209c14f17c3d54d0f073772"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:7MG3EZHZSP4R3RXPGKOQJUPFBE","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Large-scale Generative Modeling to Improve Automated Veterinary Disease Coding","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Allen Nie, James Zou, Yuhui Zhang","submitted_at":"2018-11-29T04:26:07Z","abstract_excerpt":"Supervised learning is limited both by the quantity and quality of the labeled data. In the field of medical record tagging, writing styles between hospitals vary drastically. The knowledge learned from one hospital might not transfer well to another. This problem is amplified in veterinary medicine domain because veterinary clinics rarely apply medical codes to their records. We proposed and trained the first large-scale generative modeling algorithm in automated disease coding. We demonstrate that generative modeling can learn discriminative features when additionally trained with supervised"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.11958","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:59:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MmAZUp2aW/m8lwPOV3AJvFPAjV/X7THqtf3lBm2y39sEvvum34R7rrlz95rxfhkstiLIUx+IHFMXY77erTcfDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T02:10:36.658696Z"},"content_sha256":"3a2fdbcf8e431d3296d9234e2fe77533cc474fe1015001d0a5e5bc0c58403b5e","schema_version":"1.0","event_id":"sha256:3a2fdbcf8e431d3296d9234e2fe77533cc474fe1015001d0a5e5bc0c58403b5e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/bundle.json","state_url":"https://pith.science/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T02:10:36Z","links":{"resolver":"https://pith.science/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE","bundle":"https://pith.science/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/bundle.json","state":"https://pith.science/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7MG3EZHZSP4R3RXPGKOQJUPFBE/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:7MG3EZHZSP4R3RXPGKOQJUPFBE","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"329b415c4ec49e996f19f188317c567e182536eaf7dccbe5216ac313badb52cc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-29T04:26:07Z","title_canon_sha256":"093d0aaa8b10d33d8712f027509e3e0b937a2e38bbcb0b0a7b82f663f4a74595"},"schema_version":"1.0","source":{"id":"1811.11958","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.11958","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"arxiv_version","alias_value":"1811.11958v1","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.11958","created_at":"2026-05-17T23:59:34Z"},{"alias_kind":"pith_short_12","alias_value":"7MG3EZHZSP4R","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_16","alias_value":"7MG3EZHZSP4R3RXP","created_at":"2026-05-18T12:32:11Z"},{"alias_kind":"pith_short_8","alias_value":"7MG3EZHZ","created_at":"2026-05-18T12:32:11Z"}],"graph_snapshots":[{"event_id":"sha256:3a2fdbcf8e431d3296d9234e2fe77533cc474fe1015001d0a5e5bc0c58403b5e","target":"graph","created_at":"2026-05-17T23:59:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Supervised learning is limited both by the quantity and quality of the labeled data. In the field of medical record tagging, writing styles between hospitals vary drastically. The knowledge learned from one hospital might not transfer well to another. This problem is amplified in veterinary medicine domain because veterinary clinics rarely apply medical codes to their records. We proposed and trained the first large-scale generative modeling algorithm in automated disease coding. We demonstrate that generative modeling can learn discriminative features when additionally trained with supervised","authors_text":"Allen Nie, James Zou, Yuhui Zhang","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-29T04:26:07Z","title":"Large-scale Generative Modeling to Improve Automated Veterinary Disease Coding"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.11958","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:0486adbfd5e381d9120fb5bd473c934e450f79b20209c14f17c3d54d0f073772","target":"record","created_at":"2026-05-17T23:59:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"329b415c4ec49e996f19f188317c567e182536eaf7dccbe5216ac313badb52cc","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2018-11-29T04:26:07Z","title_canon_sha256":"093d0aaa8b10d33d8712f027509e3e0b937a2e38bbcb0b0a7b82f663f4a74595"},"schema_version":"1.0","source":{"id":"1811.11958","kind":"arxiv","version":1}},"canonical_sha256":"fb0db264f993f91dc6ef329d04d1e5092d5ac6c07df79c6183cc5a656ca1c688","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fb0db264f993f91dc6ef329d04d1e5092d5ac6c07df79c6183cc5a656ca1c688","first_computed_at":"2026-05-17T23:59:34.972849Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:59:34.972849Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"oYITvqn80L4FgqZCaQBfyBGvSliwCmZroBTUVbMZwO18oEkplEvqrU0JQqIdWboXph5ecQwYxwXasIFSFiFKBw==","signature_status":"signed_v1","signed_at":"2026-05-17T23:59:34.973531Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.11958","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:0486adbfd5e381d9120fb5bd473c934e450f79b20209c14f17c3d54d0f073772","sha256:3a2fdbcf8e431d3296d9234e2fe77533cc474fe1015001d0a5e5bc0c58403b5e"],"state_sha256":"309d64ed643cc89139309e888d3a932b5a482dacc4ad0e4f23608261c5aa692d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bW2uRh+FqrT4QA0Uw/WyX1iVjHWkHQ0xWrnCDPZNgqA7JdnpLeFRzSYw67YDqigruEL44HZVhKP1Rn7c2uVKDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T02:10:36.660587Z","bundle_sha256":"79898839a2c1e6e2eb961e71419066768db0766a713b67bdb3b4bb38836d0129"}}