{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:3NCPVYDQPC344AYMFG5P2WOSYY","short_pith_number":"pith:3NCPVYDQ","canonical_record":{"source":{"id":"2605.17758","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T02:24:52Z","cross_cats_sorted":[],"title_canon_sha256":"d4af9a1b00e2a8f44772c18d638061e894801dba323891c034a033a2181fb041","abstract_canon_sha256":"10b63049e01e0a5be6ad568e6ee133610dbd7a1dfb753de1d3bc13aa67866e56"},"schema_version":"1.0"},"canonical_sha256":"db44fae07078b7ce030c29bafd59d2c63c1fa00e36b3ab248ff3b376114cdf44","source":{"kind":"arxiv","id":"2605.17758","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.17758","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"arxiv_version","alias_value":"2605.17758v1","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.17758","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_12","alias_value":"3NCPVYDQPC34","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_16","alias_value":"3NCPVYDQPC344AYM","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_8","alias_value":"3NCPVYDQ","created_at":"2026-05-20T00:04:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:3NCPVYDQPC344AYMFG5P2WOSYY","target":"record","payload":{"canonical_record":{"source":{"id":"2605.17758","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T02:24:52Z","cross_cats_sorted":[],"title_canon_sha256":"d4af9a1b00e2a8f44772c18d638061e894801dba323891c034a033a2181fb041","abstract_canon_sha256":"10b63049e01e0a5be6ad568e6ee133610dbd7a1dfb753de1d3bc13aa67866e56"},"schema_version":"1.0"},"canonical_sha256":"db44fae07078b7ce030c29bafd59d2c63c1fa00e36b3ab248ff3b376114cdf44","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:04:56.745760Z","signature_b64":"h2hMm3uU5bCQX3tLXfz3DDc+mwpwH55nLIeglQnWdII0gna90yawGrVEkUN0L09DRgihZ5Qjr17gTr5P9KofBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"db44fae07078b7ce030c29bafd59d2c63c1fa00e36b3ab248ff3b376114cdf44","last_reissued_at":"2026-05-20T00:04:56.744954Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:04:56.744954Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.17758","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:04:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"651/FS5BtRDiqpS0mykagRSuNCGDrW8RKWsN3uJL8JT8MP6iV5voWqNrdo6BmLy/gnsoJ+mqwssOH98roay/AQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:01:30.757959Z"},"content_sha256":"06cc2fe663ab92a4040ae1765070d72ec1b60397cf45ccfb506aeadb21d411f9","schema_version":"1.0","event_id":"sha256:06cc2fe663ab92a4040ae1765070d72ec1b60397cf45ccfb506aeadb21d411f9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:3NCPVYDQPC344AYMFG5P2WOSYY","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Memisis: Orchestrating and Evaluating Synthetic Data for Tabular Health Datasets","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Aadi Sharma, Amir M. Rahmani, Arshia Harish Puthran, Ian Harris, Mahdi Bagheri, Muhjaazee Love, Nitish Nagesh, Pengbao Zhou","submitted_at":"2026-05-18T02:24:52Z","abstract_excerpt":"Synthetic data is widely used in healthcare to create datasets that are similar to original data but without the privacy concerns. Generating and evaluating synthetic data across privacy, utility and fairness is crucial for facilitating high quality data availability for downstream prediction tasks and clinical decision making. We present Memisis, a tool that orchestrates and evaluates synthetic data by leveraging existing synthetic data tools, the power of large language models and state-of-the-art evaluation metrics. Our tool creates a unified workflow for data generation, validation and eva"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.17758","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.17758/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:04:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"zOroSzXS3mk8yEkVmGChrSbLkQ2v0GCKZeRytDMc2Hn630rpdbFViUW+sfI3uEjVLOfcWa2yyFvdHNYChsT0CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T20:01:30.758668Z"},"content_sha256":"dcfe07c666e60832f6c7744f04a7436d99d941cb37715ffdca5c82786324e841","schema_version":"1.0","event_id":"sha256:dcfe07c666e60832f6c7744f04a7436d99d941cb37715ffdca5c82786324e841"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/3NCPVYDQPC344AYMFG5P2WOSYY/bundle.json","state_url":"https://pith.science/pith/3NCPVYDQPC344AYMFG5P2WOSYY/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/3NCPVYDQPC344AYMFG5P2WOSYY/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T20:01:30Z","links":{"resolver":"https://pith.science/pith/3NCPVYDQPC344AYMFG5P2WOSYY","bundle":"https://pith.science/pith/3NCPVYDQPC344AYMFG5P2WOSYY/bundle.json","state":"https://pith.science/pith/3NCPVYDQPC344AYMFG5P2WOSYY/state.json","well_known_bundle":"https://pith.science/.well-known/pith/3NCPVYDQPC344AYMFG5P2WOSYY/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:3NCPVYDQPC344AYMFG5P2WOSYY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"10b63049e01e0a5be6ad568e6ee133610dbd7a1dfb753de1d3bc13aa67866e56","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T02:24:52Z","title_canon_sha256":"d4af9a1b00e2a8f44772c18d638061e894801dba323891c034a033a2181fb041"},"schema_version":"1.0","source":{"id":"2605.17758","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.17758","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"arxiv_version","alias_value":"2605.17758v1","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.17758","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_12","alias_value":"3NCPVYDQPC34","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_16","alias_value":"3NCPVYDQPC344AYM","created_at":"2026-05-20T00:04:56Z"},{"alias_kind":"pith_short_8","alias_value":"3NCPVYDQ","created_at":"2026-05-20T00:04:56Z"}],"graph_snapshots":[{"event_id":"sha256:dcfe07c666e60832f6c7744f04a7436d99d941cb37715ffdca5c82786324e841","target":"graph","created_at":"2026-05-20T00:04:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.17758/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Synthetic data is widely used in healthcare to create datasets that are similar to original data but without the privacy concerns. Generating and evaluating synthetic data across privacy, utility and fairness is crucial for facilitating high quality data availability for downstream prediction tasks and clinical decision making. We present Memisis, a tool that orchestrates and evaluates synthetic data by leveraging existing synthetic data tools, the power of large language models and state-of-the-art evaluation metrics. Our tool creates a unified workflow for data generation, validation and eva","authors_text":"Aadi Sharma, Amir M. Rahmani, Arshia Harish Puthran, Ian Harris, Mahdi Bagheri, Muhjaazee Love, Nitish Nagesh, Pengbao Zhou","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T02:24:52Z","title":"Memisis: Orchestrating and Evaluating Synthetic Data for Tabular Health Datasets"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.17758","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:06cc2fe663ab92a4040ae1765070d72ec1b60397cf45ccfb506aeadb21d411f9","target":"record","created_at":"2026-05-20T00:04:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"10b63049e01e0a5be6ad568e6ee133610dbd7a1dfb753de1d3bc13aa67866e56","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-05-18T02:24:52Z","title_canon_sha256":"d4af9a1b00e2a8f44772c18d638061e894801dba323891c034a033a2181fb041"},"schema_version":"1.0","source":{"id":"2605.17758","kind":"arxiv","version":1}},"canonical_sha256":"db44fae07078b7ce030c29bafd59d2c63c1fa00e36b3ab248ff3b376114cdf44","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"db44fae07078b7ce030c29bafd59d2c63c1fa00e36b3ab248ff3b376114cdf44","first_computed_at":"2026-05-20T00:04:56.744954Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:04:56.744954Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"h2hMm3uU5bCQX3tLXfz3DDc+mwpwH55nLIeglQnWdII0gna90yawGrVEkUN0L09DRgihZ5Qjr17gTr5P9KofBw==","signature_status":"signed_v1","signed_at":"2026-05-20T00:04:56.745760Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.17758","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:06cc2fe663ab92a4040ae1765070d72ec1b60397cf45ccfb506aeadb21d411f9","sha256:dcfe07c666e60832f6c7744f04a7436d99d941cb37715ffdca5c82786324e841"],"state_sha256":"10f6a65c9c0d1b1df12ecb24706100a64a0bcd6653fa2ba651e6c368157d0f70"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"EL51JcbWQWM0qOfnGExJdVaXQdNh7NLo0b5YJVNdZ+FzJdHMGPLx7kitdCi8ZOZiOWfIMu19kOLoVUXZTqLLDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T20:01:30.762232Z","bundle_sha256":"14343c2becb6b3aafdd6cc3528873051d2e1266efbb8c878c7312f37c2fabb85"}}