{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:YXUVRP56GGIOSYOZAMYHY4LYHQ","short_pith_number":"pith:YXUVRP56","canonical_record":{"source":{"id":"1610.08123","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-25T23:43:49Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"42a9fdcc2da5fe02efb19662b7ba04ee57b6c72d9dcf80994d973b856802454a","abstract_canon_sha256":"d1516d986f77bb774752c4dd46f7793a938f40022567fe5847bbc53d7c634c08"},"schema_version":"1.0"},"canonical_sha256":"c5e958bfbe3190e961d903307c71783c1b809cef5f0ebe3ba556c813bb9b091b","source":{"kind":"arxiv","id":"1610.08123","version":4},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.08123","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"arxiv_version","alias_value":"1610.08123v4","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.08123","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"pith_short_12","alias_value":"YXUVRP56GGIO","created_at":"2026-05-18T12:30:53Z"},{"alias_kind":"pith_short_16","alias_value":"YXUVRP56GGIOSYOZ","created_at":"2026-05-18T12:30:53Z"},{"alias_kind":"pith_short_8","alias_value":"YXUVRP56","created_at":"2026-05-18T12:30:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:YXUVRP56GGIOSYOZAMYHY4LYHQ","target":"record","payload":{"canonical_record":{"source":{"id":"1610.08123","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-25T23:43:49Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"42a9fdcc2da5fe02efb19662b7ba04ee57b6c72d9dcf80994d973b856802454a","abstract_canon_sha256":"d1516d986f77bb774752c4dd46f7793a938f40022567fe5847bbc53d7c634c08"},"schema_version":"1.0"},"canonical_sha256":"c5e958bfbe3190e961d903307c71783c1b809cef5f0ebe3ba556c813bb9b091b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:34:10.251907Z","signature_b64":"4osAD3EHdzlraaxgU9CBbrBvmgAPIsGQc9d5YmWMkNwnXmYDTr5hJFYA1X13E+KaaHtV5nBVEuCa95CWvDyRCg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c5e958bfbe3190e961d903307c71783c1b809cef5f0ebe3ba556c813bb9b091b","last_reissued_at":"2026-05-18T00:34:10.251193Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:34:10.251193Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1610.08123","source_version":4,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:34:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KppMhrIOvhdDVE/hzx+Ia/prM3i9QuWftyu5Si5Wa7ubJM9rbExVh55pDLLa5KGpYmHneke+Glvv8GMsRi9SCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:53:01.296032Z"},"content_sha256":"5c80abe62dfebfa97ed29ea582dcd36c5182729e3c982779d49cb4d3d7536ade","schema_version":"1.0","event_id":"sha256:5c80abe62dfebfa97ed29ea582dcd36c5182729e3c982779d49cb4d3d7536ade"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:YXUVRP56GGIOSYOZAMYHY4LYHQ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Socratic Learning: Augmenting Generative Models to Incorporate Latent Subsets in Training Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Bryan He, Christopher De Sa, Christopher R\\'e, Dan Iter, Paroma Varma, Peng Xu, Rose Yu","submitted_at":"2016-10-25T23:43:49Z","abstract_excerpt":"A challenge in training discriminative models like neural networks is obtaining enough labeled training data. Recent approaches use generative models to combine weak supervision sources, like user-defined heuristics or knowledge bases, to label training data. Prior work has explored learning accuracies for these sources even without ground truth labels, but they assume that a single accuracy parameter is sufficient to model the behavior of these sources over the entire training set. In particular, they fail to model latent subsets in the training data in which the supervision sources perform d"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.08123","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:34:10Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"2rZXNd1h3DTW40lvSH4GwQQJ/aO/uAXU0Bd4A4Bp9y0cwvtLISVTpFd1oVM6lBoAcR7TBno2Gm/MUlO2dQe2CQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-01T21:53:01.296407Z"},"content_sha256":"74716eda8ea60145d74d60e95f76f75f6a457eba4fa3db5979623435eac964f8","schema_version":"1.0","event_id":"sha256:74716eda8ea60145d74d60e95f76f75f6a457eba4fa3db5979623435eac964f8"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/bundle.json","state_url":"https://pith.science/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-01T21:53:01Z","links":{"resolver":"https://pith.science/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ","bundle":"https://pith.science/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/bundle.json","state":"https://pith.science/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YXUVRP56GGIOSYOZAMYHY4LYHQ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:YXUVRP56GGIOSYOZAMYHY4LYHQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d1516d986f77bb774752c4dd46f7793a938f40022567fe5847bbc53d7c634c08","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-25T23:43:49Z","title_canon_sha256":"42a9fdcc2da5fe02efb19662b7ba04ee57b6c72d9dcf80994d973b856802454a"},"schema_version":"1.0","source":{"id":"1610.08123","kind":"arxiv","version":4}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1610.08123","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"arxiv_version","alias_value":"1610.08123v4","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1610.08123","created_at":"2026-05-18T00:34:10Z"},{"alias_kind":"pith_short_12","alias_value":"YXUVRP56GGIO","created_at":"2026-05-18T12:30:53Z"},{"alias_kind":"pith_short_16","alias_value":"YXUVRP56GGIOSYOZ","created_at":"2026-05-18T12:30:53Z"},{"alias_kind":"pith_short_8","alias_value":"YXUVRP56","created_at":"2026-05-18T12:30:53Z"}],"graph_snapshots":[{"event_id":"sha256:74716eda8ea60145d74d60e95f76f75f6a457eba4fa3db5979623435eac964f8","target":"graph","created_at":"2026-05-18T00:34:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"A challenge in training discriminative models like neural networks is obtaining enough labeled training data. Recent approaches use generative models to combine weak supervision sources, like user-defined heuristics or knowledge bases, to label training data. Prior work has explored learning accuracies for these sources even without ground truth labels, but they assume that a single accuracy parameter is sufficient to model the behavior of these sources over the entire training set. In particular, they fail to model latent subsets in the training data in which the supervision sources perform d","authors_text":"Bryan He, Christopher De Sa, Christopher R\\'e, Dan Iter, Paroma Varma, Peng Xu, Rose Yu","cross_cats":["stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-25T23:43:49Z","title":"Socratic Learning: Augmenting Generative Models to Incorporate Latent Subsets in Training Data"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1610.08123","kind":"arxiv","version":4},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:5c80abe62dfebfa97ed29ea582dcd36c5182729e3c982779d49cb4d3d7536ade","target":"record","created_at":"2026-05-18T00:34:10Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d1516d986f77bb774752c4dd46f7793a938f40022567fe5847bbc53d7c634c08","cross_cats_sorted":["stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-10-25T23:43:49Z","title_canon_sha256":"42a9fdcc2da5fe02efb19662b7ba04ee57b6c72d9dcf80994d973b856802454a"},"schema_version":"1.0","source":{"id":"1610.08123","kind":"arxiv","version":4}},"canonical_sha256":"c5e958bfbe3190e961d903307c71783c1b809cef5f0ebe3ba556c813bb9b091b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c5e958bfbe3190e961d903307c71783c1b809cef5f0ebe3ba556c813bb9b091b","first_computed_at":"2026-05-18T00:34:10.251193Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:34:10.251193Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"4osAD3EHdzlraaxgU9CBbrBvmgAPIsGQc9d5YmWMkNwnXmYDTr5hJFYA1X13E+KaaHtV5nBVEuCa95CWvDyRCg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:34:10.251907Z","signed_message":"canonical_sha256_bytes"},"source_id":"1610.08123","source_kind":"arxiv","source_version":4}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:5c80abe62dfebfa97ed29ea582dcd36c5182729e3c982779d49cb4d3d7536ade","sha256:74716eda8ea60145d74d60e95f76f75f6a457eba4fa3db5979623435eac964f8"],"state_sha256":"fa2477d20c8569648071461109113609d18abbaa74c2cc2bf89567c282d73974"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"VSdrB0M404wOrA/+BnWQmm5IdlUoF3d8uiDnkh7U5uq0hhVEAT28fc375Ly97dOGo19KBKeaKpQemQdnUSPnCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-01T21:53:01.298362Z","bundle_sha256":"69c8f5901563e9d9b6231b8ba8869423cef1eab05b0e58a57026bd4badb2ffbb"}}