{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:UHSMMUJSJZBGHAJ4CNQFJN6QA6","short_pith_number":"pith:UHSMMUJS","canonical_record":{"source":{"id":"2606.00512","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-30T04:01:14Z","cross_cats_sorted":["cs.IT","math.IT","stat.ML"],"title_canon_sha256":"eb11433b7f5ad9c7ad6fd282d59c699a37042fd487de68428d5fd2943a0b9b05","abstract_canon_sha256":"7d87445c817a1670f7ccb9c685da7ad9d2ab1c195e9bf82772b130c7e7eaacc4"},"schema_version":"1.0"},"canonical_sha256":"a1e4c651324e4263813c136054b7d007b7308558901db78d6a25b80ce4fdc9ca","source":{"kind":"arxiv","id":"2606.00512","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00512","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00512v1","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00512","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_12","alias_value":"UHSMMUJSJZBG","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_16","alias_value":"UHSMMUJSJZBGHAJ4","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_8","alias_value":"UHSMMUJS","created_at":"2026-06-02T01:03:56Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:UHSMMUJSJZBGHAJ4CNQFJN6QA6","target":"record","payload":{"canonical_record":{"source":{"id":"2606.00512","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-30T04:01:14Z","cross_cats_sorted":["cs.IT","math.IT","stat.ML"],"title_canon_sha256":"eb11433b7f5ad9c7ad6fd282d59c699a37042fd487de68428d5fd2943a0b9b05","abstract_canon_sha256":"7d87445c817a1670f7ccb9c685da7ad9d2ab1c195e9bf82772b130c7e7eaacc4"},"schema_version":"1.0"},"canonical_sha256":"a1e4c651324e4263813c136054b7d007b7308558901db78d6a25b80ce4fdc9ca","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T01:03:56.914952Z","signature_b64":"zVWL2IVrjW2uW8641XcBVThyv6h1iS18hhRNEQwz3HjYekclg7DY14AbvOMRsT4sYndQW7sXHZcbWjTefuglBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a1e4c651324e4263813c136054b7d007b7308558901db78d6a25b80ce4fdc9ca","last_reissued_at":"2026-06-02T01:03:56.914569Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T01:03:56.914569Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.00512","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bVgDXUhJcJ+8czMQffRbYQcMSkK42teBit/KLP06YtmP8mnOxbJZckxP8FiUPeSsDvGyFEkv8gjjMo4IwZkfCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T16:02:06.593397Z"},"content_sha256":"8356963f6de81b9eeab8e7a138a2e56056d9664593d50d02149b53882789ccc9","schema_version":"1.0","event_id":"sha256:8356963f6de81b9eeab8e7a138a2e56056d9664593d50d02149b53882789ccc9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:UHSMMUJSJZBGHAJ4CNQFJN6QA6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Semi-Supervised Learning with Noisy Proxy Covariates: Generalization Bounds and Distribution Regression","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.IT","math.IT","stat.ML"],"primary_cat":"cs.LG","authors_text":"Jisu Kim, Kwangho Kim","submitted_at":"2026-05-30T04:01:14Z","abstract_excerpt":"In many modern machine learning pipelines, abundant pretrained representations serve as noisy proxy covariates, while task-specific labels remain scarce. We study semi-supervised regression in this setting, and propose a simple two stage estimator that learns kernel eigenfeatures from all proxy covariates and fits a ridge predictor on labeled data. We derive finite sample bounds showing that fast labeled sample rates are recovered when proxy perturbation is controlled and unlabeled proxy covariates are sufficiently abundant. We also show that distribution regression is a direct special case, w"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00512","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.00512/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T01:03:56Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OVDoXedzz0fwn88iCvl0krmar99mBLyrw6HagWXGzdwdtejpo8aOt3mQgbFfOpQMjPYX1TcbDtGbaDUoBzIgDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-11T16:02:06.594178Z"},"content_sha256":"cf7e864a2c8792fa59299297bfc691b641307cea75ec5306bd0b0f7989b407a2","schema_version":"1.0","event_id":"sha256:cf7e864a2c8792fa59299297bfc691b641307cea75ec5306bd0b0f7989b407a2"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/bundle.json","state_url":"https://pith.science/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-11T16:02:06Z","links":{"resolver":"https://pith.science/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6","bundle":"https://pith.science/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/bundle.json","state":"https://pith.science/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/UHSMMUJSJZBGHAJ4CNQFJN6QA6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:UHSMMUJSJZBGHAJ4CNQFJN6QA6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7d87445c817a1670f7ccb9c685da7ad9d2ab1c195e9bf82772b130c7e7eaacc4","cross_cats_sorted":["cs.IT","math.IT","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-30T04:01:14Z","title_canon_sha256":"eb11433b7f5ad9c7ad6fd282d59c699a37042fd487de68428d5fd2943a0b9b05"},"schema_version":"1.0","source":{"id":"2606.00512","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.00512","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"arxiv_version","alias_value":"2606.00512v1","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.00512","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_12","alias_value":"UHSMMUJSJZBG","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_16","alias_value":"UHSMMUJSJZBGHAJ4","created_at":"2026-06-02T01:03:56Z"},{"alias_kind":"pith_short_8","alias_value":"UHSMMUJS","created_at":"2026-06-02T01:03:56Z"}],"graph_snapshots":[{"event_id":"sha256:cf7e864a2c8792fa59299297bfc691b641307cea75ec5306bd0b0f7989b407a2","target":"graph","created_at":"2026-06-02T01:03:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.00512/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In many modern machine learning pipelines, abundant pretrained representations serve as noisy proxy covariates, while task-specific labels remain scarce. We study semi-supervised regression in this setting, and propose a simple two stage estimator that learns kernel eigenfeatures from all proxy covariates and fits a ridge predictor on labeled data. We derive finite sample bounds showing that fast labeled sample rates are recovered when proxy perturbation is controlled and unlabeled proxy covariates are sufficiently abundant. We also show that distribution regression is a direct special case, w","authors_text":"Jisu Kim, Kwangho Kim","cross_cats":["cs.IT","math.IT","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-30T04:01:14Z","title":"Semi-Supervised Learning with Noisy Proxy Covariates: Generalization Bounds and Distribution Regression"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.00512","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8356963f6de81b9eeab8e7a138a2e56056d9664593d50d02149b53882789ccc9","target":"record","created_at":"2026-06-02T01:03:56Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7d87445c817a1670f7ccb9c685da7ad9d2ab1c195e9bf82772b130c7e7eaacc4","cross_cats_sorted":["cs.IT","math.IT","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-30T04:01:14Z","title_canon_sha256":"eb11433b7f5ad9c7ad6fd282d59c699a37042fd487de68428d5fd2943a0b9b05"},"schema_version":"1.0","source":{"id":"2606.00512","kind":"arxiv","version":1}},"canonical_sha256":"a1e4c651324e4263813c136054b7d007b7308558901db78d6a25b80ce4fdc9ca","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a1e4c651324e4263813c136054b7d007b7308558901db78d6a25b80ce4fdc9ca","first_computed_at":"2026-06-02T01:03:56.914569Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T01:03:56.914569Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"zVWL2IVrjW2uW8641XcBVThyv6h1iS18hhRNEQwz3HjYekclg7DY14AbvOMRsT4sYndQW7sXHZcbWjTefuglBg==","signature_status":"signed_v1","signed_at":"2026-06-02T01:03:56.914952Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.00512","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8356963f6de81b9eeab8e7a138a2e56056d9664593d50d02149b53882789ccc9","sha256:cf7e864a2c8792fa59299297bfc691b641307cea75ec5306bd0b0f7989b407a2"],"state_sha256":"f98120d4e61436d80dfeb22fa88a156ac416c74d97bf350948b77775782d1737"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"I/IiuLTiVPHJ2WmVR7PYvLWb8+ilqg7l42zDhKEr0Kh/pStCl7hssM2PQVbFErvrewSaWTLRAHy+6fhW6aRFBw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-11T16:02:06.597602Z","bundle_sha256":"ca12de2f9008f16cbc66b577c83da17761a013dcdce96a926c3bc3c4eae0e632"}}