{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:TNJ5UYESW5COHMQOVUPVGSTMPJ","short_pith_number":"pith:TNJ5UYES","schema_version":"1.0","canonical_sha256":"9b53da6092b744e3b20ead1f534a6c7a602c309d1104881a4b0750c64092faf5","source":{"kind":"arxiv","id":"1809.03207","version":4},"attestation_state":"computed","paper":{"title":"Beyond the Selected Completely At Random Assumption for Learning from Positive and Unlabeled Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Jessa Bekker, Jesse Davis, Pieter Robberechts","submitted_at":"2018-09-10T09:23:32Z","abstract_excerpt":"Most positive and unlabeled data is subject to selection biases. The labeled examples can, for example, be selected from the positive set because they are easier to obtain or more obviously positive. This paper investigates how learning can be ena BHbled in this setting. We propose and theoretically analyze an empirical-risk-based method for incorporating the labeling mechanism. Additionally, we investigate under which assumptions learning is possible when the labeling mechanism is not fully understood and propose a practical method to enable this. Our empirical analysis supports the theoretic"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1809.03207","kind":"arxiv","version":4},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-09-10T09:23:32Z","cross_cats_sorted":["stat.ML"],"title_canon_sha256":"e4b0dd22fde81e0065a6368dc3a10f1740568cd867810b893b336976031c5c80","abstract_canon_sha256":"1e1581c8d6dfbb5ecb0b1c4582c3ec2823ccd9302c8d1ea8aef7e8a12550fcfb"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:42:03.045002Z","signature_b64":"T2cQDzpxBQ13zxtp3KKyD56WlM0IBtKaeeXLIlQD/5cdvTUvSN4XSUFFC+WgJAMnW1gWcqKBjMA9nug684gXBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9b53da6092b744e3b20ead1f534a6c7a602c309d1104881a4b0750c64092faf5","last_reissued_at":"2026-05-17T23:42:03.044350Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:42:03.044350Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Beyond the Selected Completely At Random Assumption for Learning from Positive and Unlabeled Data","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ML"],"primary_cat":"cs.LG","authors_text":"Jessa Bekker, Jesse Davis, Pieter Robberechts","submitted_at":"2018-09-10T09:23:32Z","abstract_excerpt":"Most positive and unlabeled data is subject to selection biases. The labeled examples can, for example, be selected from the positive set because they are easier to obtain or more obviously positive. This paper investigates how learning can be ena BHbled in this setting. We propose and theoretically analyze an empirical-risk-based method for incorporating the labeling mechanism. Additionally, we investigate under which assumptions learning is possible when the labeling mechanism is not fully understood and propose a practical method to enable this. Our empirical analysis supports the theoretic"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1809.03207","kind":"arxiv","version":4},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1809.03207","created_at":"2026-05-17T23:42:03.044452+00:00"},{"alias_kind":"arxiv_version","alias_value":"1809.03207v4","created_at":"2026-05-17T23:42:03.044452+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1809.03207","created_at":"2026-05-17T23:42:03.044452+00:00"},{"alias_kind":"pith_short_12","alias_value":"TNJ5UYESW5CO","created_at":"2026-05-18T12:32:53.628368+00:00"},{"alias_kind":"pith_short_16","alias_value":"TNJ5UYESW5COHMQO","created_at":"2026-05-18T12:32:53.628368+00:00"},{"alias_kind":"pith_short_8","alias_value":"TNJ5UYES","created_at":"2026-05-18T12:32:53.628368+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ","json":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ.json","graph_json":"https://pith.science/api/pith-number/TNJ5UYESW5COHMQOVUPVGSTMPJ/graph.json","events_json":"https://pith.science/api/pith-number/TNJ5UYESW5COHMQOVUPVGSTMPJ/events.json","paper":"https://pith.science/paper/TNJ5UYES"},"agent_actions":{"view_html":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ","download_json":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ.json","view_paper":"https://pith.science/paper/TNJ5UYES","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1809.03207&json=true","fetch_graph":"https://pith.science/api/pith-number/TNJ5UYESW5COHMQOVUPVGSTMPJ/graph.json","fetch_events":"https://pith.science/api/pith-number/TNJ5UYESW5COHMQOVUPVGSTMPJ/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ/action/timestamp_anchor","attest_storage":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ/action/storage_attestation","attest_author":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ/action/author_attestation","sign_citation":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ/action/citation_signature","submit_replication":"https://pith.science/pith/TNJ5UYESW5COHMQOVUPVGSTMPJ/action/replication_record"}},"created_at":"2026-05-17T23:42:03.044452+00:00","updated_at":"2026-05-17T23:42:03.044452+00:00"}