{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:PTVVYS5KIFUP47MPYE4V3ZB7FP","short_pith_number":"pith:PTVVYS5K","schema_version":"1.0","canonical_sha256":"7ceb5c4baa4168fe7d8fc1395de43f2be0d440540718d445076da1fc3a8de696","source":{"kind":"arxiv","id":"1801.07875","version":2},"attestation_state":"computed","paper":{"title":"Support Vector Machine Active Learning Algorithms with Query-by-Committee versus Closest-to-Hyperplane Selection","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.IR","stat.ML"],"primary_cat":"cs.LG","authors_text":"Michael Bloodgood","submitted_at":"2018-01-24T06:38:06Z","abstract_excerpt":"This paper investigates and evaluates support vector machine active learning algorithms for use with imbalanced datasets, which commonly arise in many applications such as information extraction applications. Algorithms based on closest-to-hyperplane selection and query-by-committee selection are combined with methods for addressing imbalance such as positive amplification based on prevalence statistics from initial random samples. Three algorithms (ClosestPA, QBagPA, and QBoostPA) are presented and carefully evaluated on datasets for text classification and relation extraction. The ClosestPA "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1801.07875","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-01-24T06:38:06Z","cross_cats_sorted":["cs.CL","cs.IR","stat.ML"],"title_canon_sha256":"df07afc330b8969248684298fabcd4cac1f74f3ea0c678c561e4e00c07898a75","abstract_canon_sha256":"3aaf0c0bcd25d44464a2cda600fe136dd18786b46510a628a97f40909a436fd4"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:46.690507Z","signature_b64":"+AvPXrOS3XWmK8LUgmiFimSAs6k3BWbbfFe4BsZNy2dYZA5bNe9b6s4hay1fE5OOMugVrlzT9W48xBTms9O5Aw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"7ceb5c4baa4168fe7d8fc1395de43f2be0d440540718d445076da1fc3a8de696","last_reissued_at":"2026-05-18T00:15:46.689816Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:46.689816Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Support Vector Machine Active Learning Algorithms with Query-by-Committee versus Closest-to-Hyperplane Selection","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.IR","stat.ML"],"primary_cat":"cs.LG","authors_text":"Michael Bloodgood","submitted_at":"2018-01-24T06:38:06Z","abstract_excerpt":"This paper investigates and evaluates support vector machine active learning algorithms for use with imbalanced datasets, which commonly arise in many applications such as information extraction applications. Algorithms based on closest-to-hyperplane selection and query-by-committee selection are combined with methods for addressing imbalance such as positive amplification based on prevalence statistics from initial random samples. Three algorithms (ClosestPA, QBagPA, and QBoostPA) are presented and carefully evaluated on datasets for text classification and relation extraction. The ClosestPA "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.07875","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1801.07875","created_at":"2026-05-18T00:15:46.689920+00:00"},{"alias_kind":"arxiv_version","alias_value":"1801.07875v2","created_at":"2026-05-18T00:15:46.689920+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.07875","created_at":"2026-05-18T00:15:46.689920+00:00"},{"alias_kind":"pith_short_12","alias_value":"PTVVYS5KIFUP","created_at":"2026-05-18T12:32:46.962924+00:00"},{"alias_kind":"pith_short_16","alias_value":"PTVVYS5KIFUP47MP","created_at":"2026-05-18T12:32:46.962924+00:00"},{"alias_kind":"pith_short_8","alias_value":"PTVVYS5K","created_at":"2026-05-18T12:32:46.962924+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP","json":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP.json","graph_json":"https://pith.science/api/pith-number/PTVVYS5KIFUP47MPYE4V3ZB7FP/graph.json","events_json":"https://pith.science/api/pith-number/PTVVYS5KIFUP47MPYE4V3ZB7FP/events.json","paper":"https://pith.science/paper/PTVVYS5K"},"agent_actions":{"view_html":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP","download_json":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP.json","view_paper":"https://pith.science/paper/PTVVYS5K","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1801.07875&json=true","fetch_graph":"https://pith.science/api/pith-number/PTVVYS5KIFUP47MPYE4V3ZB7FP/graph.json","fetch_events":"https://pith.science/api/pith-number/PTVVYS5KIFUP47MPYE4V3ZB7FP/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP/action/timestamp_anchor","attest_storage":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP/action/storage_attestation","attest_author":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP/action/author_attestation","sign_citation":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP/action/citation_signature","submit_replication":"https://pith.science/pith/PTVVYS5KIFUP47MPYE4V3ZB7FP/action/replication_record"}},"created_at":"2026-05-18T00:15:46.689920+00:00","updated_at":"2026-05-18T00:15:46.689920+00:00"}