{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:6P4JKMWZTGY5ZAZSAQN7LRLUAX","short_pith_number":"pith:6P4JKMWZ","schema_version":"1.0","canonical_sha256":"f3f89532d999b1dc8332041bf5c57405f3cb6ebcc3b8eb2c641d3aa4ff6a98f1","source":{"kind":"arxiv","id":"1801.07887","version":2},"attestation_state":"computed","paper":{"title":"Impact of Batch Size on Stopping Active Learning for Text Classification","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.IR","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ethan Kochis, Garrett Beatty, Michael Bloodgood","submitted_at":"2018-01-24T07:47:05Z","abstract_excerpt":"When using active learning, smaller batch sizes are typically more efficient from a learning efficiency perspective. However, in practice due to speed and human annotator considerations, the use of larger batch sizes is necessary. While past work has shown that larger batch sizes decrease learning efficiency from a learning curve perspective, it remains an open question how batch size impacts methods for stopping active learning. We find that large batch sizes degrade the performance of a leading stopping method over and above the degradation that results from reduced learning efficiency. We a"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1801.07887","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-01-24T07:47:05Z","cross_cats_sorted":["cs.CL","cs.IR","stat.ML"],"title_canon_sha256":"4e649af60b4dc71d04ec8fafb70f57b857da8e2f0d0ef91755efd154e3c65561","abstract_canon_sha256":"1408b5f4f8684d5d29fd864153aea4226752a15093c6aa013ce0b6a4f99d2071"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:46.681692Z","signature_b64":"7yGEXh2u8dPHx10L3GHhNqMP3YNG/OCctWupqB98GtH45Vg2dMNaAchuz5CwQSRUuULK9JtmRNaAfckMvIuiCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f3f89532d999b1dc8332041bf5c57405f3cb6ebcc3b8eb2c641d3aa4ff6a98f1","last_reissued_at":"2026-05-18T00:15:46.681023Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:46.681023Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Impact of Batch Size on Stopping Active Learning for Text Classification","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.IR","stat.ML"],"primary_cat":"cs.LG","authors_text":"Ethan Kochis, Garrett Beatty, Michael Bloodgood","submitted_at":"2018-01-24T07:47:05Z","abstract_excerpt":"When using active learning, smaller batch sizes are typically more efficient from a learning efficiency perspective. However, in practice due to speed and human annotator considerations, the use of larger batch sizes is necessary. While past work has shown that larger batch sizes decrease learning efficiency from a learning curve perspective, it remains an open question how batch size impacts methods for stopping active learning. We find that large batch sizes degrade the performance of a leading stopping method over and above the degradation that results from reduced learning efficiency. We a"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1801.07887","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1801.07887","created_at":"2026-05-18T00:15:46.681147+00:00"},{"alias_kind":"arxiv_version","alias_value":"1801.07887v2","created_at":"2026-05-18T00:15:46.681147+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1801.07887","created_at":"2026-05-18T00:15:46.681147+00:00"},{"alias_kind":"pith_short_12","alias_value":"6P4JKMWZTGY5","created_at":"2026-05-18T12:32:11.075285+00:00"},{"alias_kind":"pith_short_16","alias_value":"6P4JKMWZTGY5ZAZS","created_at":"2026-05-18T12:32:11.075285+00:00"},{"alias_kind":"pith_short_8","alias_value":"6P4JKMWZ","created_at":"2026-05-18T12:32:11.075285+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX","json":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX.json","graph_json":"https://pith.science/api/pith-number/6P4JKMWZTGY5ZAZSAQN7LRLUAX/graph.json","events_json":"https://pith.science/api/pith-number/6P4JKMWZTGY5ZAZSAQN7LRLUAX/events.json","paper":"https://pith.science/paper/6P4JKMWZ"},"agent_actions":{"view_html":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX","download_json":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX.json","view_paper":"https://pith.science/paper/6P4JKMWZ","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1801.07887&json=true","fetch_graph":"https://pith.science/api/pith-number/6P4JKMWZTGY5ZAZSAQN7LRLUAX/graph.json","fetch_events":"https://pith.science/api/pith-number/6P4JKMWZTGY5ZAZSAQN7LRLUAX/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX/action/timestamp_anchor","attest_storage":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX/action/storage_attestation","attest_author":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX/action/author_attestation","sign_citation":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX/action/citation_signature","submit_replication":"https://pith.science/pith/6P4JKMWZTGY5ZAZSAQN7LRLUAX/action/replication_record"}},"created_at":"2026-05-18T00:15:46.681147+00:00","updated_at":"2026-05-18T00:15:46.681147+00:00"}