{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2012:VGVPBJYXVBPDNKZOLLFO22WIAW","short_pith_number":"pith:VGVPBJYX","canonical_record":{"source":{"id":"1211.1323","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2012-11-06T17:42:00Z","cross_cats_sorted":["stat.ME","stat.ML"],"title_canon_sha256":"dba2da7fe66e1eba707eaa026c0a1d9832197f9d7a19c72fbaa0ca3f5859e35b","abstract_canon_sha256":"dcae6dc7a353ab30027dd14b89b453d20bdb2c12b32501119220fa7874ad6de7"},"schema_version":"1.0"},"canonical_sha256":"a9aaf0a717a85e36ab2e5acaed6ac8058d801a69ec942ec098b02ea342245b78","source":{"kind":"arxiv","id":"1211.1323","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1211.1323","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"arxiv_version","alias_value":"1211.1323v3","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1211.1323","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"pith_short_12","alias_value":"VGVPBJYXVBPD","created_at":"2026-05-18T12:27:25Z"},{"alias_kind":"pith_short_16","alias_value":"VGVPBJYXVBPDNKZO","created_at":"2026-05-18T12:27:25Z"},{"alias_kind":"pith_short_8","alias_value":"VGVPBJYX","created_at":"2026-05-18T12:27:25Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2012:VGVPBJYXVBPDNKZOLLFO22WIAW","target":"record","payload":{"canonical_record":{"source":{"id":"1211.1323","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2012-11-06T17:42:00Z","cross_cats_sorted":["stat.ME","stat.ML"],"title_canon_sha256":"dba2da7fe66e1eba707eaa026c0a1d9832197f9d7a19c72fbaa0ca3f5859e35b","abstract_canon_sha256":"dcae6dc7a353ab30027dd14b89b453d20bdb2c12b32501119220fa7874ad6de7"},"schema_version":"1.0"},"canonical_sha256":"a9aaf0a717a85e36ab2e5acaed6ac8058d801a69ec942ec098b02ea342245b78","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:17:12.659465Z","signature_b64":"SHldM+TGX8rBKMMcnVlfAcOCbNt6WH4pxGUurRThXexF3HRTR3VbxScINH1c2xorbakt3HuROcn7Ib8iPYSHCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a9aaf0a717a85e36ab2e5acaed6ac8058d801a69ec942ec098b02ea342245b78","last_reissued_at":"2026-05-18T02:17:12.658879Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:17:12.658879Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1211.1323","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:17:12Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"0R6N/AqlolK2IUmfd+dvt0lKtySRNT2IzYTAElIKP0O4Relrm63r4Z5W4X7iMUyWugm7+8B2gACSk79BoE4IAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T10:52:26.778568Z"},"content_sha256":"b70385981a7aa9596c83e7005543335492ff00a0eeccaabb84dd52792e77d55e","schema_version":"1.0","event_id":"sha256:b70385981a7aa9596c83e7005543335492ff00a0eeccaabb84dd52792e77d55e"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2012:VGVPBJYXVBPDNKZOLLFO22WIAW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sample Size Planning for Classification Models","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["stat.ME","stat.ML"],"primary_cat":"stat.AP","authors_text":"Christoph Krafft, Claudia Beleites, J\\\"urgen Popp, Thomas Bocklitz, Ute Neugebauer","submitted_at":"2012-11-06T17:42:00Z","abstract_excerpt":"In biospectroscopy, suitably annotated and statistically independent samples (e. g. patients, batches, etc.) for classifier training and testing are scarce and costly. Learning curves show the model performance as function of the training sample size and can help to determine the sample size needed to train good classifiers. However, building a good model is actually not enough: the performance must also be proven. We discuss learning curves for typical small sample size situations with 5 - 25 independent samples per class. Although the classification models achieve acceptable performance, the"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1211.1323","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T02:17:12Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5BvjfVYclP4zxWSkQrQAF2kJzw3D2i47/QLS5BY1q/HnAcUcXVaGDnniTTy+2zTgtbZPRtzLJkve3yqr/u77CA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-06T10:52:26.779234Z"},"content_sha256":"92cd76dcb0ecfebb005890ba3597ce0ff1dc83e4729ce875fd73cbb2911b2b21","schema_version":"1.0","event_id":"sha256:92cd76dcb0ecfebb005890ba3597ce0ff1dc83e4729ce875fd73cbb2911b2b21"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/bundle.json","state_url":"https://pith.science/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-06T10:52:26Z","links":{"resolver":"https://pith.science/pith/VGVPBJYXVBPDNKZOLLFO22WIAW","bundle":"https://pith.science/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/bundle.json","state":"https://pith.science/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/VGVPBJYXVBPDNKZOLLFO22WIAW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2012:VGVPBJYXVBPDNKZOLLFO22WIAW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"dcae6dc7a353ab30027dd14b89b453d20bdb2c12b32501119220fa7874ad6de7","cross_cats_sorted":["stat.ME","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2012-11-06T17:42:00Z","title_canon_sha256":"dba2da7fe66e1eba707eaa026c0a1d9832197f9d7a19c72fbaa0ca3f5859e35b"},"schema_version":"1.0","source":{"id":"1211.1323","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1211.1323","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"arxiv_version","alias_value":"1211.1323v3","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1211.1323","created_at":"2026-05-18T02:17:12Z"},{"alias_kind":"pith_short_12","alias_value":"VGVPBJYXVBPD","created_at":"2026-05-18T12:27:25Z"},{"alias_kind":"pith_short_16","alias_value":"VGVPBJYXVBPDNKZO","created_at":"2026-05-18T12:27:25Z"},{"alias_kind":"pith_short_8","alias_value":"VGVPBJYX","created_at":"2026-05-18T12:27:25Z"}],"graph_snapshots":[{"event_id":"sha256:92cd76dcb0ecfebb005890ba3597ce0ff1dc83e4729ce875fd73cbb2911b2b21","target":"graph","created_at":"2026-05-18T02:17:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In biospectroscopy, suitably annotated and statistically independent samples (e. g. patients, batches, etc.) for classifier training and testing are scarce and costly. Learning curves show the model performance as function of the training sample size and can help to determine the sample size needed to train good classifiers. However, building a good model is actually not enough: the performance must also be proven. We discuss learning curves for typical small sample size situations with 5 - 25 independent samples per class. Although the classification models achieve acceptable performance, the","authors_text":"Christoph Krafft, Claudia Beleites, J\\\"urgen Popp, Thomas Bocklitz, Ute Neugebauer","cross_cats":["stat.ME","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2012-11-06T17:42:00Z","title":"Sample Size Planning for Classification Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1211.1323","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b70385981a7aa9596c83e7005543335492ff00a0eeccaabb84dd52792e77d55e","target":"record","created_at":"2026-05-18T02:17:12Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"dcae6dc7a353ab30027dd14b89b453d20bdb2c12b32501119220fa7874ad6de7","cross_cats_sorted":["stat.ME","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.AP","submitted_at":"2012-11-06T17:42:00Z","title_canon_sha256":"dba2da7fe66e1eba707eaa026c0a1d9832197f9d7a19c72fbaa0ca3f5859e35b"},"schema_version":"1.0","source":{"id":"1211.1323","kind":"arxiv","version":3}},"canonical_sha256":"a9aaf0a717a85e36ab2e5acaed6ac8058d801a69ec942ec098b02ea342245b78","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"a9aaf0a717a85e36ab2e5acaed6ac8058d801a69ec942ec098b02ea342245b78","first_computed_at":"2026-05-18T02:17:12.658879Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T02:17:12.658879Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"SHldM+TGX8rBKMMcnVlfAcOCbNt6WH4pxGUurRThXexF3HRTR3VbxScINH1c2xorbakt3HuROcn7Ib8iPYSHCw==","signature_status":"signed_v1","signed_at":"2026-05-18T02:17:12.659465Z","signed_message":"canonical_sha256_bytes"},"source_id":"1211.1323","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b70385981a7aa9596c83e7005543335492ff00a0eeccaabb84dd52792e77d55e","sha256:92cd76dcb0ecfebb005890ba3597ce0ff1dc83e4729ce875fd73cbb2911b2b21"],"state_sha256":"ac94aa89265d561af1b1675d7007fc94e4c4eab928f706a50838403566dc1d1c"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"V3Ygv+KtNcFWhFGVAKuxeHIoexe+a7qFWE8grdfykvhjqlbIyDqwuIsiGZKYADqt3P4apvtfKrJykyXvlYnlCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-06T10:52:26.783593Z","bundle_sha256":"05d6a2fa97dfea1279dc013cbc960e949bf77db1a8fa02b5c7ba28fdb06debeb"}}