{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:BXANYMHYJB4QMRGVWH6X2MLJ3U","short_pith_number":"pith:BXANYMHY","canonical_record":{"source":{"id":"1508.01235","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-08-05T21:43:32Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"e8d0741d649e40cb498f362b38c55473fcfb58171090a2c2822138ebb5295663","abstract_canon_sha256":"9c5cb6bdf8c527b24597574fcd735ad1be17b6591537f7a174ec66b23a3ad06a"},"schema_version":"1.0"},"canonical_sha256":"0dc0dc30f848790644d5b1fd7d3169dd07e3f6316f69e6412d68e0e44a426ffc","source":{"kind":"arxiv","id":"1508.01235","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.01235","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"arxiv_version","alias_value":"1508.01235v2","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.01235","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"pith_short_12","alias_value":"BXANYMHYJB4Q","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_16","alias_value":"BXANYMHYJB4QMRGV","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_8","alias_value":"BXANYMHY","created_at":"2026-05-18T12:29:14Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:BXANYMHYJB4QMRGVWH6X2MLJ3U","target":"record","payload":{"canonical_record":{"source":{"id":"1508.01235","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-08-05T21:43:32Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"e8d0741d649e40cb498f362b38c55473fcfb58171090a2c2822138ebb5295663","abstract_canon_sha256":"9c5cb6bdf8c527b24597574fcd735ad1be17b6591537f7a174ec66b23a3ad06a"},"schema_version":"1.0"},"canonical_sha256":"0dc0dc30f848790644d5b1fd7d3169dd07e3f6316f69e6412d68e0e44a426ffc","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:51:59.273140Z","signature_b64":"HqmJllX5EdbVSS1zufOdg76iisK6LZKFt9LVRIcqAu3VaPPwKdEhEB84u66yaRqNjqTB/6aVBJhEghT1v1DpAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0dc0dc30f848790644d5b1fd7d3169dd07e3f6316f69e6412d68e0e44a426ffc","last_reissued_at":"2026-05-17T23:51:59.272538Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:51:59.272538Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1508.01235","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:51:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xEue+/eD9vhmBFTZxhpBOxZbmSRBaL3m84X+GRxlAVTEkVtCYrE7DP1LEry5U9sAu6c4A9Xonvgd+heqNyTfAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T10:43:34.357086Z"},"content_sha256":"672a0397588459a4823601c089f4a40108df031c4e7a75df0b69d596c7beb012","schema_version":"1.0","event_id":"sha256:672a0397588459a4823601c089f4a40108df031c4e7a75df0b69d596c7beb012"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:BXANYMHYJB4QMRGVWH6X2MLJ3U","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Empirical Similarity for Absent Data Generation in Imbalanced Classification","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"stat.ML","authors_text":"Arash Pourhabib","submitted_at":"2015-08-05T21:43:32Z","abstract_excerpt":"When the training data in a two-class classification problem is overwhelmed by one class, most classification techniques fail to correctly identify the data points belonging to the underrepresented class. We propose Similarity-based Imbalanced Classification (SBIC) that learns patterns in the training data based on an empirical similarity function. To take the imbalanced structure of the training data into account, SBIC utilizes the concept of absent data, i.e. data from the minority class which can help better find the boundary between the two classes. SBIC simultaneously optimizes the weight"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.01235","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:51:59Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WV3wFO1K884m+PpXHFfqrACCSQVXJjv/jcOCKs7Pb0SDkgmHwdTc91vzJDckNHqC10ax+Y9nrdf7qpTFHrzsDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-12T10:43:34.357457Z"},"content_sha256":"51dfc93e9e00441ec2781fb642237cee7e3d5a41797341f5316c112bc729a270","schema_version":"1.0","event_id":"sha256:51dfc93e9e00441ec2781fb642237cee7e3d5a41797341f5316c112bc729a270"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/bundle.json","state_url":"https://pith.science/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-12T10:43:34Z","links":{"resolver":"https://pith.science/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U","bundle":"https://pith.science/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/bundle.json","state":"https://pith.science/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BXANYMHYJB4QMRGVWH6X2MLJ3U/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:BXANYMHYJB4QMRGVWH6X2MLJ3U","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"9c5cb6bdf8c527b24597574fcd735ad1be17b6591537f7a174ec66b23a3ad06a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-08-05T21:43:32Z","title_canon_sha256":"e8d0741d649e40cb498f362b38c55473fcfb58171090a2c2822138ebb5295663"},"schema_version":"1.0","source":{"id":"1508.01235","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1508.01235","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"arxiv_version","alias_value":"1508.01235v2","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1508.01235","created_at":"2026-05-17T23:51:59Z"},{"alias_kind":"pith_short_12","alias_value":"BXANYMHYJB4Q","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_16","alias_value":"BXANYMHYJB4QMRGV","created_at":"2026-05-18T12:29:14Z"},{"alias_kind":"pith_short_8","alias_value":"BXANYMHY","created_at":"2026-05-18T12:29:14Z"}],"graph_snapshots":[{"event_id":"sha256:51dfc93e9e00441ec2781fb642237cee7e3d5a41797341f5316c112bc729a270","target":"graph","created_at":"2026-05-17T23:51:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"When the training data in a two-class classification problem is overwhelmed by one class, most classification techniques fail to correctly identify the data points belonging to the underrepresented class. We propose Similarity-based Imbalanced Classification (SBIC) that learns patterns in the training data based on an empirical similarity function. To take the imbalanced structure of the training data into account, SBIC utilizes the concept of absent data, i.e. data from the minority class which can help better find the boundary between the two classes. SBIC simultaneously optimizes the weight","authors_text":"Arash Pourhabib","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-08-05T21:43:32Z","title":"Empirical Similarity for Absent Data Generation in Imbalanced Classification"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1508.01235","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:672a0397588459a4823601c089f4a40108df031c4e7a75df0b69d596c7beb012","target":"record","created_at":"2026-05-17T23:51:59Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"9c5cb6bdf8c527b24597574fcd735ad1be17b6591537f7a174ec66b23a3ad06a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2015-08-05T21:43:32Z","title_canon_sha256":"e8d0741d649e40cb498f362b38c55473fcfb58171090a2c2822138ebb5295663"},"schema_version":"1.0","source":{"id":"1508.01235","kind":"arxiv","version":2}},"canonical_sha256":"0dc0dc30f848790644d5b1fd7d3169dd07e3f6316f69e6412d68e0e44a426ffc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0dc0dc30f848790644d5b1fd7d3169dd07e3f6316f69e6412d68e0e44a426ffc","first_computed_at":"2026-05-17T23:51:59.272538Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:51:59.272538Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"HqmJllX5EdbVSS1zufOdg76iisK6LZKFt9LVRIcqAu3VaPPwKdEhEB84u66yaRqNjqTB/6aVBJhEghT1v1DpAg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:51:59.273140Z","signed_message":"canonical_sha256_bytes"},"source_id":"1508.01235","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:672a0397588459a4823601c089f4a40108df031c4e7a75df0b69d596c7beb012","sha256:51dfc93e9e00441ec2781fb642237cee7e3d5a41797341f5316c112bc729a270"],"state_sha256":"9f80ebbafb31ceb2c0516a30629ad74ae8b7ac4710caf5bee50753b469c0da44"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"TTp83lSg/Uo07+F/pSZwoKwp5PRTkQIxCyHMmt18P54i/oTQ8GCcuFGEk6I25KyUF53O6WGKBVMWU+a7e+zxAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-12T10:43:34.359947Z","bundle_sha256":"534fd2a02e90692126f816fe266980c2fa4d554e8f4f7846eeaea12204e1b132"}}