{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:J6PLYUFKBHESMKQMHPOCU76Q2U","short_pith_number":"pith:J6PLYUFK","canonical_record":{"source":{"id":"1604.04007","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-14T01:29:52Z","cross_cats_sorted":[],"title_canon_sha256":"dd6b011cf1ca8e65ba0023cb8051990a3f9d4fd981c113a6f0835acde3996682","abstract_canon_sha256":"df4365e127f62ae5ca745d469e0fa8d0af07681ea871a90f1ba02e844cfef761"},"schema_version":"1.0"},"canonical_sha256":"4f9ebc50aa09c9262a0c3bdc2a7fd0d50e8bff1dc3abec33c5b16cd21aea6b17","source":{"kind":"arxiv","id":"1604.04007","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.04007","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"arxiv_version","alias_value":"1604.04007v1","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.04007","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"pith_short_12","alias_value":"J6PLYUFKBHES","created_at":"2026-05-18T12:30:22Z"},{"alias_kind":"pith_short_16","alias_value":"J6PLYUFKBHESMKQM","created_at":"2026-05-18T12:30:22Z"},{"alias_kind":"pith_short_8","alias_value":"J6PLYUFK","created_at":"2026-05-18T12:30:22Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:J6PLYUFKBHESMKQMHPOCU76Q2U","target":"record","payload":{"canonical_record":{"source":{"id":"1604.04007","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-14T01:29:52Z","cross_cats_sorted":[],"title_canon_sha256":"dd6b011cf1ca8e65ba0023cb8051990a3f9d4fd981c113a6f0835acde3996682","abstract_canon_sha256":"df4365e127f62ae5ca745d469e0fa8d0af07681ea871a90f1ba02e844cfef761"},"schema_version":"1.0"},"canonical_sha256":"4f9ebc50aa09c9262a0c3bdc2a7fd0d50e8bff1dc3abec33c5b16cd21aea6b17","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:17:06.957578Z","signature_b64":"8JrXoOPrS2WACO9KHC6Mn3357DMvwGaE/4BR6/qMgNyKcwImHYQ5jn1LW2+evfAkGBCG2Y1TVp/mNaz5H5T+Dg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4f9ebc50aa09c9262a0c3bdc2a7fd0d50e8bff1dc3abec33c5b16cd21aea6b17","last_reissued_at":"2026-05-18T01:17:06.956934Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:17:06.956934Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1604.04007","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:17:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"cr65FsNYoAH/H27EOiSLtvVIdyvFpi+KQaBnyaVGc/xhqus3Kv1SBE04eqLUGjLJxWLWqTBaYu+a9eZ3WGc6Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T02:32:04.739685Z"},"content_sha256":"ffbb7c558357ce5aba87f7062b897d4e54a969b79d7487e91d345dc0d6eb5915","schema_version":"1.0","event_id":"sha256:ffbb7c558357ce5aba87f7062b897d4e54a969b79d7487e91d345dc0d6eb5915"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:J6PLYUFKBHESMKQMHPOCU76Q2U","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Balancing Between Over-Weighting and Under-Weighting in Supervised Term Weighting","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Haibing Wu, Xiaodong Gu","submitted_at":"2016-04-14T01:29:52Z","abstract_excerpt":"Supervised term weighting could improve the performance of text categorization. A way proven to be effective is to give more weight to terms with more imbalanced distributions across categories. This paper shows that supervised term weighting should not just assign large weights to imbalanced terms, but should also control the trade-off between over-weighting and under-weighting. Over-weighting, a new concept proposed in this paper, is caused by the improper handling of singular terms and too large ratios between term weights. To prevent over-weighting, we present three regularization techniqu"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.04007","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:17:06Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"270VtUlRrxWlLVSaSEAAzM22kJKhTsskTE9/+m90e1z0fgOeN0oiGcxiaMquI/ZKLUn4LAYawvCY7UeuZIK5DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-31T02:32:04.740324Z"},"content_sha256":"194a9a351347553fd2eb5822ccc624ce6e0b021687cc7a287cf5c56ebd84db3d","schema_version":"1.0","event_id":"sha256:194a9a351347553fd2eb5822ccc624ce6e0b021687cc7a287cf5c56ebd84db3d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/bundle.json","state_url":"https://pith.science/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-31T02:32:04Z","links":{"resolver":"https://pith.science/pith/J6PLYUFKBHESMKQMHPOCU76Q2U","bundle":"https://pith.science/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/bundle.json","state":"https://pith.science/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/state.json","well_known_bundle":"https://pith.science/.well-known/pith/J6PLYUFKBHESMKQMHPOCU76Q2U/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:J6PLYUFKBHESMKQMHPOCU76Q2U","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"df4365e127f62ae5ca745d469e0fa8d0af07681ea871a90f1ba02e844cfef761","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-14T01:29:52Z","title_canon_sha256":"dd6b011cf1ca8e65ba0023cb8051990a3f9d4fd981c113a6f0835acde3996682"},"schema_version":"1.0","source":{"id":"1604.04007","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1604.04007","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"arxiv_version","alias_value":"1604.04007v1","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1604.04007","created_at":"2026-05-18T01:17:06Z"},{"alias_kind":"pith_short_12","alias_value":"J6PLYUFKBHES","created_at":"2026-05-18T12:30:22Z"},{"alias_kind":"pith_short_16","alias_value":"J6PLYUFKBHESMKQM","created_at":"2026-05-18T12:30:22Z"},{"alias_kind":"pith_short_8","alias_value":"J6PLYUFK","created_at":"2026-05-18T12:30:22Z"}],"graph_snapshots":[{"event_id":"sha256:194a9a351347553fd2eb5822ccc624ce6e0b021687cc7a287cf5c56ebd84db3d","target":"graph","created_at":"2026-05-18T01:17:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Supervised term weighting could improve the performance of text categorization. A way proven to be effective is to give more weight to terms with more imbalanced distributions across categories. This paper shows that supervised term weighting should not just assign large weights to imbalanced terms, but should also control the trade-off between over-weighting and under-weighting. Over-weighting, a new concept proposed in this paper, is caused by the improper handling of singular terms and too large ratios between term weights. To prevent over-weighting, we present three regularization techniqu","authors_text":"Haibing Wu, Xiaodong Gu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-14T01:29:52Z","title":"Balancing Between Over-Weighting and Under-Weighting in Supervised Term Weighting"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1604.04007","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ffbb7c558357ce5aba87f7062b897d4e54a969b79d7487e91d345dc0d6eb5915","target":"record","created_at":"2026-05-18T01:17:06Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"df4365e127f62ae5ca745d469e0fa8d0af07681ea871a90f1ba02e844cfef761","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2016-04-14T01:29:52Z","title_canon_sha256":"dd6b011cf1ca8e65ba0023cb8051990a3f9d4fd981c113a6f0835acde3996682"},"schema_version":"1.0","source":{"id":"1604.04007","kind":"arxiv","version":1}},"canonical_sha256":"4f9ebc50aa09c9262a0c3bdc2a7fd0d50e8bff1dc3abec33c5b16cd21aea6b17","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4f9ebc50aa09c9262a0c3bdc2a7fd0d50e8bff1dc3abec33c5b16cd21aea6b17","first_computed_at":"2026-05-18T01:17:06.956934Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:17:06.956934Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"8JrXoOPrS2WACO9KHC6Mn3357DMvwGaE/4BR6/qMgNyKcwImHYQ5jn1LW2+evfAkGBCG2Y1TVp/mNaz5H5T+Dg==","signature_status":"signed_v1","signed_at":"2026-05-18T01:17:06.957578Z","signed_message":"canonical_sha256_bytes"},"source_id":"1604.04007","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ffbb7c558357ce5aba87f7062b897d4e54a969b79d7487e91d345dc0d6eb5915","sha256:194a9a351347553fd2eb5822ccc624ce6e0b021687cc7a287cf5c56ebd84db3d"],"state_sha256":"98d986609b130526cab4e48f99c444f5fbc190f8d9fb2285a57596fb3801b9f1"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QFiTEU/qNjmJ7wKjjQvNWnwGOPSUV4KxO0KeV/pOyHW0/aU2zdjabTLUqijpx5ncu0ikfwLE2FUGw1S7b/XMDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-31T02:32:04.742884Z","bundle_sha256":"5020429474ddb9ee55f249c42f776a6335f655851072e4910dab2d1cc5348baa"}}