{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:7I43PKGGLOCROQZ3AAP56CEKUZ","short_pith_number":"pith:7I43PKGG","canonical_record":{"source":{"id":"1608.00104","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-07-30T11:53:04Z","cross_cats_sorted":["cs.CL","cs.IR"],"title_canon_sha256":"94650b2c491227137d0c60d7dab1d8b43b5a7c73143265b38e984917191be631","abstract_canon_sha256":"a9cab3ab1e1918eaa3bbb8dccab1e8d43a497419d5f85fe58c90fe02768c8968"},"schema_version":"1.0"},"canonical_sha256":"fa39b7a8c65b8517433b001fdf088aa67bb146d695868a964bfcce5491e60882","source":{"kind":"arxiv","id":"1608.00104","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1608.00104","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"arxiv_version","alias_value":"1608.00104v1","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1608.00104","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"pith_short_12","alias_value":"7I43PKGGLOCR","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_16","alias_value":"7I43PKGGLOCROQZ3","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_8","alias_value":"7I43PKGG","created_at":"2026-05-18T12:30:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:7I43PKGGLOCROQZ3AAP56CEKUZ","target":"record","payload":{"canonical_record":{"source":{"id":"1608.00104","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-07-30T11:53:04Z","cross_cats_sorted":["cs.CL","cs.IR"],"title_canon_sha256":"94650b2c491227137d0c60d7dab1d8b43b5a7c73143265b38e984917191be631","abstract_canon_sha256":"a9cab3ab1e1918eaa3bbb8dccab1e8d43a497419d5f85fe58c90fe02768c8968"},"schema_version":"1.0"},"canonical_sha256":"fa39b7a8c65b8517433b001fdf088aa67bb146d695868a964bfcce5491e60882","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:10:13.814151Z","signature_b64":"pshJqnidsc4npztrGFmXFt16JjSDATHjz24lwMTo//c0r7E9c2WYmH1oWMS8QxszU8HxZSitVXpkeV78qwHHBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"fa39b7a8c65b8517433b001fdf088aa67bb146d695868a964bfcce5491e60882","last_reissued_at":"2026-05-18T01:10:13.813621Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:10:13.813621Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1608.00104","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:10:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"q1ZpTU5wRz0DBHa0jwcC5asnlitj20UBC1Tav1A9crNlPBzT9f+shVmNWWoRk5d/YhSnasgWlaivAFiCS6gxBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:22:21.912301Z"},"content_sha256":"87282dbcb353e5435c65cbc2fef32a51cc07362d57d257a45d9be3e2f24732d4","schema_version":"1.0","event_id":"sha256:87282dbcb353e5435c65cbc2fef32a51cc07362d57d257a45d9be3e2f24732d4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:7I43PKGGLOCROQZ3AAP56CEKUZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"World Knowledge as Indirect Supervision for Document Clustering","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL","cs.IR"],"primary_cat":"cs.LG","authors_text":"Chenguang Wang, Dan Roth, Jiawei Han, Ming Zhang, Yangqiu Song","submitted_at":"2016-07-30T11:53:04Z","abstract_excerpt":"One of the key obstacles in making learning protocols realistic in applications is the need to supervise them, a costly process that often requires hiring domain experts. We consider the framework to use the world knowledge as indirect supervision. World knowledge is general-purpose knowledge, which is not designed for any specific domain. Then the key challenges are how to adapt the world knowledge to domains and how to represent it for learning. In this paper, we provide an example of using world knowledge for domain dependent document clustering. We provide three ways to specify the world k"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1608.00104","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:10:13Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5pt8pj+e/01meaLeX7wyIZv4DU6DPR+atnIUJEBIEi01vjksg1hHzmVuRMXyF04OodhPnKJPHJJZHpABvkamAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:22:21.913088Z"},"content_sha256":"3c7bc2c8220ff847b782519736609dc5bc9e3aa935ca6034793a93bc76a57fdd","schema_version":"1.0","event_id":"sha256:3c7bc2c8220ff847b782519736609dc5bc9e3aa935ca6034793a93bc76a57fdd"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/bundle.json","state_url":"https://pith.science/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T20:22:21Z","links":{"resolver":"https://pith.science/pith/7I43PKGGLOCROQZ3AAP56CEKUZ","bundle":"https://pith.science/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/bundle.json","state":"https://pith.science/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/7I43PKGGLOCROQZ3AAP56CEKUZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:7I43PKGGLOCROQZ3AAP56CEKUZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a9cab3ab1e1918eaa3bbb8dccab1e8d43a497419d5f85fe58c90fe02768c8968","cross_cats_sorted":["cs.CL","cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-07-30T11:53:04Z","title_canon_sha256":"94650b2c491227137d0c60d7dab1d8b43b5a7c73143265b38e984917191be631"},"schema_version":"1.0","source":{"id":"1608.00104","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1608.00104","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"arxiv_version","alias_value":"1608.00104v1","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1608.00104","created_at":"2026-05-18T01:10:13Z"},{"alias_kind":"pith_short_12","alias_value":"7I43PKGGLOCR","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_16","alias_value":"7I43PKGGLOCROQZ3","created_at":"2026-05-18T12:30:04Z"},{"alias_kind":"pith_short_8","alias_value":"7I43PKGG","created_at":"2026-05-18T12:30:04Z"}],"graph_snapshots":[{"event_id":"sha256:3c7bc2c8220ff847b782519736609dc5bc9e3aa935ca6034793a93bc76a57fdd","target":"graph","created_at":"2026-05-18T01:10:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"One of the key obstacles in making learning protocols realistic in applications is the need to supervise them, a costly process that often requires hiring domain experts. We consider the framework to use the world knowledge as indirect supervision. World knowledge is general-purpose knowledge, which is not designed for any specific domain. Then the key challenges are how to adapt the world knowledge to domains and how to represent it for learning. In this paper, we provide an example of using world knowledge for domain dependent document clustering. We provide three ways to specify the world k","authors_text":"Chenguang Wang, Dan Roth, Jiawei Han, Ming Zhang, Yangqiu Song","cross_cats":["cs.CL","cs.IR"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-07-30T11:53:04Z","title":"World Knowledge as Indirect Supervision for Document Clustering"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1608.00104","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:87282dbcb353e5435c65cbc2fef32a51cc07362d57d257a45d9be3e2f24732d4","target":"record","created_at":"2026-05-18T01:10:13Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a9cab3ab1e1918eaa3bbb8dccab1e8d43a497419d5f85fe58c90fe02768c8968","cross_cats_sorted":["cs.CL","cs.IR"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-07-30T11:53:04Z","title_canon_sha256":"94650b2c491227137d0c60d7dab1d8b43b5a7c73143265b38e984917191be631"},"schema_version":"1.0","source":{"id":"1608.00104","kind":"arxiv","version":1}},"canonical_sha256":"fa39b7a8c65b8517433b001fdf088aa67bb146d695868a964bfcce5491e60882","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"fa39b7a8c65b8517433b001fdf088aa67bb146d695868a964bfcce5491e60882","first_computed_at":"2026-05-18T01:10:13.813621Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:10:13.813621Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"pshJqnidsc4npztrGFmXFt16JjSDATHjz24lwMTo//c0r7E9c2WYmH1oWMS8QxszU8HxZSitVXpkeV78qwHHBw==","signature_status":"signed_v1","signed_at":"2026-05-18T01:10:13.814151Z","signed_message":"canonical_sha256_bytes"},"source_id":"1608.00104","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:87282dbcb353e5435c65cbc2fef32a51cc07362d57d257a45d9be3e2f24732d4","sha256:3c7bc2c8220ff847b782519736609dc5bc9e3aa935ca6034793a93bc76a57fdd"],"state_sha256":"27425d4673702e032b5a771439e835adf951594f56d64b064a53a4093ed1c5ea"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"sv5+0pmJ37BzhPciRDJJ4EUQFdBx5xJlt4DmnaiUCIzLBiRYIhn8HjPosZlzAzfqgvnyHoMM4q/adbvw9Q6yBQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T20:22:21.917310Z","bundle_sha256":"9fd037848ddcb19d82ec26ee2f560a7bccfee43d4ff2d587f3e44f3aec4d2492"}}