{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:BX2PLQIVACABFDH4V6ZPFZNZGQ","short_pith_number":"pith:BX2PLQIV","schema_version":"1.0","canonical_sha256":"0df4f5c1150080128cfcafb2f2e5b9342f1a9ae893dee69f938cb9b0d722f207","source":{"kind":"arxiv","id":"1806.03255","version":2},"attestation_state":"computed","paper":{"title":"Automatically Generating a Large, Culture-Specific Blocklist for China","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.NI"],"primary_cat":"cs.CY","authors_text":"Austin Hounsel, Nick Feamster, Prateek Mittal","submitted_at":"2018-06-04T20:58:09Z","abstract_excerpt":"Internet censorship measurements rely on lists of websites to be tested, or \"block lists\" that are curated by third parties. Unfortunately, many of these lists are not public, and those that are tend to focus on a small group of topics, leaving other types of sites and services untested. To increase and diversify the set of sites on existing block lists, we use natural language processing and search engines to automatically discover a much wider range of websites that are censored in China. Using these techniques, we create a list of 1125 websites outside the Alexa Top 1,000 that cover Chinese"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1806.03255","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CY","submitted_at":"2018-06-04T20:58:09Z","cross_cats_sorted":["cs.NI"],"title_canon_sha256":"364f649579aa9a647880c5de91b9fa63df9f435018ac58cceb8470b14767a2c5","abstract_canon_sha256":"b4c9a4402ed64b22375bda8eb5e29b452abf64c4427a2cd4a770f8344d6a0dfd"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:10:21.665922Z","signature_b64":"VdrySu0VJDplU5KFFQsPpc2kjeFxOiqhgj1zbeNo/OaZszosFbVjhrag86IcV67fzMzU6g8fxNbOa/6+q2qpBw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0df4f5c1150080128cfcafb2f2e5b9342f1a9ae893dee69f938cb9b0d722f207","last_reissued_at":"2026-05-18T00:10:21.665238Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:10:21.665238Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Automatically Generating a Large, Culture-Specific Blocklist for China","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.NI"],"primary_cat":"cs.CY","authors_text":"Austin Hounsel, Nick Feamster, Prateek Mittal","submitted_at":"2018-06-04T20:58:09Z","abstract_excerpt":"Internet censorship measurements rely on lists of websites to be tested, or \"block lists\" that are curated by third parties. Unfortunately, many of these lists are not public, and those that are tend to focus on a small group of topics, leaving other types of sites and services untested. To increase and diversify the set of sites on existing block lists, we use natural language processing and search engines to automatically discover a much wider range of websites that are censored in China. Using these techniques, we create a list of 1125 websites outside the Alexa Top 1,000 that cover Chinese"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1806.03255","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1806.03255","created_at":"2026-05-18T00:10:21.665355+00:00"},{"alias_kind":"arxiv_version","alias_value":"1806.03255v2","created_at":"2026-05-18T00:10:21.665355+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1806.03255","created_at":"2026-05-18T00:10:21.665355+00:00"},{"alias_kind":"pith_short_12","alias_value":"BX2PLQIVACAB","created_at":"2026-05-18T12:32:16.446611+00:00"},{"alias_kind":"pith_short_16","alias_value":"BX2PLQIVACABFDH4","created_at":"2026-05-18T12:32:16.446611+00:00"},{"alias_kind":"pith_short_8","alias_value":"BX2PLQIV","created_at":"2026-05-18T12:32:16.446611+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ","json":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ.json","graph_json":"https://pith.science/api/pith-number/BX2PLQIVACABFDH4V6ZPFZNZGQ/graph.json","events_json":"https://pith.science/api/pith-number/BX2PLQIVACABFDH4V6ZPFZNZGQ/events.json","paper":"https://pith.science/paper/BX2PLQIV"},"agent_actions":{"view_html":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ","download_json":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ.json","view_paper":"https://pith.science/paper/BX2PLQIV","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1806.03255&json=true","fetch_graph":"https://pith.science/api/pith-number/BX2PLQIVACABFDH4V6ZPFZNZGQ/graph.json","fetch_events":"https://pith.science/api/pith-number/BX2PLQIVACABFDH4V6ZPFZNZGQ/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ/action/timestamp_anchor","attest_storage":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ/action/storage_attestation","attest_author":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ/action/author_attestation","sign_citation":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ/action/citation_signature","submit_replication":"https://pith.science/pith/BX2PLQIVACABFDH4V6ZPFZNZGQ/action/replication_record"}},"created_at":"2026-05-18T00:10:21.665355+00:00","updated_at":"2026-05-18T00:10:21.665355+00:00"}