{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:TIFORWAOBXCG2RXROBDAECGF4E","short_pith_number":"pith:TIFORWAO","schema_version":"1.0","canonical_sha256":"9a0ae8d80e0dc46d46f170460208c5e1041e6ab65a10f3ec877fb803404ce2bb","source":{"kind":"arxiv","id":"1612.01734","version":3},"attestation_state":"computed","paper":{"title":"Do we really need to catch them all? A new User-guided Social Media Crawling method","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.SI","authors_text":"Fredrik Erlandsson, Henric Johnson, Martin Boldt, Piotr Br\\'odka","submitted_at":"2016-12-06T10:22:00Z","abstract_excerpt":"With the growing use of popular social media services like Facebook and Twitter it is challenging to collect all content from the networks without access to the core infrastructure or paying for it. Thus, if all content cannot be collected one must consider which data are of most importance. In this work we present a novel User-guided Social Media Crawling method (USMC) that is able to collect data from social media, utilizing the wisdom of the crowd to decide the order in which user generated content should be collected to cover as many user interactions as possible. USMC is validated by craw"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1612.01734","kind":"arxiv","version":3},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SI","submitted_at":"2016-12-06T10:22:00Z","cross_cats_sorted":[],"title_canon_sha256":"34f8f3b4da141cbf09d3cee52e990ef3922adefb6bb3a5c0ad6cac01eb4b958e","abstract_canon_sha256":"c01c50c07e187d45f7f55d5bac894fa96878320d70d3946fa8a287b3abbda10b"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:28:02.577135Z","signature_b64":"csMsk2Ye2ivRA4vIoVAlSgww5bCmMVW9mkX+89CGc2rs8FifeR5iZ8bbj2btGIpgU6F9F1x96aH6z/rXRfwXAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9a0ae8d80e0dc46d46f170460208c5e1041e6ab65a10f3ec877fb803404ce2bb","last_reissued_at":"2026-05-18T00:28:02.576520Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:28:02.576520Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Do we really need to catch them all? A new User-guided Social Media Crawling method","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.SI","authors_text":"Fredrik Erlandsson, Henric Johnson, Martin Boldt, Piotr Br\\'odka","submitted_at":"2016-12-06T10:22:00Z","abstract_excerpt":"With the growing use of popular social media services like Facebook and Twitter it is challenging to collect all content from the networks without access to the core infrastructure or paying for it. Thus, if all content cannot be collected one must consider which data are of most importance. In this work we present a novel User-guided Social Media Crawling method (USMC) that is able to collect data from social media, utilizing the wisdom of the crowd to decide the order in which user generated content should be collected to cover as many user interactions as possible. USMC is validated by craw"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1612.01734","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1612.01734","created_at":"2026-05-18T00:28:02.576613+00:00"},{"alias_kind":"arxiv_version","alias_value":"1612.01734v3","created_at":"2026-05-18T00:28:02.576613+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1612.01734","created_at":"2026-05-18T00:28:02.576613+00:00"},{"alias_kind":"pith_short_12","alias_value":"TIFORWAOBXCG","created_at":"2026-05-18T12:30:44.179134+00:00"},{"alias_kind":"pith_short_16","alias_value":"TIFORWAOBXCG2RXR","created_at":"2026-05-18T12:30:44.179134+00:00"},{"alias_kind":"pith_short_8","alias_value":"TIFORWAO","created_at":"2026-05-18T12:30:44.179134+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E","json":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E.json","graph_json":"https://pith.science/api/pith-number/TIFORWAOBXCG2RXROBDAECGF4E/graph.json","events_json":"https://pith.science/api/pith-number/TIFORWAOBXCG2RXROBDAECGF4E/events.json","paper":"https://pith.science/paper/TIFORWAO"},"agent_actions":{"view_html":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E","download_json":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E.json","view_paper":"https://pith.science/paper/TIFORWAO","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1612.01734&json=true","fetch_graph":"https://pith.science/api/pith-number/TIFORWAOBXCG2RXROBDAECGF4E/graph.json","fetch_events":"https://pith.science/api/pith-number/TIFORWAOBXCG2RXROBDAECGF4E/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E/action/timestamp_anchor","attest_storage":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E/action/storage_attestation","attest_author":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E/action/author_attestation","sign_citation":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E/action/citation_signature","submit_replication":"https://pith.science/pith/TIFORWAOBXCG2RXROBDAECGF4E/action/replication_record"}},"created_at":"2026-05-18T00:28:02.576613+00:00","updated_at":"2026-05-18T00:28:02.576613+00:00"}