{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2012:INPP5C37RYCFB6B5ZSFSJ7XOPR","short_pith_number":"pith:INPP5C37","schema_version":"1.0","canonical_sha256":"435efe8b7f8e0450f83dcc8b24feee7c745aa4b2110771266ffe3d3c9a8f5bde","source":{"kind":"arxiv","id":"1208.2873","version":1},"attestation_state":"computed","paper":{"title":"Detecting Events and Patterns in Large-Scale User Generated Textual Streams with Statistical Learning Methods","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":["cs.CL","cs.IR","cs.SI","stat.AP","stat.ML"],"primary_cat":"cs.LG","authors_text":"Vasileios Lampos","submitted_at":"2012-08-13T18:59:54Z","abstract_excerpt":"A vast amount of textual web streams is influenced by events or phenomena emerging in the real world. The social web forms an excellent modern paradigm, where unstructured user generated content is published on a regular basis and in most occasions is freely distributed. The present Ph.D. Thesis deals with the problem of inferring information - or patterns in general - about events emerging in real life based on the contents of this textual stream. We show that it is possible to extract valuable information about social phenomena, such as an epidemic or even rainfall rates, by automatic analys"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1208.2873","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","primary_cat":"cs.LG","submitted_at":"2012-08-13T18:59:54Z","cross_cats_sorted":["cs.CL","cs.IR","cs.SI","stat.AP","stat.ML"],"title_canon_sha256":"e96c21f4839bb45be80d9823d49f7d0c2e76dcc550594ebdd72c916e54969b77","abstract_canon_sha256":"16ed11003fe48b47f1eed01c1086b86a040f570c5493b345a799e57adc3dd5e9"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:48:46.989108Z","signature_b64":"7gfBOcD0ZqFCNpKVfbPgHQkRodCUdfbg0nKm59Y4hcIDNYXyTnnRJChXEgzoX6p1Woo6N9USpIsubl3KvR0iBg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"435efe8b7f8e0450f83dcc8b24feee7c745aa4b2110771266ffe3d3c9a8f5bde","last_reissued_at":"2026-05-18T03:48:46.988601Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:48:46.988601Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Detecting Events and Patterns in Large-Scale User Generated Textual Streams with Statistical Learning Methods","license":"http://creativecommons.org/licenses/by-nc-sa/3.0/","headline":"","cross_cats":["cs.CL","cs.IR","cs.SI","stat.AP","stat.ML"],"primary_cat":"cs.LG","authors_text":"Vasileios Lampos","submitted_at":"2012-08-13T18:59:54Z","abstract_excerpt":"A vast amount of textual web streams is influenced by events or phenomena emerging in the real world. The social web forms an excellent modern paradigm, where unstructured user generated content is published on a regular basis and in most occasions is freely distributed. The present Ph.D. Thesis deals with the problem of inferring information - or patterns in general - about events emerging in real life based on the contents of this textual stream. We show that it is possible to extract valuable information about social phenomena, such as an epidemic or even rainfall rates, by automatic analys"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1208.2873","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1208.2873","created_at":"2026-05-18T03:48:46.988678+00:00"},{"alias_kind":"arxiv_version","alias_value":"1208.2873v1","created_at":"2026-05-18T03:48:46.988678+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1208.2873","created_at":"2026-05-18T03:48:46.988678+00:00"},{"alias_kind":"pith_short_12","alias_value":"INPP5C37RYCF","created_at":"2026-05-18T12:27:09.501522+00:00"},{"alias_kind":"pith_short_16","alias_value":"INPP5C37RYCFB6B5","created_at":"2026-05-18T12:27:09.501522+00:00"},{"alias_kind":"pith_short_8","alias_value":"INPP5C37","created_at":"2026-05-18T12:27:09.501522+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR","json":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR.json","graph_json":"https://pith.science/api/pith-number/INPP5C37RYCFB6B5ZSFSJ7XOPR/graph.json","events_json":"https://pith.science/api/pith-number/INPP5C37RYCFB6B5ZSFSJ7XOPR/events.json","paper":"https://pith.science/paper/INPP5C37"},"agent_actions":{"view_html":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR","download_json":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR.json","view_paper":"https://pith.science/paper/INPP5C37","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1208.2873&json=true","fetch_graph":"https://pith.science/api/pith-number/INPP5C37RYCFB6B5ZSFSJ7XOPR/graph.json","fetch_events":"https://pith.science/api/pith-number/INPP5C37RYCFB6B5ZSFSJ7XOPR/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR/action/timestamp_anchor","attest_storage":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR/action/storage_attestation","attest_author":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR/action/author_attestation","sign_citation":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR/action/citation_signature","submit_replication":"https://pith.science/pith/INPP5C37RYCFB6B5ZSFSJ7XOPR/action/replication_record"}},"created_at":"2026-05-18T03:48:46.988678+00:00","updated_at":"2026-05-18T03:48:46.988678+00:00"}