{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:R5MGKV45LCYFSK2P64YFYFT5I6","short_pith_number":"pith:R5MGKV45","canonical_record":{"source":{"id":"1507.02973","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SI","submitted_at":"2015-07-10T17:15:10Z","cross_cats_sorted":[],"title_canon_sha256":"abb8cc9716a0886c953a3e822161938825e5168b51c80bec75cde0c39d34489a","abstract_canon_sha256":"44dc1e34b20324569cece8cb875748b4f7e521ed5517bca4b46ebe820e7e9454"},"schema_version":"1.0"},"canonical_sha256":"8f5865579d58b0592b4ff7305c167d47ac7180e70c73164f6e8cd12413050d7f","source":{"kind":"arxiv","id":"1507.02973","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1507.02973","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"arxiv_version","alias_value":"1507.02973v1","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1507.02973","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"pith_short_12","alias_value":"R5MGKV45LCYF","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"R5MGKV45LCYFSK2P","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"R5MGKV45","created_at":"2026-05-18T12:29:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:R5MGKV45LCYFSK2P64YFYFT5I6","target":"record","payload":{"canonical_record":{"source":{"id":"1507.02973","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SI","submitted_at":"2015-07-10T17:15:10Z","cross_cats_sorted":[],"title_canon_sha256":"abb8cc9716a0886c953a3e822161938825e5168b51c80bec75cde0c39d34489a","abstract_canon_sha256":"44dc1e34b20324569cece8cb875748b4f7e521ed5517bca4b46ebe820e7e9454"},"schema_version":"1.0"},"canonical_sha256":"8f5865579d58b0592b4ff7305c167d47ac7180e70c73164f6e8cd12413050d7f","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:58:35.299371Z","signature_b64":"mtybQWTfKFUxd4rKPRML9/+2wkgSsmXgDQ/fY8yBdo7SSzwM47sg8dNl0J2cS/DtQCbkyBVICyfmNSzTmFakDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8f5865579d58b0592b4ff7305c167d47ac7180e70c73164f6e8cd12413050d7f","last_reissued_at":"2026-05-18T00:58:35.298715Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:58:35.298715Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1507.02973","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:58:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5jE4jq/9YOXWgJm0IvdbxNCtRWgMHEW6SkoJzj7ybTCUFdQGxZNE4FT+mMqiXwkxaGOXfrkMjKEwgJIvLhk1BQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T22:24:51.339634Z"},"content_sha256":"b94e0da7bdadac80783f7e2dfbbac72339627ba6b1cc5be118221d4a2b54b605","schema_version":"1.0","event_id":"sha256:b94e0da7bdadac80783f7e2dfbbac72339627ba6b1cc5be118221d4a2b54b605"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:R5MGKV45LCYFSK2P64YFYFT5I6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Overcoming data scarcity of Twitter: using tweets as bootstrap with application to autism-related topic content analysis","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.SI","authors_text":"Adham Beykikhoshk, Dinh Phung, Ognjen Arandjelovic, Svetha Venkatesh","submitted_at":"2015-07-10T17:15:10Z","abstract_excerpt":"Notwithstanding recent work which has demonstrated the potential of using Twitter messages for content-specific data mining and analysis, the depth of such analysis is inherently limited by the scarcity of data imposed by the 140 character tweet limit. In this paper we describe a novel approach for targeted knowledge exploration which uses tweet content analysis as a preliminary step. This step is used to bootstrap more sophisticated data collection from directly related but much richer content sources. In particular we demonstrate that valuable information can be collected by following URLs i"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1507.02973","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:58:35Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"s40w0QvuaiogZ0E1fuEmCYM9quds9R3oYsH5WPnuC5MK+dhB42cKfESFDvtblguDPrE9rXHwyTkM5qDh9oAGAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-19T22:24:51.339978Z"},"content_sha256":"b40095961b2b95ab4222b70f5a45271765fa2720b22560e1374a3bac33817208","schema_version":"1.0","event_id":"sha256:b40095961b2b95ab4222b70f5a45271765fa2720b22560e1374a3bac33817208"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/R5MGKV45LCYFSK2P64YFYFT5I6/bundle.json","state_url":"https://pith.science/pith/R5MGKV45LCYFSK2P64YFYFT5I6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/R5MGKV45LCYFSK2P64YFYFT5I6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-19T22:24:51Z","links":{"resolver":"https://pith.science/pith/R5MGKV45LCYFSK2P64YFYFT5I6","bundle":"https://pith.science/pith/R5MGKV45LCYFSK2P64YFYFT5I6/bundle.json","state":"https://pith.science/pith/R5MGKV45LCYFSK2P64YFYFT5I6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/R5MGKV45LCYFSK2P64YFYFT5I6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:R5MGKV45LCYFSK2P64YFYFT5I6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"44dc1e34b20324569cece8cb875748b4f7e521ed5517bca4b46ebe820e7e9454","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SI","submitted_at":"2015-07-10T17:15:10Z","title_canon_sha256":"abb8cc9716a0886c953a3e822161938825e5168b51c80bec75cde0c39d34489a"},"schema_version":"1.0","source":{"id":"1507.02973","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1507.02973","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"arxiv_version","alias_value":"1507.02973v1","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1507.02973","created_at":"2026-05-18T00:58:35Z"},{"alias_kind":"pith_short_12","alias_value":"R5MGKV45LCYF","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"R5MGKV45LCYFSK2P","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"R5MGKV45","created_at":"2026-05-18T12:29:39Z"}],"graph_snapshots":[{"event_id":"sha256:b40095961b2b95ab4222b70f5a45271765fa2720b22560e1374a3bac33817208","target":"graph","created_at":"2026-05-18T00:58:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Notwithstanding recent work which has demonstrated the potential of using Twitter messages for content-specific data mining and analysis, the depth of such analysis is inherently limited by the scarcity of data imposed by the 140 character tweet limit. In this paper we describe a novel approach for targeted knowledge exploration which uses tweet content analysis as a preliminary step. This step is used to bootstrap more sophisticated data collection from directly related but much richer content sources. In particular we demonstrate that valuable information can be collected by following URLs i","authors_text":"Adham Beykikhoshk, Dinh Phung, Ognjen Arandjelovic, Svetha Venkatesh","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SI","submitted_at":"2015-07-10T17:15:10Z","title":"Overcoming data scarcity of Twitter: using tweets as bootstrap with application to autism-related topic content analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1507.02973","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b94e0da7bdadac80783f7e2dfbbac72339627ba6b1cc5be118221d4a2b54b605","target":"record","created_at":"2026-05-18T00:58:35Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"44dc1e34b20324569cece8cb875748b4f7e521ed5517bca4b46ebe820e7e9454","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SI","submitted_at":"2015-07-10T17:15:10Z","title_canon_sha256":"abb8cc9716a0886c953a3e822161938825e5168b51c80bec75cde0c39d34489a"},"schema_version":"1.0","source":{"id":"1507.02973","kind":"arxiv","version":1}},"canonical_sha256":"8f5865579d58b0592b4ff7305c167d47ac7180e70c73164f6e8cd12413050d7f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8f5865579d58b0592b4ff7305c167d47ac7180e70c73164f6e8cd12413050d7f","first_computed_at":"2026-05-18T00:58:35.298715Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:58:35.298715Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"mtybQWTfKFUxd4rKPRML9/+2wkgSsmXgDQ/fY8yBdo7SSzwM47sg8dNl0J2cS/DtQCbkyBVICyfmNSzTmFakDQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:58:35.299371Z","signed_message":"canonical_sha256_bytes"},"source_id":"1507.02973","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b94e0da7bdadac80783f7e2dfbbac72339627ba6b1cc5be118221d4a2b54b605","sha256:b40095961b2b95ab4222b70f5a45271765fa2720b22560e1374a3bac33817208"],"state_sha256":"36a41d83818090b3549fe6f8d020342b17d3fe8e8f41e4058d00eb47a1291766"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"TJECjOR2Kdj+NKP5mfXvR84bSiCiQxBV4cERJHo+wSa4p+/XKwtL6Kzb24xBoY86Ry/nc5iWykIlNyc/br0sDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-19T22:24:51.344115Z","bundle_sha256":"047f4e439698a25b28b9cbb5cf747a3153eb63f5ab784becd92b19297f0bb15b"}}