{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2013:RLULMYP45U45QQWFIDXNOUXLJ6","short_pith_number":"pith:RLULMYP4","schema_version":"1.0","canonical_sha256":"8ae8b661fced39d842c540eed752eb4f88fd826273da89a2f0e07355f61b6ab7","source":{"kind":"arxiv","id":"1308.1479","version":2},"attestation_state":"computed","paper":{"title":"Challenges of Big Data Analysis","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"stat.ML","authors_text":"Fang Han, Han Liu, Jianqing Fan","submitted_at":"2013-08-07T05:09:33Z","abstract_excerpt":"Big Data bring new opportunities to modern society and challenges to data scientists. On one hand, Big Data hold great promises for discovering subtle population patterns and heterogeneities that are not possible with small-scale data. On the other hand, the massive sample size and high dimensionality of Big Data introduce unique computational and statistical challenges, including scalability and storage bottleneck, noise accumulation, spurious correlation, incidental endogeneity, and measurement errors. These challenges are distinguished and require new computational and statistical paradigm."},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1308.1479","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2013-08-07T05:09:33Z","cross_cats_sorted":[],"title_canon_sha256":"66185dfe9fbaf050cab652dfeb4440578eac5f0580ef1967fbb4918402e4d994","abstract_canon_sha256":"0b53d3a0cf659db0b32c46988630ee4e4fc83436b012fe477411dc40c3d9a7f5"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T02:31:21.671736Z","signature_b64":"VRE4nsu1D0HVte2U/whEmQ2Q8Z1tgZ1JZVU1Uj5qCERrcTzgpdJH1xqaU6t7hzVanyj+FmnU4XfVxUrV/32ODQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8ae8b661fced39d842c540eed752eb4f88fd826273da89a2f0e07355f61b6ab7","last_reissued_at":"2026-05-18T02:31:21.671083Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T02:31:21.671083Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Challenges of Big Data Analysis","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"stat.ML","authors_text":"Fang Han, Han Liu, Jianqing Fan","submitted_at":"2013-08-07T05:09:33Z","abstract_excerpt":"Big Data bring new opportunities to modern society and challenges to data scientists. On one hand, Big Data hold great promises for discovering subtle population patterns and heterogeneities that are not possible with small-scale data. On the other hand, the massive sample size and high dimensionality of Big Data introduce unique computational and statistical challenges, including scalability and storage bottleneck, noise accumulation, spurious correlation, incidental endogeneity, and measurement errors. These challenges are distinguished and require new computational and statistical paradigm."},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1308.1479","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1308.1479","created_at":"2026-05-18T02:31:21.671176+00:00"},{"alias_kind":"arxiv_version","alias_value":"1308.1479v2","created_at":"2026-05-18T02:31:21.671176+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1308.1479","created_at":"2026-05-18T02:31:21.671176+00:00"},{"alias_kind":"pith_short_12","alias_value":"RLULMYP45U45","created_at":"2026-05-18T12:27:59.945178+00:00"},{"alias_kind":"pith_short_16","alias_value":"RLULMYP45U45QQWF","created_at":"2026-05-18T12:27:59.945178+00:00"},{"alias_kind":"pith_short_8","alias_value":"RLULMYP4","created_at":"2026-05-18T12:27:59.945178+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6","json":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6.json","graph_json":"https://pith.science/api/pith-number/RLULMYP45U45QQWFIDXNOUXLJ6/graph.json","events_json":"https://pith.science/api/pith-number/RLULMYP45U45QQWFIDXNOUXLJ6/events.json","paper":"https://pith.science/paper/RLULMYP4"},"agent_actions":{"view_html":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6","download_json":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6.json","view_paper":"https://pith.science/paper/RLULMYP4","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1308.1479&json=true","fetch_graph":"https://pith.science/api/pith-number/RLULMYP45U45QQWFIDXNOUXLJ6/graph.json","fetch_events":"https://pith.science/api/pith-number/RLULMYP45U45QQWFIDXNOUXLJ6/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6/action/timestamp_anchor","attest_storage":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6/action/storage_attestation","attest_author":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6/action/author_attestation","sign_citation":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6/action/citation_signature","submit_replication":"https://pith.science/pith/RLULMYP45U45QQWFIDXNOUXLJ6/action/replication_record"}},"created_at":"2026-05-18T02:31:21.671176+00:00","updated_at":"2026-05-18T02:31:21.671176+00:00"}