{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2019:VHM32ULWCRLLIM5RAQWD7ABNV2","short_pith_number":"pith:VHM32ULW","schema_version":"1.0","canonical_sha256":"a9d9bd51761456b433b1042c3f802daebbe2f989a9bbf81a196466d7b7260584","source":{"kind":"arxiv","id":"1906.12125","version":1},"attestation_state":"computed","paper":{"title":"High-dimensional principal component analysis with heterogeneous missingness","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.ST","stat.TH"],"primary_cat":"stat.ME","authors_text":"Richard J. Samworth, Tengyao Wang, Ziwei Zhu","submitted_at":"2019-06-28T10:37:16Z","abstract_excerpt":"We study the problem of high-dimensional Principal Component Analysis (PCA) with missing observations. In simple, homogeneous missingness settings with a noise level of constant order, we show that an existing inverse-probability weighted (IPW) estimator of the leading principal components can (nearly) attain the minimax optimal rate of convergence. However, deeper investigation reveals both that, particularly in more realistic settings where the missingness mechanism is heterogeneous, the empirical performance of the IPW estimator can be unsatisfactory, and moreover that, in the noiseless cas"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1906.12125","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2019-06-28T10:37:16Z","cross_cats_sorted":["math.ST","stat.TH"],"title_canon_sha256":"7c988e86d355054323a7006becb369552a01df0fffce76a9dbf1a616612cb92f","abstract_canon_sha256":"8819028fd607bce2414827528185c975bcfccc4727ff9c7d40aa086060a66053"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:41:59.221287Z","signature_b64":"G5DRL0yEKc5+zNW3y0FdTjaOc4DhOIGjefR7mkhWlPGf3KkAj0WltqH8+39KBSA4w+PxoCft1hkbKCQF3REPCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"a9d9bd51761456b433b1042c3f802daebbe2f989a9bbf81a196466d7b7260584","last_reissued_at":"2026-05-17T23:41:59.220927Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:41:59.220927Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"High-dimensional principal component analysis with heterogeneous missingness","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["math.ST","stat.TH"],"primary_cat":"stat.ME","authors_text":"Richard J. Samworth, Tengyao Wang, Ziwei Zhu","submitted_at":"2019-06-28T10:37:16Z","abstract_excerpt":"We study the problem of high-dimensional Principal Component Analysis (PCA) with missing observations. In simple, homogeneous missingness settings with a noise level of constant order, we show that an existing inverse-probability weighted (IPW) estimator of the leading principal components can (nearly) attain the minimax optimal rate of convergence. However, deeper investigation reveals both that, particularly in more realistic settings where the missingness mechanism is heterogeneous, the empirical performance of the IPW estimator can be unsatisfactory, and moreover that, in the noiseless cas"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1906.12125","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1906.12125","created_at":"2026-05-17T23:41:59.220987+00:00"},{"alias_kind":"arxiv_version","alias_value":"1906.12125v1","created_at":"2026-05-17T23:41:59.220987+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1906.12125","created_at":"2026-05-17T23:41:59.220987+00:00"},{"alias_kind":"pith_short_12","alias_value":"VHM32ULWCRLL","created_at":"2026-05-18T12:33:30.264802+00:00"},{"alias_kind":"pith_short_16","alias_value":"VHM32ULWCRLLIM5R","created_at":"2026-05-18T12:33:30.264802+00:00"},{"alias_kind":"pith_short_8","alias_value":"VHM32ULW","created_at":"2026-05-18T12:33:30.264802+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2","json":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2.json","graph_json":"https://pith.science/api/pith-number/VHM32ULWCRLLIM5RAQWD7ABNV2/graph.json","events_json":"https://pith.science/api/pith-number/VHM32ULWCRLLIM5RAQWD7ABNV2/events.json","paper":"https://pith.science/paper/VHM32ULW"},"agent_actions":{"view_html":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2","download_json":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2.json","view_paper":"https://pith.science/paper/VHM32ULW","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1906.12125&json=true","fetch_graph":"https://pith.science/api/pith-number/VHM32ULWCRLLIM5RAQWD7ABNV2/graph.json","fetch_events":"https://pith.science/api/pith-number/VHM32ULWCRLLIM5RAQWD7ABNV2/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2/action/timestamp_anchor","attest_storage":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2/action/storage_attestation","attest_author":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2/action/author_attestation","sign_citation":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2/action/citation_signature","submit_replication":"https://pith.science/pith/VHM32ULWCRLLIM5RAQWD7ABNV2/action/replication_record"}},"created_at":"2026-05-17T23:41:59.220987+00:00","updated_at":"2026-05-17T23:41:59.220987+00:00"}