{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:NXEPO3L6E47DSHDXA5HHUJRGCV","short_pith_number":"pith:NXEPO3L6","canonical_record":{"source":{"id":"1611.05923","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-11-17T22:23:08Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c47b1286f66526e0074f25a3dede11f6e6076a61c5fbe3fb48eeda110085731e","abstract_canon_sha256":"016cf41a11c250650fd2acf5e2f42842892a4b7833a5a622b44899b47a16622a"},"schema_version":"1.0"},"canonical_sha256":"6dc8f76d7e273e391c77074e7a26261567877366c4cb4aa25b0b3309e5e356d1","source":{"kind":"arxiv","id":"1611.05923","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.05923","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"arxiv_version","alias_value":"1611.05923v3","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.05923","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"pith_short_12","alias_value":"NXEPO3L6E47D","created_at":"2026-05-18T12:30:36Z"},{"alias_kind":"pith_short_16","alias_value":"NXEPO3L6E47DSHDX","created_at":"2026-05-18T12:30:36Z"},{"alias_kind":"pith_short_8","alias_value":"NXEPO3L6","created_at":"2026-05-18T12:30:36Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:NXEPO3L6E47DSHDXA5HHUJRGCV","target":"record","payload":{"canonical_record":{"source":{"id":"1611.05923","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-11-17T22:23:08Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"c47b1286f66526e0074f25a3dede11f6e6076a61c5fbe3fb48eeda110085731e","abstract_canon_sha256":"016cf41a11c250650fd2acf5e2f42842892a4b7833a5a622b44899b47a16622a"},"schema_version":"1.0"},"canonical_sha256":"6dc8f76d7e273e391c77074e7a26261567877366c4cb4aa25b0b3309e5e356d1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:44:45.825980Z","signature_b64":"+XY6MH6JnxgmPoqZqS7sABnVMPpYkE6DDBBuLjNxU9T5oR9tNWz02kUezczq1tNjE0sXMi+yX64K8vneI2c+Bg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"6dc8f76d7e273e391c77074e7a26261567877366c4cb4aa25b0b3309e5e356d1","last_reissued_at":"2026-05-18T00:44:45.825483Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:44:45.825483Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1611.05923","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RlYob4Ge6Y+Tv0+v7YWvtRirZzUghCB3jUsXe00C/Dvr9IBjIAUjJ8kduLbqEB/k4dO42r5+KBd9cgorLUmlAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:25:29.501659Z"},"content_sha256":"7e8aaa4780958a890b387b0efe05ec46b146d8c0a12c319107f535cbbb655c36","schema_version":"1.0","event_id":"sha256:7e8aaa4780958a890b387b0efe05ec46b146d8c0a12c319107f535cbbb655c36"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:NXEPO3L6E47DSHDXA5HHUJRGCV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"\"Influence Sketching\": Finding Influential Samples In Large-Scale Regressions","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"stat.ML","authors_text":"Ben Cruz, Brian Wallace, Caleb Crable, Jay Luan, Matt Wolff, Mike Wojnowicz, Xuan Zhao","submitted_at":"2016-11-17T22:23:08Z","abstract_excerpt":"There is an especially strong need in modern large-scale data analysis to prioritize samples for manual inspection. For example, the inspection could target important mislabeled samples or key vulnerabilities exploitable by an adversarial attack. In order to solve the \"needle in the haystack\" problem of which samples to inspect, we develop a new scalable version of Cook's distance, a classical statistical technique for identifying samples which unusually strongly impact the fit of a regression model (and its downstream predictions). In order to scale this technique up to very large and high-di"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.05923","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:44:45Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"QJ76DlTXaEMoz6aN22CnY2eTRbnITwiWY/g6So3qk9k9BlTiVqbjcbvi821RlE+UHqCzDlmEJSoGc3gZJ8RMCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T01:25:29.502005Z"},"content_sha256":"0358cba21479ed1e19caaa58964c7c1dff0880c2d205b6cfe4fd2b62546c18ab","schema_version":"1.0","event_id":"sha256:0358cba21479ed1e19caaa58964c7c1dff0880c2d205b6cfe4fd2b62546c18ab"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/bundle.json","state_url":"https://pith.science/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T01:25:29Z","links":{"resolver":"https://pith.science/pith/NXEPO3L6E47DSHDXA5HHUJRGCV","bundle":"https://pith.science/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/bundle.json","state":"https://pith.science/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/NXEPO3L6E47DSHDXA5HHUJRGCV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:NXEPO3L6E47DSHDXA5HHUJRGCV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"016cf41a11c250650fd2acf5e2f42842892a4b7833a5a622b44899b47a16622a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-11-17T22:23:08Z","title_canon_sha256":"c47b1286f66526e0074f25a3dede11f6e6076a61c5fbe3fb48eeda110085731e"},"schema_version":"1.0","source":{"id":"1611.05923","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.05923","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"arxiv_version","alias_value":"1611.05923v3","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.05923","created_at":"2026-05-18T00:44:45Z"},{"alias_kind":"pith_short_12","alias_value":"NXEPO3L6E47D","created_at":"2026-05-18T12:30:36Z"},{"alias_kind":"pith_short_16","alias_value":"NXEPO3L6E47DSHDX","created_at":"2026-05-18T12:30:36Z"},{"alias_kind":"pith_short_8","alias_value":"NXEPO3L6","created_at":"2026-05-18T12:30:36Z"}],"graph_snapshots":[{"event_id":"sha256:0358cba21479ed1e19caaa58964c7c1dff0880c2d205b6cfe4fd2b62546c18ab","target":"graph","created_at":"2026-05-18T00:44:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"There is an especially strong need in modern large-scale data analysis to prioritize samples for manual inspection. For example, the inspection could target important mislabeled samples or key vulnerabilities exploitable by an adversarial attack. In order to solve the \"needle in the haystack\" problem of which samples to inspect, we develop a new scalable version of Cook's distance, a classical statistical technique for identifying samples which unusually strongly impact the fit of a regression model (and its downstream predictions). In order to scale this technique up to very large and high-di","authors_text":"Ben Cruz, Brian Wallace, Caleb Crable, Jay Luan, Matt Wolff, Mike Wojnowicz, Xuan Zhao","cross_cats":["cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-11-17T22:23:08Z","title":"\"Influence Sketching\": Finding Influential Samples In Large-Scale Regressions"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.05923","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7e8aaa4780958a890b387b0efe05ec46b146d8c0a12c319107f535cbbb655c36","target":"record","created_at":"2026-05-18T00:44:45Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"016cf41a11c250650fd2acf5e2f42842892a4b7833a5a622b44899b47a16622a","cross_cats_sorted":["cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2016-11-17T22:23:08Z","title_canon_sha256":"c47b1286f66526e0074f25a3dede11f6e6076a61c5fbe3fb48eeda110085731e"},"schema_version":"1.0","source":{"id":"1611.05923","kind":"arxiv","version":3}},"canonical_sha256":"6dc8f76d7e273e391c77074e7a26261567877366c4cb4aa25b0b3309e5e356d1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"6dc8f76d7e273e391c77074e7a26261567877366c4cb4aa25b0b3309e5e356d1","first_computed_at":"2026-05-18T00:44:45.825483Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:44:45.825483Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"+XY6MH6JnxgmPoqZqS7sABnVMPpYkE6DDBBuLjNxU9T5oR9tNWz02kUezczq1tNjE0sXMi+yX64K8vneI2c+Bg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:44:45.825980Z","signed_message":"canonical_sha256_bytes"},"source_id":"1611.05923","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7e8aaa4780958a890b387b0efe05ec46b146d8c0a12c319107f535cbbb655c36","sha256:0358cba21479ed1e19caaa58964c7c1dff0880c2d205b6cfe4fd2b62546c18ab"],"state_sha256":"3ae14df3390d867c0398e2c73922d09045552dd96c7b3fc1d971281ed4125298"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"BPSo4c2PLXgCUR3ME7eFEuLD3LJ7bpTun19ncacjhquNC3y76I5O9/90rzYjPomqPKlCnAOK2bBnlyd5KQEpCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T01:25:29.504002Z","bundle_sha256":"28878728df8326867752da08579864bef7b58b8fbe0e21c084c20b23f3063042"}}