{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2018:WOQ42FXZ5ASOG625VADAMMCG3M","short_pith_number":"pith:WOQ42FXZ","schema_version":"1.0","canonical_sha256":"b3a1cd16f9e824e37b5da806063046db10c9a58bdb12310b65e9eb74fb485792","source":{"kind":"arxiv","id":"1810.04996","version":1},"attestation_state":"computed","paper":{"title":"A Simple Way to Deal with Cherry-picking","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"stat.ME","authors_text":"Junpei Komiyama, Takanori Maehara","submitted_at":"2018-10-11T13:06:48Z","abstract_excerpt":"Statistical hypothesis testing serves as statistical evidence for scientific innovation. However, if the reported results are intentionally biased, hypothesis testing no longer controls the rate of false discovery. In particular, we study such selection bias in machine learning models where the reporter is motivated to promote an algorithmic innovation. When the number of possible configurations (e.g., datasets) is large, we show that the reporter can falsely report an innovation even if there is no improvement at all. We propose a `post-reporting' solution to this issue where the bias of the "},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1810.04996","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ME","submitted_at":"2018-10-11T13:06:48Z","cross_cats_sorted":["cs.LG","stat.ML"],"title_canon_sha256":"d591b296008e3131d5acd37d7e061829b82711ab955e7959f6bab5f91a1896dc","abstract_canon_sha256":"f8c3df6841477cb3d187bcf14670b1b7523b26e949aaa9627e399dc35d6546e6"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:03:35.323228Z","signature_b64":"3iv38O2yRzVMstHa+lyNdfxI9404veY02H2hS2345AHOQHIOrsQe7g+5hseRF6AeaqqAXHx7693kKFma/+7mAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"b3a1cd16f9e824e37b5da806063046db10c9a58bdb12310b65e9eb74fb485792","last_reissued_at":"2026-05-18T00:03:35.322593Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:03:35.322593Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"A Simple Way to Deal with Cherry-picking","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","stat.ML"],"primary_cat":"stat.ME","authors_text":"Junpei Komiyama, Takanori Maehara","submitted_at":"2018-10-11T13:06:48Z","abstract_excerpt":"Statistical hypothesis testing serves as statistical evidence for scientific innovation. However, if the reported results are intentionally biased, hypothesis testing no longer controls the rate of false discovery. In particular, we study such selection bias in machine learning models where the reporter is motivated to promote an algorithmic innovation. When the number of possible configurations (e.g., datasets) is large, we show that the reporter can falsely report an innovation even if there is no improvement at all. We propose a `post-reporting' solution to this issue where the bias of the "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.04996","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1810.04996","created_at":"2026-05-18T00:03:35.322701+00:00"},{"alias_kind":"arxiv_version","alias_value":"1810.04996v1","created_at":"2026-05-18T00:03:35.322701+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.04996","created_at":"2026-05-18T00:03:35.322701+00:00"},{"alias_kind":"pith_short_12","alias_value":"WOQ42FXZ5ASO","created_at":"2026-05-18T12:33:01.666342+00:00"},{"alias_kind":"pith_short_16","alias_value":"WOQ42FXZ5ASOG625","created_at":"2026-05-18T12:33:01.666342+00:00"},{"alias_kind":"pith_short_8","alias_value":"WOQ42FXZ","created_at":"2026-05-18T12:33:01.666342+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M","json":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M.json","graph_json":"https://pith.science/api/pith-number/WOQ42FXZ5ASOG625VADAMMCG3M/graph.json","events_json":"https://pith.science/api/pith-number/WOQ42FXZ5ASOG625VADAMMCG3M/events.json","paper":"https://pith.science/paper/WOQ42FXZ"},"agent_actions":{"view_html":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M","download_json":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M.json","view_paper":"https://pith.science/paper/WOQ42FXZ","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1810.04996&json=true","fetch_graph":"https://pith.science/api/pith-number/WOQ42FXZ5ASOG625VADAMMCG3M/graph.json","fetch_events":"https://pith.science/api/pith-number/WOQ42FXZ5ASOG625VADAMMCG3M/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M/action/timestamp_anchor","attest_storage":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M/action/storage_attestation","attest_author":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M/action/author_attestation","sign_citation":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M/action/citation_signature","submit_replication":"https://pith.science/pith/WOQ42FXZ5ASOG625VADAMMCG3M/action/replication_record"}},"created_at":"2026-05-18T00:03:35.322701+00:00","updated_at":"2026-05-18T00:03:35.322701+00:00"}