{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:4QIIEA3TRCRJDBAVNCTKJN4IPJ","short_pith_number":"pith:4QIIEA3T","canonical_record":{"source":{"id":"1803.04579","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-03-12T23:59:37Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"db7372b1aa5d2a89b92e1a855f86ef8163789f3e2c74fa42d97fd0f5f9d7a72e","abstract_canon_sha256":"edd22cc1691058a51d5b668745fffdc4094dc20e161be9991cb54cfe784f52d6"},"schema_version":"1.0"},"canonical_sha256":"e41082037388a291841568a6a4b7887a69f9ca1cf42cc92df839a0ed7830efb4","source":{"kind":"arxiv","id":"1803.04579","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.04579","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"arxiv_version","alias_value":"1803.04579v1","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.04579","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"pith_short_12","alias_value":"4QIIEA3TRCRJ","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"4QIIEA3TRCRJDBAV","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"4QIIEA3T","created_at":"2026-05-18T12:32:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:4QIIEA3TRCRJDBAVNCTKJN4IPJ","target":"record","payload":{"canonical_record":{"source":{"id":"1803.04579","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-03-12T23:59:37Z","cross_cats_sorted":["cs.CL"],"title_canon_sha256":"db7372b1aa5d2a89b92e1a855f86ef8163789f3e2c74fa42d97fd0f5f9d7a72e","abstract_canon_sha256":"edd22cc1691058a51d5b668745fffdc4094dc20e161be9991cb54cfe784f52d6"},"schema_version":"1.0"},"canonical_sha256":"e41082037388a291841568a6a4b7887a69f9ca1cf42cc92df839a0ed7830efb4","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:21:18.611218Z","signature_b64":"VtLvdM0Ib9GniSofC3WTrmVYptAOrPY0Yenx5zFss8O0OKgSk0MfbXrMqZypFifZfsQxUYgXD16UJ9rJTgffDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e41082037388a291841568a6a4b7887a69f9ca1cf42cc92df839a0ed7830efb4","last_reissued_at":"2026-05-18T00:21:18.610797Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:21:18.610797Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.04579","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Aje2ovPEM2/4Q7wXE2pN75Eh94WRYaRQqDIDvYRQllzeUgf8x5SXvlyDF2dUjomAbyEHQMNrnycKCj7WLo47DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T22:56:53.566690Z"},"content_sha256":"9a7624c07b8b47bd451aa95befd836b5a2fe99bb01c44953459f9690cfeb07d0","schema_version":"1.0","event_id":"sha256:9a7624c07b8b47bd451aa95befd836b5a2fe99bb01c44953459f9690cfeb07d0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:4QIIEA3TRCRJDBAVNCTKJN4IPJ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"It was the training data pruning too!","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.CL"],"primary_cat":"cs.LG","authors_text":"Ankur Taly, Kedar Dhamdhere, Mukund Sundararajan, Pramod Kaushik Mudrakarta","submitted_at":"2018-03-12T23:59:37Z","abstract_excerpt":"We study the current best model (KDG) for question answering on tabular data evaluated over the WikiTableQuestions dataset. Previous ablation studies performed against this model attributed the model's performance to certain aspects of its architecture. In this paper, we find that the model's performance also crucially depends on a certain pruning of the data used to train the model. Disabling the pruning step drops the accuracy of the model from 43.3% to 36.3%. The large impact on the performance of the KDG model suggests that the pruning may be a useful pre-processing step in training other "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.04579","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:21:18Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YlH2tHOyc+Qb5Q57+OOpi5wdwF9EnhvLQR0/bAufyqzjMG6JMwZl2bWZe1SCBRQkDwktxiMx1C+NXyT3+FpPDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T22:56:53.567374Z"},"content_sha256":"680cb827640d5f5a419d6bd477eebcbdceb960a765e619c765433f7082c048e6","schema_version":"1.0","event_id":"sha256:680cb827640d5f5a419d6bd477eebcbdceb960a765e619c765433f7082c048e6"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/bundle.json","state_url":"https://pith.science/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T22:56:53Z","links":{"resolver":"https://pith.science/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ","bundle":"https://pith.science/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/bundle.json","state":"https://pith.science/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4QIIEA3TRCRJDBAVNCTKJN4IPJ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:4QIIEA3TRCRJDBAVNCTKJN4IPJ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"edd22cc1691058a51d5b668745fffdc4094dc20e161be9991cb54cfe784f52d6","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-03-12T23:59:37Z","title_canon_sha256":"db7372b1aa5d2a89b92e1a855f86ef8163789f3e2c74fa42d97fd0f5f9d7a72e"},"schema_version":"1.0","source":{"id":"1803.04579","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.04579","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"arxiv_version","alias_value":"1803.04579v1","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.04579","created_at":"2026-05-18T00:21:18Z"},{"alias_kind":"pith_short_12","alias_value":"4QIIEA3TRCRJ","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_16","alias_value":"4QIIEA3TRCRJDBAV","created_at":"2026-05-18T12:32:05Z"},{"alias_kind":"pith_short_8","alias_value":"4QIIEA3T","created_at":"2026-05-18T12:32:05Z"}],"graph_snapshots":[{"event_id":"sha256:680cb827640d5f5a419d6bd477eebcbdceb960a765e619c765433f7082c048e6","target":"graph","created_at":"2026-05-18T00:21:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We study the current best model (KDG) for question answering on tabular data evaluated over the WikiTableQuestions dataset. Previous ablation studies performed against this model attributed the model's performance to certain aspects of its architecture. In this paper, we find that the model's performance also crucially depends on a certain pruning of the data used to train the model. Disabling the pruning step drops the accuracy of the model from 43.3% to 36.3%. The large impact on the performance of the KDG model suggests that the pruning may be a useful pre-processing step in training other ","authors_text":"Ankur Taly, Kedar Dhamdhere, Mukund Sundararajan, Pramod Kaushik Mudrakarta","cross_cats":["cs.CL"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-03-12T23:59:37Z","title":"It was the training data pruning too!"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.04579","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:9a7624c07b8b47bd451aa95befd836b5a2fe99bb01c44953459f9690cfeb07d0","target":"record","created_at":"2026-05-18T00:21:18Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"edd22cc1691058a51d5b668745fffdc4094dc20e161be9991cb54cfe784f52d6","cross_cats_sorted":["cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-03-12T23:59:37Z","title_canon_sha256":"db7372b1aa5d2a89b92e1a855f86ef8163789f3e2c74fa42d97fd0f5f9d7a72e"},"schema_version":"1.0","source":{"id":"1803.04579","kind":"arxiv","version":1}},"canonical_sha256":"e41082037388a291841568a6a4b7887a69f9ca1cf42cc92df839a0ed7830efb4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e41082037388a291841568a6a4b7887a69f9ca1cf42cc92df839a0ed7830efb4","first_computed_at":"2026-05-18T00:21:18.610797Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:21:18.610797Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"VtLvdM0Ib9GniSofC3WTrmVYptAOrPY0Yenx5zFss8O0OKgSk0MfbXrMqZypFifZfsQxUYgXD16UJ9rJTgffDw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:21:18.611218Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.04579","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:9a7624c07b8b47bd451aa95befd836b5a2fe99bb01c44953459f9690cfeb07d0","sha256:680cb827640d5f5a419d6bd477eebcbdceb960a765e619c765433f7082c048e6"],"state_sha256":"e67706666ffea3bdff4d2e1c7e4985e9717c32934837a9611a72911558faf578"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"pc4GKjOjaCJhK/gMec87vULcgC57oosoUr97fs4YJXPp+5WPkazUJt4Bh5RCFRDqf1sgmhcg6AOBmAgm0DaRAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T22:56:53.571285Z","bundle_sha256":"14da3ab698b8792d5953a06fedaf8dcb09104380c46d676d15d9581b9aff7028"}}