{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:QICNPVM7LOOCUOR3ZSWHBXLCO5","short_pith_number":"pith:QICNPVM7","canonical_record":{"source":{"id":"2606.07709","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-05T12:57:12Z","cross_cats_sorted":[],"title_canon_sha256":"f6ff29574b57aaae330333cc45ae326e3f16ee01c3c7d29823e411e42dbc9103","abstract_canon_sha256":"12105b6940cfcdb2d6824e695adb49ec0db55349232c08a376baa9833d7edf82"},"schema_version":"1.0"},"canonical_sha256":"8204d7d59f5b9c2a3a3bccac70dd6277610ba7ca5dffcf6dd54bff5cc69ff85a","source":{"kind":"arxiv","id":"2606.07709","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07709","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07709v1","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07709","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_12","alias_value":"QICNPVM7LOOC","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_16","alias_value":"QICNPVM7LOOCUOR3","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_8","alias_value":"QICNPVM7","created_at":"2026-06-09T01:04:49Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:QICNPVM7LOOCUOR3ZSWHBXLCO5","target":"record","payload":{"canonical_record":{"source":{"id":"2606.07709","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-05T12:57:12Z","cross_cats_sorted":[],"title_canon_sha256":"f6ff29574b57aaae330333cc45ae326e3f16ee01c3c7d29823e411e42dbc9103","abstract_canon_sha256":"12105b6940cfcdb2d6824e695adb49ec0db55349232c08a376baa9833d7edf82"},"schema_version":"1.0"},"canonical_sha256":"8204d7d59f5b9c2a3a3bccac70dd6277610ba7ca5dffcf6dd54bff5cc69ff85a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-09T01:04:49.919187Z","signature_b64":"xxitEHstWqcIWxBdul2nQPRpbZCcQg1ZNIAueQ0yDu+KqDqi2H0DFEKCSfQNlfdsWsxh5kgwL7/NHaEzF1+VCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8204d7d59f5b9c2a3a3bccac70dd6277610ba7ca5dffcf6dd54bff5cc69ff85a","last_reissued_at":"2026-06-09T01:04:49.918627Z","signature_status":"signed_v1","first_computed_at":"2026-06-09T01:04:49.918627Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.07709","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:04:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"nRMzylxfKamD5uFZj4jQKL/dEFFV4DpRuOtNXgzYBSAHQfJSCD4icwi4drxvt4cCEf5zvhrBm/70pSFjmBANCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T12:31:18.914840Z"},"content_sha256":"34fa482cfa7216d9380d20228116ee329f043017ad658d123401b71870ade8d5","schema_version":"1.0","event_id":"sha256:34fa482cfa7216d9380d20228116ee329f043017ad658d123401b71870ade8d5"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:QICNPVM7LOOCUOR3ZSWHBXLCO5","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Are We Lost in the Woods? Detecting Silent Semantic Faults for Random Forest Classifiers with Data-informed Static Analysis","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.SE","authors_text":"Daniel Varro, Kristian Sandahl, Louis Ohl, Willem Meijer","submitted_at":"2026-06-05T12:57:12Z","abstract_excerpt":"While machine learning (ML) software necessitates effective quality assurance, ML engineers still encounter silent semantic faults, such as imbalanced datasets, that degrade prediction performance without apparent symptoms. These faults are typically detected after expensive training cycles, causing significant resource waste. We propose a data-informed static analysis technique to detect silent semantic faults in ML scripts that use the popular random forest classifier. Our approach extracts ML pipelines into directed acyclic graphs and evaluates them against formalized API contracts to detec"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07709","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.07709/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-09T01:04:49Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"SR8xS6WNMoR7hi4LDQuLhy1H1sV9aO6tv5YNLoatO1ycotWB62PxOmeWbaKwQfozXEQaAz1GoGT2CZ2eLNZCCg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T12:31:18.915229Z"},"content_sha256":"b3aa523b0e44abdfa51134570e6d4ced6b79ad189f594d5fbe98f99f20907647","schema_version":"1.0","event_id":"sha256:b3aa523b0e44abdfa51134570e6d4ced6b79ad189f594d5fbe98f99f20907647"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/bundle.json","state_url":"https://pith.science/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T12:31:18Z","links":{"resolver":"https://pith.science/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5","bundle":"https://pith.science/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/bundle.json","state":"https://pith.science/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QICNPVM7LOOCUOR3ZSWHBXLCO5/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:QICNPVM7LOOCUOR3ZSWHBXLCO5","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"12105b6940cfcdb2d6824e695adb49ec0db55349232c08a376baa9833d7edf82","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-05T12:57:12Z","title_canon_sha256":"f6ff29574b57aaae330333cc45ae326e3f16ee01c3c7d29823e411e42dbc9103"},"schema_version":"1.0","source":{"id":"2606.07709","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07709","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07709v1","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07709","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_12","alias_value":"QICNPVM7LOOC","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_16","alias_value":"QICNPVM7LOOCUOR3","created_at":"2026-06-09T01:04:49Z"},{"alias_kind":"pith_short_8","alias_value":"QICNPVM7","created_at":"2026-06-09T01:04:49Z"}],"graph_snapshots":[{"event_id":"sha256:b3aa523b0e44abdfa51134570e6d4ced6b79ad189f594d5fbe98f99f20907647","target":"graph","created_at":"2026-06-09T01:04:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.07709/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"While machine learning (ML) software necessitates effective quality assurance, ML engineers still encounter silent semantic faults, such as imbalanced datasets, that degrade prediction performance without apparent symptoms. These faults are typically detected after expensive training cycles, causing significant resource waste. We propose a data-informed static analysis technique to detect silent semantic faults in ML scripts that use the popular random forest classifier. Our approach extracts ML pipelines into directed acyclic graphs and evaluates them against formalized API contracts to detec","authors_text":"Daniel Varro, Kristian Sandahl, Louis Ohl, Willem Meijer","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-05T12:57:12Z","title":"Are We Lost in the Woods? Detecting Silent Semantic Faults for Random Forest Classifiers with Data-informed Static Analysis"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07709","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:34fa482cfa7216d9380d20228116ee329f043017ad658d123401b71870ade8d5","target":"record","created_at":"2026-06-09T01:04:49Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"12105b6940cfcdb2d6824e695adb49ec0db55349232c08a376baa9833d7edf82","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.SE","submitted_at":"2026-06-05T12:57:12Z","title_canon_sha256":"f6ff29574b57aaae330333cc45ae326e3f16ee01c3c7d29823e411e42dbc9103"},"schema_version":"1.0","source":{"id":"2606.07709","kind":"arxiv","version":1}},"canonical_sha256":"8204d7d59f5b9c2a3a3bccac70dd6277610ba7ca5dffcf6dd54bff5cc69ff85a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8204d7d59f5b9c2a3a3bccac70dd6277610ba7ca5dffcf6dd54bff5cc69ff85a","first_computed_at":"2026-06-09T01:04:49.918627Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-09T01:04:49.918627Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"xxitEHstWqcIWxBdul2nQPRpbZCcQg1ZNIAueQ0yDu+KqDqi2H0DFEKCSfQNlfdsWsxh5kgwL7/NHaEzF1+VCw==","signature_status":"signed_v1","signed_at":"2026-06-09T01:04:49.919187Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.07709","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:34fa482cfa7216d9380d20228116ee329f043017ad658d123401b71870ade8d5","sha256:b3aa523b0e44abdfa51134570e6d4ced6b79ad189f594d5fbe98f99f20907647"],"state_sha256":"c8a433e1c771a6069cf3046fd0d01259f281a0bdd57b94b3c485370f060ac0ed"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"CkytaWCXNPbq1+PAhijrbgVPC9dZFI4j1Fo+Va4meX5QdukpUu4TZUZDTQJynmIReWNfuEZeqFVaY9giRHdXCg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T12:31:18.917171Z","bundle_sha256":"17345fa0b6d3e5aec75855d83bf1605ade8aeae7769c66651756f88a73f9b25a"}}