{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:ZLZYVCVVQ34H3NO7YFXTVMSMZX","short_pith_number":"pith:ZLZYVCVV","schema_version":"1.0","canonical_sha256":"caf38a8ab586f87db5dfc16f3ab24ccdd374cbc7ae671cb68dee38cd138b1614","source":{"kind":"arxiv","id":"2606.24968","version":1},"attestation_state":"computed","paper":{"title":"Training Dynamics of Neural Software Defect Predictors under Coupled Data-Quality Issues","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Emmanuel Charleson Dapaah, Jens Grabowski, Philip Makedonski","submitted_at":"2026-06-23T10:08:55Z","abstract_excerpt":"Context: Software defect prediction supports maintenance decisions such as testing prioritization, release-risk assessment, and quality monitoring. However, metric-based SDP datasets often contain coupled data-quality issues, especially class imbalance and class overlap. Prior work has mainly measured their impact through endpoint performance, while recent evidence suggests that such issues may also appear in neural training dynamics (gradients, weights, biases, error trajectories). However, these studies examine issues in isolation, leaving open how internal neural network training patterns m"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.24968","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-06-23T10:08:55Z","cross_cats_sorted":[],"title_canon_sha256":"cf4b2bb9d04deaaa112c1d5aff1d26ade9170ef5e966a3ea9660ba186c868247","abstract_canon_sha256":"bb4c9d935b9d8b6620c45e8563d203da16da60056b64dc42f7bf046c222ef1ca"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-25T00:17:47.138847Z","signature_b64":"Oz2bxM/1jJi0gDEYwwsyTjfEK1JTi8KlUQWSt6arYJNh+Blv/p+9+B9Z1hajpu8mhVcGKHselL0NiUxx9y64AQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"caf38a8ab586f87db5dfc16f3ab24ccdd374cbc7ae671cb68dee38cd138b1614","last_reissued_at":"2026-06-25T00:17:47.138443Z","signature_status":"signed_v1","first_computed_at":"2026-06-25T00:17:47.138443Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Training Dynamics of Neural Software Defect Predictors under Coupled Data-Quality Issues","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Emmanuel Charleson Dapaah, Jens Grabowski, Philip Makedonski","submitted_at":"2026-06-23T10:08:55Z","abstract_excerpt":"Context: Software defect prediction supports maintenance decisions such as testing prioritization, release-risk assessment, and quality monitoring. However, metric-based SDP datasets often contain coupled data-quality issues, especially class imbalance and class overlap. Prior work has mainly measured their impact through endpoint performance, while recent evidence suggests that such issues may also appear in neural training dynamics (gradients, weights, biases, error trajectories). However, these studies examine issues in isolation, leaving open how internal neural network training patterns m"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.24968","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.24968/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.24968","created_at":"2026-06-25T00:17:47.138507+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.24968v1","created_at":"2026-06-25T00:17:47.138507+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.24968","created_at":"2026-06-25T00:17:47.138507+00:00"},{"alias_kind":"pith_short_12","alias_value":"ZLZYVCVVQ34H","created_at":"2026-06-25T00:17:47.138507+00:00"},{"alias_kind":"pith_short_16","alias_value":"ZLZYVCVVQ34H3NO7","created_at":"2026-06-25T00:17:47.138507+00:00"},{"alias_kind":"pith_short_8","alias_value":"ZLZYVCVV","created_at":"2026-06-25T00:17:47.138507+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX","json":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX.json","graph_json":"https://pith.science/api/pith-number/ZLZYVCVVQ34H3NO7YFXTVMSMZX/graph.json","events_json":"https://pith.science/api/pith-number/ZLZYVCVVQ34H3NO7YFXTVMSMZX/events.json","paper":"https://pith.science/paper/ZLZYVCVV"},"agent_actions":{"view_html":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX","download_json":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX.json","view_paper":"https://pith.science/paper/ZLZYVCVV","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.24968&json=true","fetch_graph":"https://pith.science/api/pith-number/ZLZYVCVVQ34H3NO7YFXTVMSMZX/graph.json","fetch_events":"https://pith.science/api/pith-number/ZLZYVCVVQ34H3NO7YFXTVMSMZX/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX/action/timestamp_anchor","attest_storage":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX/action/storage_attestation","attest_author":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX/action/author_attestation","sign_citation":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX/action/citation_signature","submit_replication":"https://pith.science/pith/ZLZYVCVVQ34H3NO7YFXTVMSMZX/action/replication_record"}},"created_at":"2026-06-25T00:17:47.138507+00:00","updated_at":"2026-06-25T00:17:47.138507+00:00"}