{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:AIOQKSXHKB5YZ6EWPRIRX3PZ4H","short_pith_number":"pith:AIOQKSXH","schema_version":"1.0","canonical_sha256":"021d054ae7507b8cf8967c511bedf9e1d5b1a82458846cdebf3ad1deb660318a","source":{"kind":"arxiv","id":"2605.12803","version":1},"attestation_state":"computed","paper":{"title":"Pitfalls of Unlabeled Disagreement-Based Drift Detection in Streaming Tree Ensembles","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"Disagreement-based drift detection underperforms loss-based methods in incremental decision tree ensembles due to structural rigidity.","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Afonso Louren\\c{c}o, Goreti Marreiros, Lara S\\'a Neves, Lizy K. John","submitted_at":"2026-05-12T22:53:03Z","abstract_excerpt":"Detecting concept drift in high-speed data streams remains challenging, particularly when models must operate on unlabeled data and avoid false alarms caused by benign shifts. While disagreement-based uncertainty has shown promise in neural networks, its adaptation to ensembles of incremental decision trees (IDTs) remains largely unexplored. We investigate this approach by constructing batch-specific disagreement measures via label flipping in ensemble members and evaluating their effectiveness for drift detection in tabular data streams. Our experiments show that, although this method perform"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":true,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.12803","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-12T22:53:03Z","cross_cats_sorted":[],"title_canon_sha256":"18caeba6e8cfbecb262799f60ed0cde2e5dabb5cea7168d14601085b7687a6df","abstract_canon_sha256":"acb89353fc9f23f43802e1e3e843598a89481360a086849fad91df8ad3a5a72a"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T03:09:12.684522Z","signature_b64":"ttA8t5YI06iIz9sHsb8TEWc0D/35QMMFF2gcuuUOTxqsPZNDPI/xXHHPgaz31riaQKnd7lACJdA7TK+Dc0yFAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"021d054ae7507b8cf8967c511bedf9e1d5b1a82458846cdebf3ad1deb660318a","last_reissued_at":"2026-05-18T03:09:12.683936Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T03:09:12.683936Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Pitfalls of Unlabeled Disagreement-Based Drift Detection in Streaming Tree Ensembles","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"Disagreement-based drift detection underperforms loss-based methods in incremental decision tree ensembles due to structural rigidity.","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Afonso Louren\\c{c}o, Goreti Marreiros, Lara S\\'a Neves, Lizy K. John","submitted_at":"2026-05-12T22:53:03Z","abstract_excerpt":"Detecting concept drift in high-speed data streams remains challenging, particularly when models must operate on unlabeled data and avoid false alarms caused by benign shifts. While disagreement-based uncertainty has shown promise in neural networks, its adaptation to ensembles of incremental decision trees (IDTs) remains largely unexplored. We investigate this approach by constructing batch-specific disagreement measures via label flipping in ensemble members and evaluating their effectiveness for drift detection in tabular data streams. Our experiments show that, although this method perform"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"Our experiments show that, although this method performs well in ensembles of multi-layer perceptrons (MLPs), it consistently underperforms loss-based detectors when applied to IDTs. We attribute this behavior to the intrinsic rigidity of IDTs: learning primarily through structural expansion, with limited parameter adaptation, restricts model plasticity and prevents disagreement from reliably reflecting learning potential.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That batch-specific disagreement measures constructed via label flipping accurately reflect learning potential in IDTs and that the observed underperformance is caused by model rigidity rather than other factors in the experimental design.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"Disagreement measures from label flipping in IDT ensembles underperform loss-based drift detectors in streaming tabular data due to the limited plasticity of tree models.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"Disagreement-based drift detection underperforms loss-based methods in incremental decision tree ensembles due to structural rigidity.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"6734399691ada04e0170a3193b2e7352bd5d3f6c43ab3992a3c29fe6fdae8514"},"source":{"id":"2605.12803","kind":"arxiv","version":1},"verdict":{"id":"96f1ff77-01ba-4485-be1e-9e7583c4342a","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-14T20:28:23.101861Z","strongest_claim":"Our experiments show that, although this method performs well in ensembles of multi-layer perceptrons (MLPs), it consistently underperforms loss-based detectors when applied to IDTs. We attribute this behavior to the intrinsic rigidity of IDTs: learning primarily through structural expansion, with limited parameter adaptation, restricts model plasticity and prevents disagreement from reliably reflecting learning potential.","one_line_summary":"Disagreement measures from label flipping in IDT ensembles underperform loss-based drift detectors in streaming tabular data due to the limited plasticity of tree models.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That batch-specific disagreement measures constructed via label flipping accurately reflect learning potential in IDTs and that the observed underperformance is caused by model rigidity rather than other factors in the experimental design.","pith_extraction_headline":"Disagreement-based drift detection underperforms loss-based methods in incremental decision tree ensembles due to structural rigidity."},"references":{"count":48,"sample":[{"doi":"","year":2025,"title":"Knowledge and Information Systems , pages=","work_id":"c0cabcfa-6d31-4c1c-bd95-78aef4cf33c7","ref_index":1,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery & Data Mining , pages=","work_id":"c03f50e5-d89f-4fab-ab83-3fbc2776f072","ref_index":2,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":2024,"title":"Joint European Conference on Machine Learning and Knowledge Discovery in Databases , pages=","work_id":"9a2b3ac4-dcf8-4d15-b834-daa5361fbd06","ref_index":3,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"arXiv preprint arXiv:2512.11668 , year=","work_id":"7f604e50-de3d-459b-8fec-dd73777f957b","ref_index":4,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"arXiv preprint arXiv:2502.14011 , year=","work_id":"8a4d1e4a-2d3a-42a1-82d3-fa05b3dd3b0b","ref_index":5,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":48,"snapshot_sha256":"47985fba687f25bb97268f1227e5046dcb09e320708715780f233fd704739ced","internal_anchors":2},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.12803","created_at":"2026-05-18T03:09:12.684013+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.12803v1","created_at":"2026-05-18T03:09:12.684013+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.12803","created_at":"2026-05-18T03:09:12.684013+00:00"},{"alias_kind":"pith_short_12","alias_value":"AIOQKSXHKB5Y","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_16","alias_value":"AIOQKSXHKB5YZ6EW","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_8","alias_value":"AIOQKSXH","created_at":"2026-05-18T12:33:37.589309+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H","json":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H.json","graph_json":"https://pith.science/api/pith-number/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/graph.json","events_json":"https://pith.science/api/pith-number/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/events.json","paper":"https://pith.science/paper/AIOQKSXH"},"agent_actions":{"view_html":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H","download_json":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H.json","view_paper":"https://pith.science/paper/AIOQKSXH","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.12803&json=true","fetch_graph":"https://pith.science/api/pith-number/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/graph.json","fetch_events":"https://pith.science/api/pith-number/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/action/timestamp_anchor","attest_storage":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/action/storage_attestation","attest_author":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/action/author_attestation","sign_citation":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/action/citation_signature","submit_replication":"https://pith.science/pith/AIOQKSXHKB5YZ6EWPRIRX3PZ4H/action/replication_record"}},"created_at":"2026-05-18T03:09:12.684013+00:00","updated_at":"2026-05-18T03:09:12.684013+00:00"}