{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:VTHNCTOK6L6UN2AKXSPKPRLSRT","short_pith_number":"pith:VTHNCTOK","canonical_record":{"source":{"id":"2606.17588","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-16T06:51:04Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"e1b9149a638ecbc46a4545625b16a4062316e4959ed750a9939a323567009338","abstract_canon_sha256":"51299d04ba5878e59c48212673abbbffdcd95b8e1688d119749dc10ae1ca11e1"},"schema_version":"1.0"},"canonical_sha256":"acced14dcaf2fd46e80abc9ea7c5728cdbc71b63940b521ef30370da95de10b3","source":{"kind":"arxiv","id":"2606.17588","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.17588","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"arxiv_version","alias_value":"2606.17588v1","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17588","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_12","alias_value":"VTHNCTOK6L6U","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_16","alias_value":"VTHNCTOK6L6UN2AK","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_8","alias_value":"VTHNCTOK","created_at":"2026-06-19T16:10:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:VTHNCTOK6L6UN2AKXSPKPRLSRT","target":"record","payload":{"canonical_record":{"source":{"id":"2606.17588","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-16T06:51:04Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"e1b9149a638ecbc46a4545625b16a4062316e4959ed750a9939a323567009338","abstract_canon_sha256":"51299d04ba5878e59c48212673abbbffdcd95b8e1688d119749dc10ae1ca11e1"},"schema_version":"1.0"},"canonical_sha256":"acced14dcaf2fd46e80abc9ea7c5728cdbc71b63940b521ef30370da95de10b3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-19T16:10:16.670401Z","signature_b64":"oVEQHSkMPTkZKMiHagj8lZKx59eA7SncjEQyHJmW31/AsplJXk8aRd2Eez6KIgdKOwgGa932MQO7uUWM/+BnDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"acced14dcaf2fd46e80abc9ea7c5728cdbc71b63940b521ef30370da95de10b3","last_reissued_at":"2026-06-19T16:10:16.670001Z","signature_status":"signed_v1","first_computed_at":"2026-06-19T16:10:16.670001Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.17588","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"C9NIlcqK/FVXjtlV1rz9lCq7rcNEEk30th2ucRVJ8+2iaQD3rMm4mRJVqcuQqU+oWGbkqzpYxtdFd/nttkwUAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T08:21:47.728452Z"},"content_sha256":"667d48d482346ad40168f49be25c2d66cedbfaae39875b7104c893d1ea65d08c","schema_version":"1.0","event_id":"sha256:667d48d482346ad40168f49be25c2d66cedbfaae39875b7104c893d1ea65d08c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:VTHNCTOK6L6UN2AKXSPKPRLSRT","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Understanding LLMs in Title-Abstract Screening: From Disagreements to Recommendations","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.SE","authors_text":"Igor Steinmacher, Katia Romero Felizardo, Marco Gerosa, Miikka Kuutila, Mika M\\\"antyl\\\"a, Patricia Matsubara, Savio de Sousa Sampaio, Tayana Conte","submitted_at":"2026-06-16T06:51:04Z","abstract_excerpt":"Several studies have examined the use of large language models (LLMs) for title-abstract screening in systematic reviews (SRs), reporting mixed accuracy. However, questions of reliability remain largely unaddressed. In this study, we go beyond quantitative LLM-human agreement metrics and qualitatively investigate how and why LLMs fail. We also propose actionable recommendations. We analyzed disagreements between LLMs and researchers across six software engineering SRs and over 1,000 primary study papers. For each SR, papers were screened independently by human experts and LLMs in zero-shot mod"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17588","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.17588/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-19T16:10:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"iAy80+WTHzpTGvxYjQYqayeIJBKpPQxL/i3v+zQZFkUcEsNflZ15HlExkp2V5DIEY8y19h98zInFia/3GjPpCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-28T08:21:47.729037Z"},"content_sha256":"78a1ec36bc97f2c322117c9f742e7d1f47f66358e27aed506de5b0d922484810","schema_version":"1.0","event_id":"sha256:78a1ec36bc97f2c322117c9f742e7d1f47f66358e27aed506de5b0d922484810"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/bundle.json","state_url":"https://pith.science/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-28T08:21:47Z","links":{"resolver":"https://pith.science/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT","bundle":"https://pith.science/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/bundle.json","state":"https://pith.science/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/state.json","well_known_bundle":"https://pith.science/.well-known/pith/VTHNCTOK6L6UN2AKXSPKPRLSRT/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:VTHNCTOK6L6UN2AKXSPKPRLSRT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"51299d04ba5878e59c48212673abbbffdcd95b8e1688d119749dc10ae1ca11e1","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-16T06:51:04Z","title_canon_sha256":"e1b9149a638ecbc46a4545625b16a4062316e4959ed750a9939a323567009338"},"schema_version":"1.0","source":{"id":"2606.17588","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.17588","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"arxiv_version","alias_value":"2606.17588v1","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.17588","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_12","alias_value":"VTHNCTOK6L6U","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_16","alias_value":"VTHNCTOK6L6UN2AK","created_at":"2026-06-19T16:10:16Z"},{"alias_kind":"pith_short_8","alias_value":"VTHNCTOK","created_at":"2026-06-19T16:10:16Z"}],"graph_snapshots":[{"event_id":"sha256:78a1ec36bc97f2c322117c9f742e7d1f47f66358e27aed506de5b0d922484810","target":"graph","created_at":"2026-06-19T16:10:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.17588/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Several studies have examined the use of large language models (LLMs) for title-abstract screening in systematic reviews (SRs), reporting mixed accuracy. However, questions of reliability remain largely unaddressed. In this study, we go beyond quantitative LLM-human agreement metrics and qualitatively investigate how and why LLMs fail. We also propose actionable recommendations. We analyzed disagreements between LLMs and researchers across six software engineering SRs and over 1,000 primary study papers. For each SR, papers were screened independently by human experts and LLMs in zero-shot mod","authors_text":"Igor Steinmacher, Katia Romero Felizardo, Marco Gerosa, Miikka Kuutila, Mika M\\\"antyl\\\"a, Patricia Matsubara, Savio de Sousa Sampaio, Tayana Conte","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-16T06:51:04Z","title":"Understanding LLMs in Title-Abstract Screening: From Disagreements to Recommendations"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.17588","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:667d48d482346ad40168f49be25c2d66cedbfaae39875b7104c893d1ea65d08c","target":"record","created_at":"2026-06-19T16:10:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"51299d04ba5878e59c48212673abbbffdcd95b8e1688d119749dc10ae1ca11e1","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.SE","submitted_at":"2026-06-16T06:51:04Z","title_canon_sha256":"e1b9149a638ecbc46a4545625b16a4062316e4959ed750a9939a323567009338"},"schema_version":"1.0","source":{"id":"2606.17588","kind":"arxiv","version":1}},"canonical_sha256":"acced14dcaf2fd46e80abc9ea7c5728cdbc71b63940b521ef30370da95de10b3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"acced14dcaf2fd46e80abc9ea7c5728cdbc71b63940b521ef30370da95de10b3","first_computed_at":"2026-06-19T16:10:16.670001Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:10:16.670001Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"oVEQHSkMPTkZKMiHagj8lZKx59eA7SncjEQyHJmW31/AsplJXk8aRd2Eez6KIgdKOwgGa932MQO7uUWM/+BnDA==","signature_status":"signed_v1","signed_at":"2026-06-19T16:10:16.670401Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.17588","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:667d48d482346ad40168f49be25c2d66cedbfaae39875b7104c893d1ea65d08c","sha256:78a1ec36bc97f2c322117c9f742e7d1f47f66358e27aed506de5b0d922484810"],"state_sha256":"dbf37176ba6aa1e9d80c24a7dd1376ad38a36db210711054d40c455c2fdc01ba"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"stSUt6guz9aZyQmEt04AiW6U8Xu5CR40k0ZcD9B7IyFQlwYooRwm+qmF55RJKu2InthGsizp0MYBIc+0gCKKCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-28T08:21:47.731173Z","bundle_sha256":"acea23d540db788e154d9ce09e0578df011de194c07ffff435f9942586169540"}}