{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:2LGE4ZKGNWNHVLZOGUGFJIMOA6","short_pith_number":"pith:2LGE4ZKG","schema_version":"1.0","canonical_sha256":"d2cc4e65466d9a7aaf2e350c54a18e07b67a277eb911e1929096b40d653c25f2","source":{"kind":"arxiv","id":"2605.18565","version":1},"attestation_state":"computed","paper":{"title":"LongMINT: Evaluating Memory under Multi-Target Interference in Long-Horizon Agent Systems","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Elias Stengel-Eskin, Hyunji Lee, Joykirat Singh, Justin Chih-Yao Chen, Mohit Bansal, Zaid Khan","submitted_at":"2026-05-18T15:43:35Z","abstract_excerpt":"Real-world agents operate over long and evolving horizons, where information is repeatedly updated and may interfere across memories, requiring accurate recall and aggregated reasoning over multiple pieces of information. However, existing benchmarks focus on static, independent recall and fail to capture these dynamic interactions between evolving memories. In this paper, we study how current memory-augmented agents perform in realistic, interference-heavy, long-horizon settings across diverse domains and question types. We introduce LongMINT (Long-Horizon Memory under INTerference), a benchm"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.18565","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-18T15:43:35Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"67f0ae3b485d4c03a3d8a4e9bd3f82ab6652107faab311a59863c29fcf52b093","abstract_canon_sha256":"07cc2cc3668032be4b611ecb3c8e3955dd20a1746e0ec44e418ad71701dee1fc"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:07.963487Z","signature_b64":"y6db0OQvqFNQou9OVb0CoKaKGydDN8qkAkcXSsdDpoBBp21srwKUJZZDcf/LLjvgLoGv5YTDq0VLuYZSDEBBDA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d2cc4e65466d9a7aaf2e350c54a18e07b67a277eb911e1929096b40d653c25f2","last_reissued_at":"2026-05-20T00:06:07.962620Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:07.962620Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"LongMINT: Evaluating Memory under Multi-Target Interference in Long-Horizon Agent Systems","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.CL","authors_text":"Elias Stengel-Eskin, Hyunji Lee, Joykirat Singh, Justin Chih-Yao Chen, Mohit Bansal, Zaid Khan","submitted_at":"2026-05-18T15:43:35Z","abstract_excerpt":"Real-world agents operate over long and evolving horizons, where information is repeatedly updated and may interfere across memories, requiring accurate recall and aggregated reasoning over multiple pieces of information. However, existing benchmarks focus on static, independent recall and fail to capture these dynamic interactions between evolving memories. In this paper, we study how current memory-augmented agents perform in realistic, interference-heavy, long-horizon settings across diverse domains and question types. We introduce LongMINT (Long-Horizon Memory under INTerference), a benchm"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18565","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18565/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"claim_evidence","ran_at":"2026-05-20T00:01:59.351332Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"889b1ea0a679a453b7abe093719b0b41470daf93da9836de32262f9e4b76dc81"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.18565","created_at":"2026-05-20T00:06:07.962750+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.18565v1","created_at":"2026-05-20T00:06:07.962750+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18565","created_at":"2026-05-20T00:06:07.962750+00:00"},{"alias_kind":"pith_short_12","alias_value":"2LGE4ZKGNWNH","created_at":"2026-05-20T00:06:07.962750+00:00"},{"alias_kind":"pith_short_16","alias_value":"2LGE4ZKGNWNHVLZO","created_at":"2026-05-20T00:06:07.962750+00:00"},{"alias_kind":"pith_short_8","alias_value":"2LGE4ZKG","created_at":"2026-05-20T00:06:07.962750+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6","json":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6.json","graph_json":"https://pith.science/api/pith-number/2LGE4ZKGNWNHVLZOGUGFJIMOA6/graph.json","events_json":"https://pith.science/api/pith-number/2LGE4ZKGNWNHVLZOGUGFJIMOA6/events.json","paper":"https://pith.science/paper/2LGE4ZKG"},"agent_actions":{"view_html":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6","download_json":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6.json","view_paper":"https://pith.science/paper/2LGE4ZKG","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.18565&json=true","fetch_graph":"https://pith.science/api/pith-number/2LGE4ZKGNWNHVLZOGUGFJIMOA6/graph.json","fetch_events":"https://pith.science/api/pith-number/2LGE4ZKGNWNHVLZOGUGFJIMOA6/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6/action/timestamp_anchor","attest_storage":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6/action/storage_attestation","attest_author":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6/action/author_attestation","sign_citation":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6/action/citation_signature","submit_replication":"https://pith.science/pith/2LGE4ZKGNWNHVLZOGUGFJIMOA6/action/replication_record"}},"created_at":"2026-05-20T00:06:07.962750+00:00","updated_at":"2026-05-20T00:06:07.962750+00:00"}