{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:DHYKZGZW2OB54NNEEPPB3PAD4W","short_pith_number":"pith:DHYKZGZW","canonical_record":{"source":{"id":"2605.18859","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T08:58:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"69c90d4b38b73ed64d0658ffba0d21ccc5f6daa79d6ccc54158472e3a282147f","abstract_canon_sha256":"055128c2117627eadc69a2efac5170989e714c5ede5167141b8f4db2d66f8ae1"},"schema_version":"1.0"},"canonical_sha256":"19f0ac9b36d383de35a423de1dbc03e580fd768741045491c72344539a4c8459","source":{"kind":"arxiv","id":"2605.18859","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18859","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18859v1","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18859","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_12","alias_value":"DHYKZGZW2OB5","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_16","alias_value":"DHYKZGZW2OB54NNE","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_8","alias_value":"DHYKZGZW","created_at":"2026-05-20T00:06:26Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:DHYKZGZW2OB54NNEEPPB3PAD4W","target":"record","payload":{"canonical_record":{"source":{"id":"2605.18859","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T08:58:59Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"69c90d4b38b73ed64d0658ffba0d21ccc5f6daa79d6ccc54158472e3a282147f","abstract_canon_sha256":"055128c2117627eadc69a2efac5170989e714c5ede5167141b8f4db2d66f8ae1"},"schema_version":"1.0"},"canonical_sha256":"19f0ac9b36d383de35a423de1dbc03e580fd768741045491c72344539a4c8459","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:06:26.189415Z","signature_b64":"5/SeYlkEIRBoNHPg0gLuILpOh7vGnIU2VTa+Gly8xQUdGHm3VQA79CEFqamE0EV0ZOpe0/X0NuWPyd3KDXKOBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"19f0ac9b36d383de35a423de1dbc03e580fd768741045491c72344539a4c8459","last_reissued_at":"2026-05-20T00:06:26.188488Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:06:26.188488Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.18859","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:26Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YYS6KqbWXqp/biF6bq5FKk/d1fRVJzAX9OwtE2+wYM1EG4SFQnp3TsnxAv/KTjY9orCmZ3gsRnSrXjlVU0jXDg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T09:12:08.256577Z"},"content_sha256":"ba8b061e6456d260b915b440001890b8a64253f0032e732f4da93b1f155b5b27","schema_version":"1.0","event_id":"sha256:ba8b061e6456d260b915b440001890b8a64253f0032e732f4da93b1f155b5b27"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:DHYKZGZW2OB54NNEEPPB3PAD4W","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"TwinRouterBench: Fast Static and Live Dynamic Evaluation for Realistic Agentic LLM Routing","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"Anjie Yang, Eric Yang, Hanchen Li, Jiarong Xing, Jie Xiao, Liang Tian, Lynn Ai, Pei Yang, Pengbin Feng, Tianyu Shi, Tongyun Yang, Wanyi Chen, Wentao Guo, Xu Wang, Yuhang Han, Yuhang Yao, Zeyu Wang","submitted_at":"2026-05-14T08:58:59Z","abstract_excerpt":"LLM routing matters most in long-horizon applications such as coding agents, deep research systems, and computer-use agents, where a single user request triggers many model calls. Routing each call to the cheapest sufficient model can cut costs without sacrificing quality, yet existing router benchmarks evaluate routers only on one-shot prompts. They never expose the router-visible prefix at an intermediate agent step, never test whether a cheaper replacement preserves downstream task success, and often rely on online LLM judges at evaluation time. We introduce TwinRouterBench, a step-level ro"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18859","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.18859/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:06:26Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"niZJuGjuK6XIQCp0RxIP84+Hn0D8gLl159umoiGlNxm6Ga0Z1o1hgn09wSh6b+spJw31mPCBVEdG9PSlWb6eAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T09:12:08.257384Z"},"content_sha256":"b67bc6e04713bea657291987d0f45b17cd383df828b2864703091f329b51a411","schema_version":"1.0","event_id":"sha256:b67bc6e04713bea657291987d0f45b17cd383df828b2864703091f329b51a411"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/bundle.json","state_url":"https://pith.science/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T09:12:08Z","links":{"resolver":"https://pith.science/pith/DHYKZGZW2OB54NNEEPPB3PAD4W","bundle":"https://pith.science/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/bundle.json","state":"https://pith.science/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DHYKZGZW2OB54NNEEPPB3PAD4W/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:DHYKZGZW2OB54NNEEPPB3PAD4W","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"055128c2117627eadc69a2efac5170989e714c5ede5167141b8f4db2d66f8ae1","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T08:58:59Z","title_canon_sha256":"69c90d4b38b73ed64d0658ffba0d21ccc5f6daa79d6ccc54158472e3a282147f"},"schema_version":"1.0","source":{"id":"2605.18859","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.18859","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"arxiv_version","alias_value":"2605.18859v1","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.18859","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_12","alias_value":"DHYKZGZW2OB5","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_16","alias_value":"DHYKZGZW2OB54NNE","created_at":"2026-05-20T00:06:26Z"},{"alias_kind":"pith_short_8","alias_value":"DHYKZGZW","created_at":"2026-05-20T00:06:26Z"}],"graph_snapshots":[{"event_id":"sha256:b67bc6e04713bea657291987d0f45b17cd383df828b2864703091f329b51a411","target":"graph","created_at":"2026-05-20T00:06:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.18859/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"LLM routing matters most in long-horizon applications such as coding agents, deep research systems, and computer-use agents, where a single user request triggers many model calls. Routing each call to the cheapest sufficient model can cut costs without sacrificing quality, yet existing router benchmarks evaluate routers only on one-shot prompts. They never expose the router-visible prefix at an intermediate agent step, never test whether a cheaper replacement preserves downstream task success, and often rely on online LLM judges at evaluation time. We introduce TwinRouterBench, a step-level ro","authors_text":"Anjie Yang, Eric Yang, Hanchen Li, Jiarong Xing, Jie Xiao, Liang Tian, Lynn Ai, Pei Yang, Pengbin Feng, Tianyu Shi, Tongyun Yang, Wanyi Chen, Wentao Guo, Xu Wang, Yuhang Han, Yuhang Yao, Zeyu Wang","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T08:58:59Z","title":"TwinRouterBench: Fast Static and Live Dynamic Evaluation for Realistic Agentic LLM Routing"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.18859","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:ba8b061e6456d260b915b440001890b8a64253f0032e732f4da93b1f155b5b27","target":"record","created_at":"2026-05-20T00:06:26Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"055128c2117627eadc69a2efac5170989e714c5ede5167141b8f4db2d66f8ae1","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-14T08:58:59Z","title_canon_sha256":"69c90d4b38b73ed64d0658ffba0d21ccc5f6daa79d6ccc54158472e3a282147f"},"schema_version":"1.0","source":{"id":"2605.18859","kind":"arxiv","version":1}},"canonical_sha256":"19f0ac9b36d383de35a423de1dbc03e580fd768741045491c72344539a4c8459","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"19f0ac9b36d383de35a423de1dbc03e580fd768741045491c72344539a4c8459","first_computed_at":"2026-05-20T00:06:26.188488Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:06:26.188488Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"5/SeYlkEIRBoNHPg0gLuILpOh7vGnIU2VTa+Gly8xQUdGHm3VQA79CEFqamE0EV0ZOpe0/X0NuWPyd3KDXKOBQ==","signature_status":"signed_v1","signed_at":"2026-05-20T00:06:26.189415Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.18859","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:ba8b061e6456d260b915b440001890b8a64253f0032e732f4da93b1f155b5b27","sha256:b67bc6e04713bea657291987d0f45b17cd383df828b2864703091f329b51a411"],"state_sha256":"cc430b68b90c665411ebf580ddef7ee332b5c247a47e5c9404d13e8a1569621e"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9aI3o4PdfVGWEkeuwRVaeoBj4HhAn+1J6zzA+QuxpxO5z6fDpC/uUcuJy8gyTjtBNnpKwURVY7z7yjUDJXiKAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T09:12:08.261749Z","bundle_sha256":"7be97172e0f76acb9780309e8f3abd428d77531f8f52feb10a7835b93899faa4"}}