{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2025:RYVQEAUDGW65ZGD55QAOJNHSIW","short_pith_number":"pith:RYVQEAUD","canonical_record":{"source":{"id":"2507.19849","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-26T07:53:11Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"c6efe2ebcc3ed7ebb55512d4066b4de04d544066275cf02ab776cb1a95f4a0df","abstract_canon_sha256":"2d063dcb52d9088260070a91f280b9064b4539cd1d082dfcb0de4de283df80a3"},"schema_version":"1.0"},"canonical_sha256":"8e2b02028335bddc987dec00e4b4f2459a73c968a690cb2f56fc3280e364f4d7","source":{"kind":"arxiv","id":"2507.19849","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.19849","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"arxiv_version","alias_value":"2507.19849v1","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.19849","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"pith_short_12","alias_value":"RYVQEAUDGW65","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RYVQEAUDGW65ZGD5","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RYVQEAUD","created_at":"2026-05-18T12:33:37Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2025:RYVQEAUDGW65ZGD55QAOJNHSIW","target":"record","payload":{"canonical_record":{"source":{"id":"2507.19849","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-26T07:53:11Z","cross_cats_sorted":["cs.AI","cs.CL"],"title_canon_sha256":"c6efe2ebcc3ed7ebb55512d4066b4de04d544066275cf02ab776cb1a95f4a0df","abstract_canon_sha256":"2d063dcb52d9088260070a91f280b9064b4539cd1d082dfcb0de4de283df80a3"},"schema_version":"1.0"},"canonical_sha256":"8e2b02028335bddc987dec00e4b4f2459a73c968a690cb2f56fc3280e364f4d7","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:38:15.333885Z","signature_b64":"ysfb8jNGBhZqy1LdoRFEuTVGNj6ZHhBS70b9WsLDgLQLETf5x5+wOubjiUmIZQaWtEdfbdYVdXiwhsqyC8PyAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8e2b02028335bddc987dec00e4b4f2459a73c968a690cb2f56fc3280e364f4d7","last_reissued_at":"2026-05-17T23:38:15.333245Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:38:15.333245Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2507.19849","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:38:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"1S+sfpqH9Bf0jKOQRCCzWRx8SPUMAfbiInjpWYLXGM1YSo57dxDnDFsYmu5kSk/9mEjEwFnxf1e34578fQMHBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T05:10:13.128296Z"},"content_sha256":"f9d1043b1c12a48d506bae72f82cf62fb1a3c2aaa8508568f5f61c9867d01f17","schema_version":"1.0","event_id":"sha256:f9d1043b1c12a48d506bae72f82cf62fb1a3c2aaa8508568f5f61c9867d01f17"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2025:RYVQEAUDGW65ZGD55QAOJNHSIW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Agentic Reinforced Policy Optimization","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call.","cross_cats":["cs.AI","cs.CL"],"primary_cat":"cs.LG","authors_text":"Fuzheng Zhang, Guanting Dong, Guorui Zhou, Hangyu Mao, Huiyang Wang, Jiazhen Du, Ji-Rong Wen, Kai Ma, Licheng Bao, Yifei Chen, Yutao Zhu, Zhicheng Dou, Zhongxia Chen, Zhongyuan Wang","submitted_at":"2025-07-26T07:53:11Z","abstract_excerpt":"Large-scale reinforcement learning with verifiable rewards (RLVR) has demonstrated its effectiveness in harnessing the potential of large language models (LLMs) for single-turn reasoning tasks. In realistic reasoning scenarios, LLMs can often utilize external tools to assist in task-solving processes. However, current RL algorithms inadequately balance the models' intrinsic long-horizon reasoning capabilities and their proficiency in multi-turn tool interactions. To bridge this gap, we propose Agentic Reinforced Policy Optimization (ARPO), a novel agentic RL algorithm tailored for training mul"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"ARPO achieves improved performance using only half of the tool-use budget required by existing methods, offering a scalable solution for aligning LLM-based agents with real-time dynamic environments.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"The preliminary observation that LLMs exhibit highly uncertain behavior (increased entropy) immediately following tool interactions is general enough to guide adaptive sampling across tasks and that this mechanism reliably improves long-horizon performance.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"ARPO adds entropy-based adaptive rollouts and stepwise advantage attribution to RL for LLM agents, outperforming prior trajectory-level methods on 13 benchmarks with half the tool budget.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"7ac708c2735623518227c9c9fea38d27afe5c25896ce4e08a003e3e3bca89518"},"source":{"id":"2507.19849","kind":"arxiv","version":1},"verdict":{"id":"a88afeff-b07d-47e7-826b-849b9284cf41","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-17T02:53:04.888884Z","strongest_claim":"ARPO achieves improved performance using only half of the tool-use budget required by existing methods, offering a scalable solution for aligning LLM-based agents with real-time dynamic environments.","one_line_summary":"ARPO adds entropy-based adaptive rollouts and stepwise advantage attribution to RL for LLM agents, outperforming prior trajectory-level methods on 13 benchmarks with half the tool budget.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"The preliminary observation that LLMs exhibit highly uncertain behavior (increased entropy) immediately following tool interactions is general enough to guide adaptive sampling across tasks and that this mechanism reliably improves long-horizon performance.","pith_extraction_headline":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call."},"references":{"count":11,"sample":[{"doi":"10.18653/v1/2020.coling-main.580","year":2020,"title":"REINFORCE++: Stabilizing Critic-Free Policy Optimization with Global Advantage Normalization","work_id":"557f9e99-cb00-4dd2-92fd-67ddcddbb35d","ref_index":1,"cited_arxiv_id":"2501.03262","is_internal_anchor":true},{"doi":"10.18653/v1/2023.findings-emnlp.378","year":2023,"title":"Prabha, D., Aswini, J., Maheswari, B., Subramanian, R","work_id":"d690fac4-0cde-42d6-958a-77a77c0e7bd0","ref_index":3,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"10.48550/arxiv","year":2025,"title":"Scaling Relationship on Learning Mathematical Reasoning with Large Language Models","work_id":"15eea2e2-dff3-42a7-842a-b663d50f64cb","ref_index":5,"cited_arxiv_id":"2308.01825","is_internal_anchor":true},{"doi":"","year":2024,"title":"thinking while doing","work_id":"a538c3a8-43ab-4c98-9bce-23c1952d7dc1","ref_index":6,"cited_arxiv_id":"","is_internal_anchor":false},{"doi":"","year":null,"title":"Each interaction response length is capped at 4096 tokens","work_id":"7f546fee-7358-4734-a82f-45417904c092","ref_index":7,"cited_arxiv_id":"","is_internal_anchor":false}],"resolved_work":11,"snapshot_sha256":"9e5ed862b21c0d38e4ad20f60781ea547fee361314ab61e7fd1611873909a002","internal_anchors":2},"formal_canon":{"evidence_count":2,"snapshot_sha256":"57118c3a0ee8588e8a444efaf89d75ec04ca7b43baec44d67609ee1f2b70d331"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"a88afeff-b07d-47e7-826b-849b9284cf41"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:38:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ng4MYqpcaJuMO5fHRG3NqgwH+qy5MRVRjwiQML4ZhxiEFPHCVExuKaiapQa0NYWBVfPhky98x0ijcwuWMQGuDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-23T05:10:13.129250Z"},"content_sha256":"8842a7e3887b5b7875f3490dfdffab12575ed7365989bb5601699d481ea1f03e","schema_version":"1.0","event_id":"sha256:8842a7e3887b5b7875f3490dfdffab12575ed7365989bb5601699d481ea1f03e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/bundle.json","state_url":"https://pith.science/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-23T05:10:13Z","links":{"resolver":"https://pith.science/pith/RYVQEAUDGW65ZGD55QAOJNHSIW","bundle":"https://pith.science/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/bundle.json","state":"https://pith.science/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RYVQEAUDGW65ZGD55QAOJNHSIW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:RYVQEAUDGW65ZGD55QAOJNHSIW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"2d063dcb52d9088260070a91f280b9064b4539cd1d082dfcb0de4de283df80a3","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-26T07:53:11Z","title_canon_sha256":"c6efe2ebcc3ed7ebb55512d4066b4de04d544066275cf02ab776cb1a95f4a0df"},"schema_version":"1.0","source":{"id":"2507.19849","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2507.19849","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"arxiv_version","alias_value":"2507.19849v1","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2507.19849","created_at":"2026-05-17T23:38:15Z"},{"alias_kind":"pith_short_12","alias_value":"RYVQEAUDGW65","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_16","alias_value":"RYVQEAUDGW65ZGD5","created_at":"2026-05-18T12:33:37Z"},{"alias_kind":"pith_short_8","alias_value":"RYVQEAUD","created_at":"2026-05-18T12:33:37Z"}],"graph_snapshots":[{"event_id":"sha256:8842a7e3887b5b7875f3490dfdffab12575ed7365989bb5601699d481ea1f03e","target":"graph","created_at":"2026-05-17T23:38:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"ARPO achieves improved performance using only half of the tool-use budget required by existing methods, offering a scalable solution for aligning LLM-based agents with real-time dynamic environments."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The preliminary observation that LLMs exhibit highly uncertain behavior (increased entropy) immediately following tool interactions is general enough to guide adaptive sampling across tasks and that this mechanism reliably improves long-horizon performance."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"ARPO adds entropy-based adaptive rollouts and stepwise advantage attribution to RL for LLM agents, outperforming prior trajectory-level methods on 13 benchmarks with half the tool budget."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call."}],"snapshot_sha256":"7ac708c2735623518227c9c9fea38d27afe5c25896ce4e08a003e3e3bca89518"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"57118c3a0ee8588e8a444efaf89d75ec04ca7b43baec44d67609ee1f2b70d331"},"paper":{"abstract_excerpt":"Large-scale reinforcement learning with verifiable rewards (RLVR) has demonstrated its effectiveness in harnessing the potential of large language models (LLMs) for single-turn reasoning tasks. In realistic reasoning scenarios, LLMs can often utilize external tools to assist in task-solving processes. However, current RL algorithms inadequately balance the models' intrinsic long-horizon reasoning capabilities and their proficiency in multi-turn tool interactions. To bridge this gap, we propose Agentic Reinforced Policy Optimization (ARPO), a novel agentic RL algorithm tailored for training mul","authors_text":"Fuzheng Zhang, Guanting Dong, Guorui Zhou, Hangyu Mao, Huiyang Wang, Jiazhen Du, Ji-Rong Wen, Kai Ma, Licheng Bao, Yifei Chen, Yutao Zhu, Zhicheng Dou, Zhongxia Chen, Zhongyuan Wang","cross_cats":["cs.AI","cs.CL"],"headline":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-26T07:53:11Z","title":"Agentic Reinforced Policy Optimization"},"references":{"count":11,"internal_anchors":2,"resolved_work":11,"sample":[{"cited_arxiv_id":"2501.03262","doi":"10.18653/v1/2020.coling-main.580","is_internal_anchor":true,"ref_index":1,"title":"REINFORCE++: Stabilizing Critic-Free Policy Optimization with Global Advantage Normalization","work_id":"557f9e99-cb00-4dd2-92fd-67ddcddbb35d","year":2020},{"cited_arxiv_id":"","doi":"10.18653/v1/2023.findings-emnlp.378","is_internal_anchor":false,"ref_index":3,"title":"Prabha, D., Aswini, J., Maheswari, B., Subramanian, R","work_id":"d690fac4-0cde-42d6-958a-77a77c0e7bd0","year":2023},{"cited_arxiv_id":"2308.01825","doi":"10.48550/arxiv","is_internal_anchor":true,"ref_index":5,"title":"Scaling Relationship on Learning Mathematical Reasoning with Large Language Models","work_id":"15eea2e2-dff3-42a7-842a-b663d50f64cb","year":2025},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":6,"title":"thinking while doing","work_id":"a538c3a8-43ab-4c98-9bce-23c1952d7dc1","year":2024},{"cited_arxiv_id":"","doi":"","is_internal_anchor":false,"ref_index":7,"title":"Each interaction response length is capped at 4096 tokens","work_id":"7f546fee-7358-4734-a82f-45417904c092","year":null}],"snapshot_sha256":"9e5ed862b21c0d38e4ad20f60781ea547fee361314ab61e7fd1611873909a002"},"source":{"id":"2507.19849","kind":"arxiv","version":1},"verdict":{"created_at":"2026-05-17T02:53:04.888884Z","id":"a88afeff-b07d-47e7-826b-849b9284cf41","model_set":{"reader":"grok-4.3"},"one_line_summary":"ARPO adds entropy-based adaptive rollouts and stepwise advantage attribution to RL for LLM agents, outperforming prior trajectory-level methods on 13 benchmarks with half the tool budget.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"ARPO improves LLM agent performance on long-horizon tasks by sampling more at high-entropy steps right after each tool call.","strongest_claim":"ARPO achieves improved performance using only half of the tool-use budget required by existing methods, offering a scalable solution for aligning LLM-based agents with real-time dynamic environments.","weakest_assumption":"The preliminary observation that LLMs exhibit highly uncertain behavior (increased entropy) immediately following tool interactions is general enough to guide adaptive sampling across tasks and that this mechanism reliably improves long-horizon performance."}},"verdict_id":"a88afeff-b07d-47e7-826b-849b9284cf41"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f9d1043b1c12a48d506bae72f82cf62fb1a3c2aaa8508568f5f61c9867d01f17","target":"record","created_at":"2026-05-17T23:38:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"2d063dcb52d9088260070a91f280b9064b4539cd1d082dfcb0de4de283df80a3","cross_cats_sorted":["cs.AI","cs.CL"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2025-07-26T07:53:11Z","title_canon_sha256":"c6efe2ebcc3ed7ebb55512d4066b4de04d544066275cf02ab776cb1a95f4a0df"},"schema_version":"1.0","source":{"id":"2507.19849","kind":"arxiv","version":1}},"canonical_sha256":"8e2b02028335bddc987dec00e4b4f2459a73c968a690cb2f56fc3280e364f4d7","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8e2b02028335bddc987dec00e4b4f2459a73c968a690cb2f56fc3280e364f4d7","first_computed_at":"2026-05-17T23:38:15.333245Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:38:15.333245Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"ysfb8jNGBhZqy1LdoRFEuTVGNj6ZHhBS70b9WsLDgLQLETf5x5+wOubjiUmIZQaWtEdfbdYVdXiwhsqyC8PyAQ==","signature_status":"signed_v1","signed_at":"2026-05-17T23:38:15.333885Z","signed_message":"canonical_sha256_bytes"},"source_id":"2507.19849","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f9d1043b1c12a48d506bae72f82cf62fb1a3c2aaa8508568f5f61c9867d01f17","sha256:8842a7e3887b5b7875f3490dfdffab12575ed7365989bb5601699d481ea1f03e"],"state_sha256":"4943f81ba94dcef98d2bfdfdaa5b22f838bc1442e87a7cd0de278c5692fe5210"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"GNVmpUei1qcYf4ZfuF8Wv/7JWBmpU7X7OXsxeKfTU7fPgiFjhMXArkvcJHyHHFnFZdKRFCdy6vKBYJgxKC1qDg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-23T05:10:13.133458Z","bundle_sha256":"da8aca9b8e4a16b0cc70e1f8a184ddd3195b93dc2999301838501f11a6d89022"}}