{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2024:L6DVLFH6QKIWIGB7R7CPWUXCFV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"654701d4e58c0507d9184e948dad726d351f36869d2390268207012df903bc7d","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2024-02-14T04:50:18Z","title_canon_sha256":"a01f4cce52ba2285d96b23396284fb31c8534d7f322ffb897956b57687ad02b5"},"schema_version":"1.0","source":{"id":"2402.08939","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2402.08939","created_at":"2026-07-05T08:24:01Z"},{"alias_kind":"arxiv_version","alias_value":"2402.08939v3","created_at":"2026-07-05T08:24:01Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2402.08939","created_at":"2026-07-05T08:24:01Z"},{"alias_kind":"pith_short_12","alias_value":"L6DVLFH6QKIW","created_at":"2026-07-05T08:24:01Z"},{"alias_kind":"pith_short_16","alias_value":"L6DVLFH6QKIWIGB7","created_at":"2026-07-05T08:24:01Z"},{"alias_kind":"pith_short_8","alias_value":"L6DVLFH6","created_at":"2026-07-05T08:24:01Z"}],"graph_snapshots":[{"event_id":"sha256:9ca54dec6e1fb99cb5a1e99dc57959fdd7ca8d2dec95e2df8a58d1d17e689ab4","target":"graph","created_at":"2026-07-05T08:24:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2402.08939/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large language models (LLMs) have accomplished remarkable reasoning performance in various domains. However, in the domain of reasoning tasks, we discover a frailty: LLMs are surprisingly brittle to the ordering of the premises, despite the fact that such ordering does not alter the underlying task. In particular, we observe that LLMs achieve the best performance when the premise order aligns with the context required in intermediate reasoning steps. For example, in deductive reasoning tasks, presenting the premises in the same order as the ground truth proof in the prompt (as opposed to rando","authors_text":"Denny Zhou, Ryan A. Chi, Xinyun Chen, Xuezhi Wang","cross_cats":["cs.CL"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2024-02-14T04:50:18Z","title":"Premise Order Matters in Reasoning with Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2402.08939","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:96eb23bf1bfd8bb164c3d1291078d84469445e0ca255106cea85873a5dab5d00","target":"record","created_at":"2026-07-05T08:24:01Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"654701d4e58c0507d9184e948dad726d351f36869d2390268207012df903bc7d","cross_cats_sorted":["cs.CL"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.AI","submitted_at":"2024-02-14T04:50:18Z","title_canon_sha256":"a01f4cce52ba2285d96b23396284fb31c8534d7f322ffb897956b57687ad02b5"},"schema_version":"1.0","source":{"id":"2402.08939","kind":"arxiv","version":3}},"canonical_sha256":"5f875594fe829164183f8fc4fb52e22d7b29f29eb0955ca7b1ee4b0c67e5fb8a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5f875594fe829164183f8fc4fb52e22d7b29f29eb0955ca7b1ee4b0c67e5fb8a","first_computed_at":"2026-07-05T08:24:01.582751Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T08:24:01.582751Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"a/Bil8IA0J165vmTnIJ8U0h1uyIy6h04OIXcpTP5dNEHxLkkDwoE4fRMQKNML8/YdCURTRO/Y049MFcvi2NpCg==","signature_status":"signed_v1","signed_at":"2026-07-05T08:24:01.583236Z","signed_message":"canonical_sha256_bytes"},"source_id":"2402.08939","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:96eb23bf1bfd8bb164c3d1291078d84469445e0ca255106cea85873a5dab5d00","sha256:9ca54dec6e1fb99cb5a1e99dc57959fdd7ca8d2dec95e2df8a58d1d17e689ab4"],"state_sha256":"cce8908d80bdc9182328f7fcf0a4f2791b3d73a7fa489808722e886279baeabc"}