{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:A7GTVK4T6XJ2F4XI74PTGHWHMQ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"3704f56d1ce9bbaabc91bc2798caae9fd4faaf1993d13b37e14d45bcca669c30","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-03T15:05:44Z","title_canon_sha256":"d73baeb8155395957b1a8e8b3a72f867961207c1fcd005d05df49e329994aa7b"},"schema_version":"1.0","source":{"id":"2511.01650","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2511.01650","created_at":"2026-06-19T16:10:32Z"},{"alias_kind":"arxiv_version","alias_value":"2511.01650v3","created_at":"2026-06-19T16:10:32Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2511.01650","created_at":"2026-06-19T16:10:32Z"},{"alias_kind":"pith_short_12","alias_value":"A7GTVK4T6XJ2","created_at":"2026-06-19T16:10:32Z"},{"alias_kind":"pith_short_16","alias_value":"A7GTVK4T6XJ2F4XI","created_at":"2026-06-19T16:10:32Z"},{"alias_kind":"pith_short_8","alias_value":"A7GTVK4T","created_at":"2026-06-19T16:10:32Z"}],"graph_snapshots":[{"event_id":"sha256:da7fb2e984627eca253b3ec187f9bf6ef8d7053f6bf330f29dce9502b326f0ad","target":"graph","created_at":"2026-06-19T16:10:32Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2511.01650/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Large Language Models (LLMs) are increasingly entering specialized, safety-critical engineering workflows governed by strict quantitative standards and immutable physical laws, making rigorous evaluation of their reasoning capabilities imperative. However, existing benchmarks such as MMLU, MATH, and HumanEval assess isolated cognitive skills, failing to capture the physically grounded reasoning central to engineering, where scientific principles, quantitative modeling, and practical constraints must converge. To enable verifiable process supervision in engineering, we introduce EngTrace, a sym","authors_text":"Ayesha Gull, Fan Zhang, Muhammad Usman Safder, Preslav Nakov, Rania Elbadry, Veselin Stoyanov, Zhuohan Xie","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-03T15:05:44Z","title":"EngTrace: A Symbolic Benchmark for Verifiable Process Supervision of Engineering Reasoning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2511.01650","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d204394a4b23eea6d7a1bd1c79418008dece0f0671d2466176be3184815ae0be","target":"record","created_at":"2026-06-19T16:10:32Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"3704f56d1ce9bbaabc91bc2798caae9fd4faaf1993d13b37e14d45bcca669c30","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CL","submitted_at":"2025-11-03T15:05:44Z","title_canon_sha256":"d73baeb8155395957b1a8e8b3a72f867961207c1fcd005d05df49e329994aa7b"},"schema_version":"1.0","source":{"id":"2511.01650","kind":"arxiv","version":3}},"canonical_sha256":"07cd3aab93f5d3a2f2e8ff1f331ec7643cbe5b0577a533f4e5c56aa0d35abe8f","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"07cd3aab93f5d3a2f2e8ff1f331ec7643cbe5b0577a533f4e5c56aa0d35abe8f","first_computed_at":"2026-06-19T16:10:32.050398Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-19T16:10:32.050398Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UcIlHIzj+oX7+B2phmAX/+tcuiFPe1IaXTzS0+GtIKz/cn5caog6FW9Wm3iuTcqsxjiHnhw1ENJtFYQo10Y0CQ==","signature_status":"signed_v1","signed_at":"2026-06-19T16:10:32.050833Z","signed_message":"canonical_sha256_bytes"},"source_id":"2511.01650","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d204394a4b23eea6d7a1bd1c79418008dece0f0671d2466176be3184815ae0be","sha256:da7fb2e984627eca253b3ec187f9bf6ef8d7053f6bf330f29dce9502b326f0ad"],"state_sha256":"3c034b91c81a833d34dc0cb14fff2f828e4d57e50da83e72204422a9aeb150cb"}