{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:QBDA5KU5FNO4N6WU6RLKYU2MCG","short_pith_number":"pith:QBDA5KU5","canonical_record":{"source":{"id":"2603.20088","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CY","submitted_at":"2026-03-20T16:13:03Z","cross_cats_sorted":[],"title_canon_sha256":"fe16bcdc9387b9c702d7f0ffc8741acf0135f5625a1583c2cb1458bdb8dfd023","abstract_canon_sha256":"cd0a8419f3a6681176846344a39160060c9c9372cab523556eeab689249efafc"},"schema_version":"1.0"},"canonical_sha256":"80460eaa9d2b5dc6fad4f456ac534c11b774a5e36f3f4492dcc77d41affae5f3","source":{"kind":"arxiv","id":"2603.20088","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.20088","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"arxiv_version","alias_value":"2603.20088v2","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.20088","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_12","alias_value":"QBDA5KU5FNO4","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_16","alias_value":"QBDA5KU5FNO4N6WU","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_8","alias_value":"QBDA5KU5","created_at":"2026-05-25T02:02:14Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:QBDA5KU5FNO4N6WU6RLKYU2MCG","target":"record","payload":{"canonical_record":{"source":{"id":"2603.20088","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CY","submitted_at":"2026-03-20T16:13:03Z","cross_cats_sorted":[],"title_canon_sha256":"fe16bcdc9387b9c702d7f0ffc8741acf0135f5625a1583c2cb1458bdb8dfd023","abstract_canon_sha256":"cd0a8419f3a6681176846344a39160060c9c9372cab523556eeab689249efafc"},"schema_version":"1.0"},"canonical_sha256":"80460eaa9d2b5dc6fad4f456ac534c11b774a5e36f3f4492dcc77d41affae5f3","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-25T02:02:14.517394Z","signature_b64":"hcDzkXD0am5DWVppsEsdCNNoiDueyMPplox4x7Ynqlth458K2EoC0aLBd5FlzqYnaTQV4SKZFLYixemiqAgxAA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"80460eaa9d2b5dc6fad4f456ac534c11b774a5e36f3f4492dcc77d41affae5f3","last_reissued_at":"2026-05-25T02:02:14.516713Z","signature_status":"signed_v1","first_computed_at":"2026-05-25T02:02:14.516713Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2603.20088","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:02:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"81n960I7XMFBQBXo1C3e52Uml+9Ncy3gggdsoghT5p4Apr9+u9OBzSnsAGJnLInY5b5fjXoN6krF2AwnIrkjAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T16:56:09.462800Z"},"content_sha256":"420a5fadb1fccd180fc14c1887d02d9dacd49c766703397276cf2d76ec6d6650","schema_version":"1.0","event_id":"sha256:420a5fadb1fccd180fc14c1887d02d9dacd49c766703397276cf2d76ec6d6650"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:QBDA5KU5FNO4N6WU6RLKYU2MCG","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Towards an Evaluation Methodology for AI in Second Language Education: Lessons Learned from Developing L2-Bench","license":"http://creativecommons.org/licenses/by-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CY","authors_text":"Ben Knight, Danielle Carvalho, Elizabeth Wonnacott, Isaac Pattis, James Edgell, Wm. Matthew Kennedy","submitted_at":"2026-03-20T16:13:03Z","abstract_excerpt":"The rapid adoption of large language models in AI-powered language education has created an urgent need for evaluations that assess pedagogical effectiveness, particularly in language learning--one of the most common LLM use cases (Tamkin et al. 2024; Costa-Gomes et al. 2025). With only narrowly defined task-specific evaluations of AI system capabilities in second language (L2) education existing in the literature, we require more holistic approaches in this AI for education space. To address this gap, we describe the iteration of the methodology we developed to build L2-Bench, a novel, contex"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.20088","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2603.20088/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-25T02:02:14Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"r1czsU7D5MvoATaznQzVarUdvqmy7OlcgbBRt4Jq005JLOuZAsfawMBDwi7p3g7jM7HK3gNsNmNiUBiYY+poAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T16:56:09.463529Z"},"content_sha256":"f55cec18b015cb4a0f62dcf73b47a6ab608ee814d23d19f3326a939aa1ab0ead","schema_version":"1.0","event_id":"sha256:f55cec18b015cb4a0f62dcf73b47a6ab608ee814d23d19f3326a939aa1ab0ead"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/bundle.json","state_url":"https://pith.science/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T16:56:09Z","links":{"resolver":"https://pith.science/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG","bundle":"https://pith.science/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/bundle.json","state":"https://pith.science/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/state.json","well_known_bundle":"https://pith.science/.well-known/pith/QBDA5KU5FNO4N6WU6RLKYU2MCG/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:QBDA5KU5FNO4N6WU6RLKYU2MCG","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"cd0a8419f3a6681176846344a39160060c9c9372cab523556eeab689249efafc","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CY","submitted_at":"2026-03-20T16:13:03Z","title_canon_sha256":"fe16bcdc9387b9c702d7f0ffc8741acf0135f5625a1583c2cb1458bdb8dfd023"},"schema_version":"1.0","source":{"id":"2603.20088","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2603.20088","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"arxiv_version","alias_value":"2603.20088v2","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2603.20088","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_12","alias_value":"QBDA5KU5FNO4","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_16","alias_value":"QBDA5KU5FNO4N6WU","created_at":"2026-05-25T02:02:14Z"},{"alias_kind":"pith_short_8","alias_value":"QBDA5KU5","created_at":"2026-05-25T02:02:14Z"}],"graph_snapshots":[{"event_id":"sha256:f55cec18b015cb4a0f62dcf73b47a6ab608ee814d23d19f3326a939aa1ab0ead","target":"graph","created_at":"2026-05-25T02:02:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2603.20088/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The rapid adoption of large language models in AI-powered language education has created an urgent need for evaluations that assess pedagogical effectiveness, particularly in language learning--one of the most common LLM use cases (Tamkin et al. 2024; Costa-Gomes et al. 2025). With only narrowly defined task-specific evaluations of AI system capabilities in second language (L2) education existing in the literature, we require more holistic approaches in this AI for education space. To address this gap, we describe the iteration of the methodology we developed to build L2-Bench, a novel, contex","authors_text":"Ben Knight, Danielle Carvalho, Elizabeth Wonnacott, Isaac Pattis, James Edgell, Wm. Matthew Kennedy","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CY","submitted_at":"2026-03-20T16:13:03Z","title":"Towards an Evaluation Methodology for AI in Second Language Education: Lessons Learned from Developing L2-Bench"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2603.20088","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:420a5fadb1fccd180fc14c1887d02d9dacd49c766703397276cf2d76ec6d6650","target":"record","created_at":"2026-05-25T02:02:14Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"cd0a8419f3a6681176846344a39160060c9c9372cab523556eeab689249efafc","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by-sa/4.0/","primary_cat":"cs.CY","submitted_at":"2026-03-20T16:13:03Z","title_canon_sha256":"fe16bcdc9387b9c702d7f0ffc8741acf0135f5625a1583c2cb1458bdb8dfd023"},"schema_version":"1.0","source":{"id":"2603.20088","kind":"arxiv","version":2}},"canonical_sha256":"80460eaa9d2b5dc6fad4f456ac534c11b774a5e36f3f4492dcc77d41affae5f3","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"80460eaa9d2b5dc6fad4f456ac534c11b774a5e36f3f4492dcc77d41affae5f3","first_computed_at":"2026-05-25T02:02:14.516713Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-25T02:02:14.516713Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"hcDzkXD0am5DWVppsEsdCNNoiDueyMPplox4x7Ynqlth458K2EoC0aLBd5FlzqYnaTQV4SKZFLYixemiqAgxAA==","signature_status":"signed_v1","signed_at":"2026-05-25T02:02:14.517394Z","signed_message":"canonical_sha256_bytes"},"source_id":"2603.20088","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:420a5fadb1fccd180fc14c1887d02d9dacd49c766703397276cf2d76ec6d6650","sha256:f55cec18b015cb4a0f62dcf73b47a6ab608ee814d23d19f3326a939aa1ab0ead"],"state_sha256":"bb7b1747a1651cdf532c4fda17c717486332ef9d44223d8b062e7e2af778907a"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"vmftmUbjFIUJ5RxOO8bDA5amd0de1N+OycrIKJx9AmGhqIp8P1cD/i2xLNOhX8KNHkc5mSHS5RqltNgZq6NLDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T16:56:09.467389Z","bundle_sha256":"0cd645eb5add3952dc75e307fd6c6d358cd260dba5dfb95708514255e6d95e13"}}