{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:BMJESM6C7IKYADU6SGRARGO6OB","short_pith_number":"pith:BMJESM6C","canonical_record":{"source":{"id":"2605.15734","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-15T08:43:26Z","cross_cats_sorted":[],"title_canon_sha256":"05edfaae8e7e5eaee5082c21e8e43cbfcbe14780cce772bd8d13e1d54f60dee6","abstract_canon_sha256":"2c322aedb84a9363cfa5f6534b0bb991a4be35dc765a8ac650765ff6022adff9"},"schema_version":"1.0"},"canonical_sha256":"0b124933c2fa15800e9e91a20899de705e9c48696b99c0bd16c8fa1dfe7f45ac","source":{"kind":"arxiv","id":"2605.15734","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.15734","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"arxiv_version","alias_value":"2605.15734v1","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.15734","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_12","alias_value":"BMJESM6C7IKY","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_16","alias_value":"BMJESM6C7IKYADU6","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_8","alias_value":"BMJESM6C","created_at":"2026-05-20T00:01:15Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:BMJESM6C7IKYADU6SGRARGO6OB","target":"record","payload":{"canonical_record":{"source":{"id":"2605.15734","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-15T08:43:26Z","cross_cats_sorted":[],"title_canon_sha256":"05edfaae8e7e5eaee5082c21e8e43cbfcbe14780cce772bd8d13e1d54f60dee6","abstract_canon_sha256":"2c322aedb84a9363cfa5f6534b0bb991a4be35dc765a8ac650765ff6022adff9"},"schema_version":"1.0"},"canonical_sha256":"0b124933c2fa15800e9e91a20899de705e9c48696b99c0bd16c8fa1dfe7f45ac","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T00:01:15.432090Z","signature_b64":"UJZhiKjpiVuN8E/WIl3yaVM/6r4YIMxDJv+NA+Ngtk9+dMyg5dxvTlBNuHBArItlSBfIZlc+yho4vxM+D88PCA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"0b124933c2fa15800e9e91a20899de705e9c48696b99c0bd16c8fa1dfe7f45ac","last_reissued_at":"2026-05-20T00:01:15.431271Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T00:01:15.431271Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.15734","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:01:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"JvvThTWk2VzDvuAdr1/t72aEwk1aHvfHGK7Qa7pNP9+ffMFv+5fEATSn+uIdiRos+nGoI4HB5wq/X/ImwWmvCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T15:04:55.276596Z"},"content_sha256":"4dace16e1d76a4bdfdbfef76ea1048c4244ce2348a072be6cc6601c0f777fa90","schema_version":"1.0","event_id":"sha256:4dace16e1d76a4bdfdbfef76ea1048c4244ce2348a072be6cc6601c0f777fa90"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:BMJESM6C7IKYADU6SGRARGO6OB","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Can We Trust AI-Inferred User States. A Psychometric Framework for Validating the Reliability of Users States Classification by LLMs in Operational Environments","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Ewa Komkowska, Izabella Krzeminska, Michal Butkiewicz","submitted_at":"2026-05-15T08:43:26Z","abstract_excerpt":"The use of large language models to assess user states in conversational and adaptive systems is based on the assumption that the metrics used for such assessment are stable and interpretable at the level of individual scores. This paper empirically tests this assumption, focusing on the psychometric reliability of artificial intelligence (AI) measures of user states.\n  This study employed replication evaluation procedures to assess the repeatability of a broad set of metrics across three different bimodal large language models (GPT-4o audio, Gemini 2.0 Flash, Gemini 2.5 Flash). Analyses inclu"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.15734","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.15734/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"ai_meta_artifact","ran_at":"2026-05-19T19:33:24.069328Z","status":"skipped","version":"1.0.0","findings_count":0},{"name":"claim_evidence","ran_at":"2026-05-19T17:21:55.988733Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"a7a5d8141aac675adfd5e83fb24b8cfc5e58e47bc56f3184220be8b95c218a35"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T00:01:15Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ie9ouEATG8g/p+R+ePTv19+GmxALVKpaD77ywC54rBVRZWW3RGqTp+FPMQZ3WWYw5VbPm3RTzWo6sQ7BJnM0Bw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T15:04:55.277010Z"},"content_sha256":"98f9f838546a53b6ef8bb21c44760669cedbba7853d807e0f7b0b869930b75ba","schema_version":"1.0","event_id":"sha256:98f9f838546a53b6ef8bb21c44760669cedbba7853d807e0f7b0b869930b75ba"},{"event_type":"integrity_finding","subject_pith_number":"pith:2026:BMJESM6C7IKYADU6SGRARGO6OB","target":"integrity","payload":{"note":"DOI in the printed bibliography is fragmented by whitespace or line breaks. A longer candidate (10.1109/ACII.2011.5951547.Sheng) was visible in the surrounding text but could not be confirmed against doi.org as printed.","snippet":"Schuller, Bj¨ ornet al., (2011). “Recognising Realistic Emotions and Affect in Speech and Text”, International Conference on Affective Computing.doi:10.1109/ACII.2011.5951547. Sheng, Emilyet al., (2019). “The Woman Worked as a Babysitter: O","arxiv_id":"2605.15734","detector":"doi_compliance","evidence":{"ref_index":12,"verdict_class":"incontrovertible","resolved_title":null,"printed_excerpt":"Schuller, Bj¨ ornet al., (2011). “Recognising Realistic Emotions and Affect in Speech and Text”, International Conference on Affective Computing.doi:10.1109/ACII.2011.5951547. Sheng, Emilyet al., (2019). “The Woman Worked as a Babysitter: O","reconstructed_doi":"10.1109/ACII.2011.5951547.Sheng"},"severity":"advisory","ref_index":12,"audited_at":"2026-05-20T19:23:30.631661Z","event_type":"pith.integrity.v1","detected_doi":"10.1109/ACII.2011.5951547.Sheng","detector_url":"https://pith.science/pith-integrity-protocol#doi_compliance","external_url":null,"finding_type":"recoverable_identifier","evidence_hash":"e116f6042a0d2b5fd6707f56c70c77d76724eabb607b3bdfc9fb73cf45fbbcc5","paper_version":1,"verdict_class":"incontrovertible","resolved_title":null,"detector_version":"1.0.0","detected_arxiv_id":null,"integrity_event_id":5431,"payload_sha256":"7a48fc6c099312e28937eda3b63b1fa486007055ffa6a3c9c410d44e199b8777","signature_b64":"0AYkeUIRuqvbMhohQBtCiR2/GsVH9MYjVAArNHbZK68m+3sgOIpN2PLlB+1HT8xpBTBq2ArBzS+M/tTf0XpNDQ==","signing_key_id":"pith-v1-2026-05"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T19:28:26Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"44togmvmB45A/wtpI1hs5n2OZNu1jSBr4bop+RENZoiWyTw2OCBG8BvN7lTJCaQLVonokMjJO+TME3w2h6GxCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T15:04:55.277914Z"},"content_sha256":"e24ec61498cf85f6e6f91e036a8c4a891af3191d32e0b156ce8fe908ed3356cb","schema_version":"1.0","event_id":"sha256:e24ec61498cf85f6e6f91e036a8c4a891af3191d32e0b156ce8fe908ed3356cb"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/BMJESM6C7IKYADU6SGRARGO6OB/bundle.json","state_url":"https://pith.science/pith/BMJESM6C7IKYADU6SGRARGO6OB/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/BMJESM6C7IKYADU6SGRARGO6OB/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T15:04:55Z","links":{"resolver":"https://pith.science/pith/BMJESM6C7IKYADU6SGRARGO6OB","bundle":"https://pith.science/pith/BMJESM6C7IKYADU6SGRARGO6OB/bundle.json","state":"https://pith.science/pith/BMJESM6C7IKYADU6SGRARGO6OB/state.json","well_known_bundle":"https://pith.science/.well-known/pith/BMJESM6C7IKYADU6SGRARGO6OB/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:BMJESM6C7IKYADU6SGRARGO6OB","merge_version":"pith-open-graph-merge-v1","event_count":3,"valid_event_count":3,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"2c322aedb84a9363cfa5f6534b0bb991a4be35dc765a8ac650765ff6022adff9","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-15T08:43:26Z","title_canon_sha256":"05edfaae8e7e5eaee5082c21e8e43cbfcbe14780cce772bd8d13e1d54f60dee6"},"schema_version":"1.0","source":{"id":"2605.15734","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.15734","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"arxiv_version","alias_value":"2605.15734v1","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.15734","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_12","alias_value":"BMJESM6C7IKY","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_16","alias_value":"BMJESM6C7IKYADU6","created_at":"2026-05-20T00:01:15Z"},{"alias_kind":"pith_short_8","alias_value":"BMJESM6C","created_at":"2026-05-20T00:01:15Z"}],"graph_snapshots":[{"event_id":"sha256:98f9f838546a53b6ef8bb21c44760669cedbba7853d807e0f7b0b869930b75ba","target":"graph","created_at":"2026-05-20T00:01:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T19:33:24.069328Z","status":"skipped","version":"1.0.0"},{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-19T17:21:55.988733Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.15734/integrity.json","findings":[],"snapshot_sha256":"a7a5d8141aac675adfd5e83fb24b8cfc5e58e47bc56f3184220be8b95c218a35","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"The use of large language models to assess user states in conversational and adaptive systems is based on the assumption that the metrics used for such assessment are stable and interpretable at the level of individual scores. This paper empirically tests this assumption, focusing on the psychometric reliability of artificial intelligence (AI) measures of user states.\n  This study employed replication evaluation procedures to assess the repeatability of a broad set of metrics across three different bimodal large language models (GPT-4o audio, Gemini 2.0 Flash, Gemini 2.5 Flash). Analyses inclu","authors_text":"Ewa Komkowska, Izabella Krzeminska, Michal Butkiewicz","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-15T08:43:26Z","title":"Can We Trust AI-Inferred User States. A Psychometric Framework for Validating the Reliability of Users States Classification by LLMs in Operational Environments"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.15734","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:4dace16e1d76a4bdfdbfef76ea1048c4244ce2348a072be6cc6601c0f777fa90","target":"record","created_at":"2026-05-20T00:01:15Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"2c322aedb84a9363cfa5f6534b0bb991a4be35dc765a8ac650765ff6022adff9","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2026-05-15T08:43:26Z","title_canon_sha256":"05edfaae8e7e5eaee5082c21e8e43cbfcbe14780cce772bd8d13e1d54f60dee6"},"schema_version":"1.0","source":{"id":"2605.15734","kind":"arxiv","version":1}},"canonical_sha256":"0b124933c2fa15800e9e91a20899de705e9c48696b99c0bd16c8fa1dfe7f45ac","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"0b124933c2fa15800e9e91a20899de705e9c48696b99c0bd16c8fa1dfe7f45ac","first_computed_at":"2026-05-20T00:01:15.431271Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T00:01:15.431271Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UJZhiKjpiVuN8E/WIl3yaVM/6r4YIMxDJv+NA+Ngtk9+dMyg5dxvTlBNuHBArItlSBfIZlc+yho4vxM+D88PCA==","signature_status":"signed_v1","signed_at":"2026-05-20T00:01:15.432090Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.15734","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:4dace16e1d76a4bdfdbfef76ea1048c4244ce2348a072be6cc6601c0f777fa90","sha256:98f9f838546a53b6ef8bb21c44760669cedbba7853d807e0f7b0b869930b75ba","sha256:e24ec61498cf85f6e6f91e036a8c4a891af3191d32e0b156ce8fe908ed3356cb"],"state_sha256":"c7a55694a950f1815ab643f589d9745906d1ca000e8da7f34ca951ba144879a7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"G3henm4q0NGWRVxt6mjWglzYMqCqh2MOObRPVvb7/8bxvMgXyGMPFvZa/SgQOh8gVmuoWo+1y3zoeWFOn3q4Cw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T15:04:55.280094Z","bundle_sha256":"5e4bae253d7dd7ffb1b059193a451b3d5ebad47e06bfeceb47d490186d58baf3"}}