{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:SBM7WDJDH4LHHBUYVJFKTEGFUV","short_pith_number":"pith:SBM7WDJD","schema_version":"1.0","canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","source":{"kind":"arxiv","id":"2606.07127","version":1},"attestation_state":"computed","paper":{"title":"Learning Explicit Behavioral Models with Adaptive Questions and World-Model Probes","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Christopher Tauchmann, Gopika Sudhakaran, Hikaru Shindo, Jannis Bl\\\"uml, Kristian Kersting, Quentin Delfosse, Teng Cao, Yu Deng","submitted_at":"2026-06-05T10:34:55Z","abstract_excerpt":"Interactive agents trained only against task return can achieve high scores while failing to represent the mechanisms that make their actions succeed. This makes brittle behavior difficult to diagnose and limits adaptation when environment dynamics change. Existing LLM reflection and policy-code repair can revise behavior from failed trajectories, but questions and world-understanding tests are usually used only after training. We introduce an Explicit Symbolic Behavioral Model (ESBM), a trainable behavioral model that couples task performance with evidence-grounded question answering and exec"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.07127","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","cross_cats_sorted":[],"title_canon_sha256":"484b2bd691f4af08045004dbeb91d181cf8f0e32c30d3fda5076b3ffa14123aa","abstract_canon_sha256":"a0720399165bc12e6f61928eed77907406d9d2adab6c4efbea267209d039c443"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-08T01:04:47.889719Z","signature_b64":"A5XgfEvg9vfD0g+8/5oboP2+m5SOCbhqjRVm3i2Qob7vjr8+WytGAmGAgs1qZO0B1U1Qc0lbtwfll3wJFOxUDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","last_reissued_at":"2026-06-08T01:04:47.888894Z","signature_status":"signed_v1","first_computed_at":"2026-06-08T01:04:47.888894Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Learning Explicit Behavioral Models with Adaptive Questions and World-Model Probes","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Christopher Tauchmann, Gopika Sudhakaran, Hikaru Shindo, Jannis Bl\\\"uml, Kristian Kersting, Quentin Delfosse, Teng Cao, Yu Deng","submitted_at":"2026-06-05T10:34:55Z","abstract_excerpt":"Interactive agents trained only against task return can achieve high scores while failing to represent the mechanisms that make their actions succeed. This makes brittle behavior difficult to diagnose and limits adaptation when environment dynamics change. Existing LLM reflection and policy-code repair can revise behavior from failed trajectories, but questions and world-understanding tests are usually used only after training. We introduce an Explicit Symbolic Behavioral Model (ESBM), a trainable behavioral model that couples task performance with evidence-grounded question answering and exec"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07127","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.07127/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.07127","created_at":"2026-06-08T01:04:47.889019+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.07127v1","created_at":"2026-06-08T01:04:47.889019+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07127","created_at":"2026-06-08T01:04:47.889019+00:00"},{"alias_kind":"pith_short_12","alias_value":"SBM7WDJDH4LH","created_at":"2026-06-08T01:04:47.889019+00:00"},{"alias_kind":"pith_short_16","alias_value":"SBM7WDJDH4LHHBUY","created_at":"2026-06-08T01:04:47.889019+00:00"},{"alias_kind":"pith_short_8","alias_value":"SBM7WDJD","created_at":"2026-06-08T01:04:47.889019+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV","json":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV.json","graph_json":"https://pith.science/api/pith-number/SBM7WDJDH4LHHBUYVJFKTEGFUV/graph.json","events_json":"https://pith.science/api/pith-number/SBM7WDJDH4LHHBUYVJFKTEGFUV/events.json","paper":"https://pith.science/paper/SBM7WDJD"},"agent_actions":{"view_html":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV","download_json":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV.json","view_paper":"https://pith.science/paper/SBM7WDJD","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.07127&json=true","fetch_graph":"https://pith.science/api/pith-number/SBM7WDJDH4LHHBUYVJFKTEGFUV/graph.json","fetch_events":"https://pith.science/api/pith-number/SBM7WDJDH4LHHBUYVJFKTEGFUV/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/action/timestamp_anchor","attest_storage":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/action/storage_attestation","attest_author":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/action/author_attestation","sign_citation":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/action/citation_signature","submit_replication":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/action/replication_record"}},"created_at":"2026-06-08T01:04:47.889019+00:00","updated_at":"2026-06-08T01:04:47.889019+00:00"}