{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:SBM7WDJDH4LHHBUYVJFKTEGFUV","short_pith_number":"pith:SBM7WDJD","canonical_record":{"source":{"id":"2606.07127","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","cross_cats_sorted":[],"title_canon_sha256":"484b2bd691f4af08045004dbeb91d181cf8f0e32c30d3fda5076b3ffa14123aa","abstract_canon_sha256":"a0720399165bc12e6f61928eed77907406d9d2adab6c4efbea267209d039c443"},"schema_version":"1.0"},"canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","source":{"kind":"arxiv","id":"2606.07127","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07127","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07127v1","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07127","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_12","alias_value":"SBM7WDJDH4LH","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_16","alias_value":"SBM7WDJDH4LHHBUY","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_8","alias_value":"SBM7WDJD","created_at":"2026-06-08T01:04:47Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:SBM7WDJDH4LHHBUYVJFKTEGFUV","target":"record","payload":{"canonical_record":{"source":{"id":"2606.07127","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","cross_cats_sorted":[],"title_canon_sha256":"484b2bd691f4af08045004dbeb91d181cf8f0e32c30d3fda5076b3ffa14123aa","abstract_canon_sha256":"a0720399165bc12e6f61928eed77907406d9d2adab6c4efbea267209d039c443"},"schema_version":"1.0"},"canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-08T01:04:47.889719Z","signature_b64":"A5XgfEvg9vfD0g+8/5oboP2+m5SOCbhqjRVm3i2Qob7vjr8+WytGAmGAgs1qZO0B1U1Qc0lbtwfll3wJFOxUDw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","last_reissued_at":"2026-06-08T01:04:47.888894Z","signature_status":"signed_v1","first_computed_at":"2026-06-08T01:04:47.888894Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.07127","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"PDLz+NE8asKtVxzbQgDlMHMHo/MKj5cbrcfzUmGEjEO4GxGAs3fejxYaDAbkCs6Gk82TpPrC1McqjzfCXCQqDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T01:30:13.921985Z"},"content_sha256":"d77d925b744640c027d8ea42270c8b5f781b4f45580adbf734dcc92a0186ed10","schema_version":"1.0","event_id":"sha256:d77d925b744640c027d8ea42270c8b5f781b4f45580adbf734dcc92a0186ed10"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:SBM7WDJDH4LHHBUYVJFKTEGFUV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Learning Explicit Behavioral Models with Adaptive Questions and World-Model Probes","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Christopher Tauchmann, Gopika Sudhakaran, Hikaru Shindo, Jannis Bl\\\"uml, Kristian Kersting, Quentin Delfosse, Teng Cao, Yu Deng","submitted_at":"2026-06-05T10:34:55Z","abstract_excerpt":"Interactive agents trained only against task return can achieve high scores while failing to represent the mechanisms that make their actions succeed. This makes brittle behavior difficult to diagnose and limits adaptation when environment dynamics change. Existing LLM reflection and policy-code repair can revise behavior from failed trajectories, but questions and world-understanding tests are usually used only after training. We introduce an Explicit Symbolic Behavioral Model (ESBM), a trainable behavioral model that couples task performance with evidence-grounded question answering and exec"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07127","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.07127/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-08T01:04:47Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"F1hl5e4BFeHvfgkdx6mDiuD9BvAPpIJ+Ku0pd1gNbzZ3ooMRn6X0qJ68Fcy9JT0fbktge7w+LoLThZX0ToOHBQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-02T01:30:13.922381Z"},"content_sha256":"f49eecb7df73c23a2ceb77ce98189f76fe6da804d263108435c745b57a602006","schema_version":"1.0","event_id":"sha256:f49eecb7df73c23a2ceb77ce98189f76fe6da804d263108435c745b57a602006"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/bundle.json","state_url":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-02T01:30:13Z","links":{"resolver":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV","bundle":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/bundle.json","state":"https://pith.science/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/SBM7WDJDH4LHHBUYVJFKTEGFUV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:SBM7WDJDH4LHHBUYVJFKTEGFUV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a0720399165bc12e6f61928eed77907406d9d2adab6c4efbea267209d039c443","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","title_canon_sha256":"484b2bd691f4af08045004dbeb91d181cf8f0e32c30d3fda5076b3ffa14123aa"},"schema_version":"1.0","source":{"id":"2606.07127","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.07127","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"arxiv_version","alias_value":"2606.07127v1","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.07127","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_12","alias_value":"SBM7WDJDH4LH","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_16","alias_value":"SBM7WDJDH4LHHBUY","created_at":"2026-06-08T01:04:47Z"},{"alias_kind":"pith_short_8","alias_value":"SBM7WDJD","created_at":"2026-06-08T01:04:47Z"}],"graph_snapshots":[{"event_id":"sha256:f49eecb7df73c23a2ceb77ce98189f76fe6da804d263108435c745b57a602006","target":"graph","created_at":"2026-06-08T01:04:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.07127/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Interactive agents trained only against task return can achieve high scores while failing to represent the mechanisms that make their actions succeed. This makes brittle behavior difficult to diagnose and limits adaptation when environment dynamics change. Existing LLM reflection and policy-code repair can revise behavior from failed trajectories, but questions and world-understanding tests are usually used only after training. We introduce an Explicit Symbolic Behavioral Model (ESBM), a trainable behavioral model that couples task performance with evidence-grounded question answering and exec","authors_text":"Christopher Tauchmann, Gopika Sudhakaran, Hikaru Shindo, Jannis Bl\\\"uml, Kristian Kersting, Quentin Delfosse, Teng Cao, Yu Deng","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","title":"Learning Explicit Behavioral Models with Adaptive Questions and World-Model Probes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.07127","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d77d925b744640c027d8ea42270c8b5f781b4f45580adbf734dcc92a0186ed10","target":"record","created_at":"2026-06-08T01:04:47Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a0720399165bc12e6f61928eed77907406d9d2adab6c4efbea267209d039c443","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.LG","submitted_at":"2026-06-05T10:34:55Z","title_canon_sha256":"484b2bd691f4af08045004dbeb91d181cf8f0e32c30d3fda5076b3ffa14123aa"},"schema_version":"1.0","source":{"id":"2606.07127","kind":"arxiv","version":1}},"canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9059fb0d233f16738698aa4aa990c5a5700c74f7beac5e28931be7d9df455390","first_computed_at":"2026-06-08T01:04:47.888894Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-08T01:04:47.888894Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"A5XgfEvg9vfD0g+8/5oboP2+m5SOCbhqjRVm3i2Qob7vjr8+WytGAmGAgs1qZO0B1U1Qc0lbtwfll3wJFOxUDw==","signature_status":"signed_v1","signed_at":"2026-06-08T01:04:47.889719Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.07127","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d77d925b744640c027d8ea42270c8b5f781b4f45580adbf734dcc92a0186ed10","sha256:f49eecb7df73c23a2ceb77ce98189f76fe6da804d263108435c745b57a602006"],"state_sha256":"663e4712c0c59f76e814bccd95f63da11d02c35b65a507cb043816fd58592e42"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"D/gv/gBG7Nzsphx8p4/b2o9mCt6BEwGRcGHw4vydcXfZRHnTniGenNRV7U0MWSJ1PHzpGXRq9sT5DScrLBTSDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-02T01:30:13.924364Z","bundle_sha256":"ccf1f9e5b9faa63186a9f0df91871451de41c2b9db75c35b078c99d91ff44b76"}}