{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:Z43LXKWPAMDLOHNY4PQIQY6JLV","short_pith_number":"pith:Z43LXKWP","canonical_record":{"source":{"id":"2605.11021","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-10T16:21:31Z","cross_cats_sorted":[],"title_canon_sha256":"1367a8f9dfe7deeb7b6cda9fc40c07ae986d30178b072d47d5f2fd1ecdc94c61","abstract_canon_sha256":"50e911934cfb9d76dc0b2679b68867559464df43c129533a94dbdd78c07fee9c"},"schema_version":"1.0"},"canonical_sha256":"cf36bbaacf0306b71db8e3e08863c95d6d665df4fce51a86f60fe5cac9432b80","source":{"kind":"arxiv","id":"2605.11021","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.11021","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"arxiv_version","alias_value":"2605.11021v2","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.11021","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_12","alias_value":"Z43LXKWPAMDL","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_16","alias_value":"Z43LXKWPAMDLOHNY","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_8","alias_value":"Z43LXKWP","created_at":"2026-05-20T01:05:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:Z43LXKWPAMDLOHNY4PQIQY6JLV","target":"record","payload":{"canonical_record":{"source":{"id":"2605.11021","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-10T16:21:31Z","cross_cats_sorted":[],"title_canon_sha256":"1367a8f9dfe7deeb7b6cda9fc40c07ae986d30178b072d47d5f2fd1ecdc94c61","abstract_canon_sha256":"50e911934cfb9d76dc0b2679b68867559464df43c129533a94dbdd78c07fee9c"},"schema_version":"1.0"},"canonical_sha256":"cf36bbaacf0306b71db8e3e08863c95d6d665df4fce51a86f60fe5cac9432b80","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:16.523167Z","signature_b64":"e+6q1gk2IbGp7bW84tBBG6n0UsRbAng4Z8QGQwSFubzROvbN66+RDeI749PNkbBQHW2r05tdmZSmKhyzHXElBA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cf36bbaacf0306b71db8e3e08863c95d6d665df4fce51a86f60fe5cac9432b80","last_reissued_at":"2026-05-20T01:05:16.522625Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:16.522625Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.11021","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Po++cX9RD0O/kzx8zdEjQqYxODnomHBjnvE2ZbI+kdnG4DmxAUgjRmIY80zzHhm8LLIS2mAixO5SA8H5qgh9Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T08:19:58.065975Z"},"content_sha256":"96cfa87bc83254b015d60f2c05baa266dfc2d5ca093180fe0dc1f6c28b5b6b23","schema_version":"1.0","event_id":"sha256:96cfa87bc83254b015d60f2c05baa266dfc2d5ca093180fe0dc1f6c28b5b6b23"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:Z43LXKWPAMDLOHNY4PQIQY6JLV","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"A Switching System Theory of Q-Learning with Linear Function Approximation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence.","cross_cats":[],"primary_cat":"cs.LG","authors_text":"Donghwan Lee, Han-Dong Lim","submitted_at":"2026-05-10T16:21:31Z","abstract_excerpt":"This paper develops a switching-system interpretation of Q-learning with linear function approximation (LFA) based on the joint spectral radius (JSR). We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system. The same construction is then used for stochastic linear Q-learning with independent and identically distributed (i.i.d.) observations and with Markovian observations. Although exact JSR computation is difficult in general, the certificate captures products of switching modes and can be less conservative than o"},"claims":{"count":4,"items":[{"kind":"strongest_claim","text":"We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system.","source":"verdict.strongest_claim","status":"machine_extracted","claim_id":"C1","attestation":"unclaimed"},{"kind":"weakest_assumption","text":"That the mean dynamics of Q-learning with linear function approximation admit an exact representation as a finite set of linear switching modes whose joint spectral radius governs convergence.","source":"verdict.weakest_assumption","status":"machine_extracted","claim_id":"C2","attestation":"unclaimed"},{"kind":"one_line_summary","text":"Q-learning with linear function approximation is recast as a switched linear system whose mean dynamics converge precisely when the joint spectral radius of the switching matrices is less than one.","source":"verdict.one_line_summary","status":"machine_extracted","claim_id":"C3","attestation":"unclaimed"},{"kind":"headline","text":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence.","source":"verdict.pith_extraction.headline","status":"machine_extracted","claim_id":"C4","attestation":"unclaimed"}],"snapshot_sha256":"a247039adf7c2c82490ccff4e02adeb57ca275eaec16da47124a3be6fb0711bd"},"source":{"id":"2605.11021","kind":"arxiv","version":2},"verdict":{"id":"4ea7ee26-af9d-4ea6-a95b-6ba0ed2d5db3","model_set":{"reader":"grok-4.3"},"created_at":"2026-05-13T06:10:24.513147Z","strongest_claim":"We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system.","one_line_summary":"Q-learning with linear function approximation is recast as a switched linear system whose mean dynamics converge precisely when the joint spectral radius of the switching matrices is less than one.","pipeline_version":"pith-pipeline@v0.9.0","weakest_assumption":"That the mean dynamics of Q-learning with linear function approximation admit an exact representation as a finite set of linear switching modes whose joint spectral radius governs convergence.","pith_extraction_headline":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence."},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.11021/integrity.json","findings":[],"available":true,"detectors_run":[{"name":"ai_meta_artifact","ran_at":"2026-05-19T16:38:37.979452Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_title_agreement","ran_at":"2026-05-19T12:31:18.615231Z","status":"completed","version":"1.0.0","findings_count":0},{"name":"doi_compliance","ran_at":"2026-05-19T10:01:55.864039Z","status":"completed","version":"1.0.0","findings_count":0}],"snapshot_sha256":"d945f3abaec74bf6fcc6b26cb0613bdcf3d7b3efd19ea009b0fc4674ea76b303"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":2,"snapshot_sha256":"fa7fc3100520dbfff4d4799d0c1459456edb08313e192ec1c9de9bff4712aadc"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":"4ea7ee26-af9d-4ea6-a95b-6ba0ed2d5db3"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:16Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"gn3DpLUdPeZh6LHeOxKLhF2ZMKFUZSx0GfDbfz6hEZ1TbsLfAozzAEkGgIAXpM5tsrVEJZbiMQxuwvd2uAEnDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-07T08:19:58.066804Z"},"content_sha256":"6df9e2ecba1f157fb0a364efb49fcfc93e6fe37ef10c24a1cf0fe4ca900bebfe","schema_version":"1.0","event_id":"sha256:6df9e2ecba1f157fb0a364efb49fcfc93e6fe37ef10c24a1cf0fe4ca900bebfe"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/bundle.json","state_url":"https://pith.science/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-07T08:19:58Z","links":{"resolver":"https://pith.science/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV","bundle":"https://pith.science/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/bundle.json","state":"https://pith.science/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/state.json","well_known_bundle":"https://pith.science/.well-known/pith/Z43LXKWPAMDLOHNY4PQIQY6JLV/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:Z43LXKWPAMDLOHNY4PQIQY6JLV","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"50e911934cfb9d76dc0b2679b68867559464df43c129533a94dbdd78c07fee9c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-10T16:21:31Z","title_canon_sha256":"1367a8f9dfe7deeb7b6cda9fc40c07ae986d30178b072d47d5f2fd1ecdc94c61"},"schema_version":"1.0","source":{"id":"2605.11021","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.11021","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"arxiv_version","alias_value":"2605.11021v2","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.11021","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_12","alias_value":"Z43LXKWPAMDL","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_16","alias_value":"Z43LXKWPAMDLOHNY","created_at":"2026-05-20T01:05:16Z"},{"alias_kind":"pith_short_8","alias_value":"Z43LXKWP","created_at":"2026-05-20T01:05:16Z"}],"graph_snapshots":[{"event_id":"sha256:6df9e2ecba1f157fb0a364efb49fcfc93e6fe37ef10c24a1cf0fe4ca900bebfe","target":"graph","created_at":"2026-05-20T01:05:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"That the mean dynamics of Q-learning with linear function approximation admit an exact representation as a finite set of linear switching modes whose joint spectral radius governs convergence."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Q-learning with linear function approximation is recast as a switched linear system whose mean dynamics converge precisely when the joint spectral radius of the switching matrices is less than one."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence."}],"snapshot_sha256":"a247039adf7c2c82490ccff4e02adeb57ca275eaec16da47124a3be6fb0711bd"},"formal_canon":{"evidence_count":2,"snapshot_sha256":"fa7fc3100520dbfff4d4799d0c1459456edb08313e192ec1c9de9bff4712aadc"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-19T16:38:37.979452Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_title_agreement","ran_at":"2026-05-19T12:31:18.615231Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T10:01:55.864039Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.11021/integrity.json","findings":[],"snapshot_sha256":"d945f3abaec74bf6fcc6b26cb0613bdcf3d7b3efd19ea009b0fc4674ea76b303","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"This paper develops a switching-system interpretation of Q-learning with linear function approximation (LFA) based on the joint spectral radius (JSR). We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system. The same construction is then used for stochastic linear Q-learning with independent and identically distributed (i.i.d.) observations and with Markovian observations. Although exact JSR computation is difficult in general, the certificate captures products of switching modes and can be less conservative than o","authors_text":"Donghwan Lee, Han-Dong Lim","cross_cats":[],"headline":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence.","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-10T16:21:31Z","title":"A Switching System Theory of Q-Learning with Linear Function Approximation"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.11021","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-13T06:10:24.513147Z","id":"4ea7ee26-af9d-4ea6-a95b-6ba0ed2d5db3","model_set":{"reader":"grok-4.3"},"one_line_summary":"Q-learning with linear function approximation is recast as a switched linear system whose mean dynamics converge precisely when the joint spectral radius of the switching matrices is less than one.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"The mean dynamics of Q-learning with linear function approximation are exactly equivalent to a linear switched system whose stability determines convergence.","strongest_claim":"We derive an exact linear switched model for the mean dynamics and relate convergence to stability of the corresponding switched system.","weakest_assumption":"That the mean dynamics of Q-learning with linear function approximation admit an exact representation as a finite set of linear switching modes whose joint spectral radius governs convergence."}},"verdict_id":"4ea7ee26-af9d-4ea6-a95b-6ba0ed2d5db3"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:96cfa87bc83254b015d60f2c05baa266dfc2d5ca093180fe0dc1f6c28b5b6b23","target":"record","created_at":"2026-05-20T01:05:16Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"50e911934cfb9d76dc0b2679b68867559464df43c129533a94dbdd78c07fee9c","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2026-05-10T16:21:31Z","title_canon_sha256":"1367a8f9dfe7deeb7b6cda9fc40c07ae986d30178b072d47d5f2fd1ecdc94c61"},"schema_version":"1.0","source":{"id":"2605.11021","kind":"arxiv","version":2}},"canonical_sha256":"cf36bbaacf0306b71db8e3e08863c95d6d665df4fce51a86f60fe5cac9432b80","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"cf36bbaacf0306b71db8e3e08863c95d6d665df4fce51a86f60fe5cac9432b80","first_computed_at":"2026-05-20T01:05:16.522625Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:05:16.522625Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"e+6q1gk2IbGp7bW84tBBG6n0UsRbAng4Z8QGQwSFubzROvbN66+RDeI749PNkbBQHW2r05tdmZSmKhyzHXElBA==","signature_status":"signed_v1","signed_at":"2026-05-20T01:05:16.523167Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.11021","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:96cfa87bc83254b015d60f2c05baa266dfc2d5ca093180fe0dc1f6c28b5b6b23","sha256:6df9e2ecba1f157fb0a364efb49fcfc93e6fe37ef10c24a1cf0fe4ca900bebfe"],"state_sha256":"21149654361ab4b6c8f3623ee7e9bc05aacbe045396c5e220de4ae032997dcbb"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"Q5Yp2Mi4GrriaeyFdWzibM1QZP8ATMdhDr9PeTL/mu8FHk4jtm1g7P3N7vGNDbKphLz8piRXMJmm73poy53iDA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-07T08:19:58.071181Z","bundle_sha256":"67518f0f0ada21be9f90044c6e1acd34f01ed04a7013292dbe7365615158fe36"}}