{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:L3NEF557LERCRR2XQTV2BZNUIX","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"d0c921b202f2c21575d4c14c774ce69539d3cbabd7d560b66f5b36c9a46108ee","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"physics.flu-dyn","submitted_at":"2026-06-04T14:36:14Z","title_canon_sha256":"c877e4043c98b530ca47cd28db6f1ed934aac6af4e74799e88a6a673b1cf8e8c"},"schema_version":"1.0","source":{"id":"2606.06227","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.06227","created_at":"2026-06-05T01:15:38Z"},{"alias_kind":"arxiv_version","alias_value":"2606.06227v1","created_at":"2026-06-05T01:15:38Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.06227","created_at":"2026-06-05T01:15:38Z"},{"alias_kind":"pith_short_12","alias_value":"L3NEF557LERC","created_at":"2026-06-05T01:15:38Z"},{"alias_kind":"pith_short_16","alias_value":"L3NEF557LERCRR2X","created_at":"2026-06-05T01:15:38Z"},{"alias_kind":"pith_short_8","alias_value":"L3NEF557","created_at":"2026-06-05T01:15:38Z"}],"graph_snapshots":[{"event_id":"sha256:02d8e1429d88a19430519301012405eff6e199cf84610e75e36c8d92f6c82e4f","target":"graph","created_at":"2026-06-05T01:15:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.06227/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"A reinforcement-learning agent maximises its reward, which can diverge from the outcome its designer intended. In physical control the reward rarely closes that gap, and drag reduction in wall turbulence makes it concrete. A mass-conservation projection couples agents' outputs and erases the per-agent credit the policy gradient needs; a memoryless policy cannot resolve the slow near-wall cycle it acts on; and a pressure-gradient reward pays for nominal drag reduction by pumping power through the wall. Two degenerate controllers achieve large drag reductions while total dissipation rises, so th","authors_text":"Alfredo Pinelli, Giorgio Maria Cavallazzi, Miguel P\\'erez-Cuadrado","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"physics.flu-dyn","submitted_at":"2026-06-04T14:36:14Z","title":"Drag reduction or reward hacking? Recurrent multi-agent reinforcement learning that earns its reward"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.06227","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:b054e1beef895862a1402ed2514f60907188fab366e83e498b4d2d4b7c2d85e4","target":"record","created_at":"2026-06-05T01:15:38Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"d0c921b202f2c21575d4c14c774ce69539d3cbabd7d560b66f5b36c9a46108ee","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"physics.flu-dyn","submitted_at":"2026-06-04T14:36:14Z","title_canon_sha256":"c877e4043c98b530ca47cd28db6f1ed934aac6af4e74799e88a6a673b1cf8e8c"},"schema_version":"1.0","source":{"id":"2606.06227","kind":"arxiv","version":1}},"canonical_sha256":"5eda42f7bf592228c75784eba0e5b445c8f3b4979c384fa4bf8cad5e20756a6e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"5eda42f7bf592228c75784eba0e5b445c8f3b4979c384fa4bf8cad5e20756a6e","first_computed_at":"2026-06-05T01:15:38.545643Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-05T01:15:38.545643Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"h/lRL/Wz0xiHgTxnalqYxHo+rMqbK1BmYrC/8qjnzEoEyyRFxrbrZayaLfytj1WvHmj1d3Ct3oFmU84AOPznAQ==","signature_status":"signed_v1","signed_at":"2026-06-05T01:15:38.546134Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.06227","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:b054e1beef895862a1402ed2514f60907188fab366e83e498b4d2d4b7c2d85e4","sha256:02d8e1429d88a19430519301012405eff6e199cf84610e75e36c8d92f6c82e4f"],"state_sha256":"edcfc2f3fa0a965b0361a5fcbe30efea2de1ddd7bbb07749cd94b925a8d45144"}