{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:IEZ5MUYE3HMDJ4AWN2VXBLIJMZ","short_pith_number":"pith:IEZ5MUYE","canonical_record":{"source":{"id":"1805.06020","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-15T20:15:05Z","cross_cats_sorted":[],"title_canon_sha256":"e3e452104e3d8ab72344156b5d8ca773f209f9daea0135cd903a6d1ba7d6476c","abstract_canon_sha256":"f14a3878a162c6b42351f72281d4577937a4d118d59357ba88ae41f69d2a2a0d"},"schema_version":"1.0"},"canonical_sha256":"4133d65304d9d834f0166eab70ad0966475f3b8e70e16824c6e840753bea4cc1","source":{"kind":"arxiv","id":"1805.06020","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.06020","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"arxiv_version","alias_value":"1805.06020v2","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.06020","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"pith_short_12","alias_value":"IEZ5MUYE3HMD","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"IEZ5MUYE3HMDJ4AW","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"IEZ5MUYE","created_at":"2026-05-18T12:32:28Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:IEZ5MUYE3HMDJ4AWN2VXBLIJMZ","target":"record","payload":{"canonical_record":{"source":{"id":"1805.06020","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-15T20:15:05Z","cross_cats_sorted":[],"title_canon_sha256":"e3e452104e3d8ab72344156b5d8ca773f209f9daea0135cd903a6d1ba7d6476c","abstract_canon_sha256":"f14a3878a162c6b42351f72281d4577937a4d118d59357ba88ae41f69d2a2a0d"},"schema_version":"1.0"},"canonical_sha256":"4133d65304d9d834f0166eab70ad0966475f3b8e70e16824c6e840753bea4cc1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:36.098850Z","signature_b64":"b8i5KT4L+9YcT2JZStHJDI1fhG7/7umb3p0+QxGFkP4udRPG4U54r82CRCpNV+yWDd3rCmfAzS2AtLSFOIH/AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4133d65304d9d834f0166eab70ad0966475f3b8e70e16824c6e840753bea4cc1","last_reissued_at":"2026-05-18T00:15:36.098065Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:36.098065Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1805.06020","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FdG7e3qET3HBQaXsa2chOfn4AtTEWEwRsrWoEHWO32fkyp3uSzmzpq7oRnCxAZkw8fhUokSMnxMYtrakBrLLBw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T23:09:31.427156Z"},"content_sha256":"bd7a705b72b5228f0455e618edba21f91a38e1bf7d00318c5b8f79f08b436b8c","schema_version":"1.0","event_id":"sha256:bd7a705b72b5228f0455e618edba21f91a38e1bf7d00318c5b8f79f08b436b8c"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:IEZ5MUYE3HMDJ4AWN2VXBLIJMZ","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Do deep reinforcement learning agents model intentions?","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Aqeel Labash, Daniel Majoral, Jaan Aru, Raul Vicente, Tambet Matiisen","submitted_at":"2018-05-15T20:15:05Z","abstract_excerpt":"Inferring other agents' mental states such as their knowledge, beliefs and intentions is thought to be essential for effective interactions with other agents. Recently, multiagent systems trained via deep reinforcement learning have been shown to succeed in solving different tasks, but it remains unclear how each agent modeled or represented other agents in their environment. In this work we test whether deep reinforcement learning agents explicitly represent other agents' intentions (their specific aims or goals) during a task in which the agents had to coordinate the covering of different sp"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.06020","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:36Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"5/vF1DzwKqvsafecYKos3yOYBdzZuuMYW3NMRtJLGv1o9h1YDGpz2mxBMCP8YTZH/TksqpfiBoDS8W2rDj5BBg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T23:09:31.427615Z"},"content_sha256":"cb7a83d102e675294b4defbe794481a0425e1190f3564d788496334746ddf80e","schema_version":"1.0","event_id":"sha256:cb7a83d102e675294b4defbe794481a0425e1190f3564d788496334746ddf80e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/bundle.json","state_url":"https://pith.science/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T23:09:31Z","links":{"resolver":"https://pith.science/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ","bundle":"https://pith.science/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/bundle.json","state":"https://pith.science/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/state.json","well_known_bundle":"https://pith.science/.well-known/pith/IEZ5MUYE3HMDJ4AWN2VXBLIJMZ/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:IEZ5MUYE3HMDJ4AWN2VXBLIJMZ","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"f14a3878a162c6b42351f72281d4577937a4d118d59357ba88ae41f69d2a2a0d","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-15T20:15:05Z","title_canon_sha256":"e3e452104e3d8ab72344156b5d8ca773f209f9daea0135cd903a6d1ba7d6476c"},"schema_version":"1.0","source":{"id":"1805.06020","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.06020","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"arxiv_version","alias_value":"1805.06020v2","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.06020","created_at":"2026-05-18T00:15:36Z"},{"alias_kind":"pith_short_12","alias_value":"IEZ5MUYE3HMD","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_16","alias_value":"IEZ5MUYE3HMDJ4AW","created_at":"2026-05-18T12:32:28Z"},{"alias_kind":"pith_short_8","alias_value":"IEZ5MUYE","created_at":"2026-05-18T12:32:28Z"}],"graph_snapshots":[{"event_id":"sha256:cb7a83d102e675294b4defbe794481a0425e1190f3564d788496334746ddf80e","target":"graph","created_at":"2026-05-18T00:15:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Inferring other agents' mental states such as their knowledge, beliefs and intentions is thought to be essential for effective interactions with other agents. Recently, multiagent systems trained via deep reinforcement learning have been shown to succeed in solving different tasks, but it remains unclear how each agent modeled or represented other agents in their environment. In this work we test whether deep reinforcement learning agents explicitly represent other agents' intentions (their specific aims or goals) during a task in which the agents had to coordinate the covering of different sp","authors_text":"Aqeel Labash, Daniel Majoral, Jaan Aru, Raul Vicente, Tambet Matiisen","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-15T20:15:05Z","title":"Do deep reinforcement learning agents model intentions?"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.06020","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:bd7a705b72b5228f0455e618edba21f91a38e1bf7d00318c5b8f79f08b436b8c","target":"record","created_at":"2026-05-18T00:15:36Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"f14a3878a162c6b42351f72281d4577937a4d118d59357ba88ae41f69d2a2a0d","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2018-05-15T20:15:05Z","title_canon_sha256":"e3e452104e3d8ab72344156b5d8ca773f209f9daea0135cd903a6d1ba7d6476c"},"schema_version":"1.0","source":{"id":"1805.06020","kind":"arxiv","version":2}},"canonical_sha256":"4133d65304d9d834f0166eab70ad0966475f3b8e70e16824c6e840753bea4cc1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4133d65304d9d834f0166eab70ad0966475f3b8e70e16824c6e840753bea4cc1","first_computed_at":"2026-05-18T00:15:36.098065Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:36.098065Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"b8i5KT4L+9YcT2JZStHJDI1fhG7/7umb3p0+QxGFkP4udRPG4U54r82CRCpNV+yWDd3rCmfAzS2AtLSFOIH/AA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:36.098850Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.06020","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:bd7a705b72b5228f0455e618edba21f91a38e1bf7d00318c5b8f79f08b436b8c","sha256:cb7a83d102e675294b4defbe794481a0425e1190f3564d788496334746ddf80e"],"state_sha256":"61e8a85f2f312d4a99640712dabb74600f4321c6a6f87c8ec720befb597baa47"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RT8lFU8LcpXJY51DYWayl3rfKURP8bFPzntbJ7OhRJK7J8D31QSKsCGg9gcRoyuSf44OZYdPJiuycNUiH6khAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T23:09:31.431086Z","bundle_sha256":"87be02743ac934a74e52b63e101eacdf7dfe690c7435754d6ecbd688c40bdbfa"}}