{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2016:4OMAO5DMTGY2YUSUEO6GSMCTN4","short_pith_number":"pith:4OMAO5DM","canonical_record":{"source":{"id":"1611.08666","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-26T06:25:08Z","cross_cats_sorted":["cs.AI","cs.RO"],"title_canon_sha256":"ff440039ed5631300a2a881f52399208f4e8f2604dd804d6308b0d1173e92f5d","abstract_canon_sha256":"31fab59f8e11c8d3d4d5b91053471a7feaa33a8618c1bf7282ead1c63cb1247e"},"schema_version":"1.0"},"canonical_sha256":"e39807746c99b1ac525423bc6930536f1d393cf51fe5977715cd9c23245896dc","source":{"kind":"arxiv","id":"1611.08666","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.08666","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"arxiv_version","alias_value":"1611.08666v1","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.08666","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"pith_short_12","alias_value":"4OMAO5DMTGY2","created_at":"2026-05-18T12:29:58Z"},{"alias_kind":"pith_short_16","alias_value":"4OMAO5DMTGY2YUSU","created_at":"2026-05-18T12:29:58Z"},{"alias_kind":"pith_short_8","alias_value":"4OMAO5DM","created_at":"2026-05-18T12:29:58Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2016:4OMAO5DMTGY2YUSUEO6GSMCTN4","target":"record","payload":{"canonical_record":{"source":{"id":"1611.08666","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-26T06:25:08Z","cross_cats_sorted":["cs.AI","cs.RO"],"title_canon_sha256":"ff440039ed5631300a2a881f52399208f4e8f2604dd804d6308b0d1173e92f5d","abstract_canon_sha256":"31fab59f8e11c8d3d4d5b91053471a7feaa33a8618c1bf7282ead1c63cb1247e"},"schema_version":"1.0"},"canonical_sha256":"e39807746c99b1ac525423bc6930536f1d393cf51fe5977715cd9c23245896dc","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:56:37.174773Z","signature_b64":"tbn0lShVKRq66DM/80cZGvfqgs4MG8q3kWYXuwq6L1A6WfhS5Blkz0S92fHkqRZZbbpEIC7PgyGdV+BqB80sCw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"e39807746c99b1ac525423bc6930536f1d393cf51fe5977715cd9c23245896dc","last_reissued_at":"2026-05-18T00:56:37.174086Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:56:37.174086Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1611.08666","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:56:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"OMQgi2KVznmV7oznO6qyW5VPXOrfx/eyCrYRRsBHRHGX0k5FMZXMQDpJT7SdZChCcwray2rwHeAYHaK1wI0zDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T21:15:51.322947Z"},"content_sha256":"32403388fc4ddc21c8556dcddb597d54f1da463491772f4a24a06675b320ece4","schema_version":"1.0","event_id":"sha256:32403388fc4ddc21c8556dcddb597d54f1da463491772f4a24a06675b320ece4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2016:4OMAO5DMTGY2YUSUEO6GSMCTN4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Training an Interactive Humanoid Robot Using Multimodal Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.RO"],"primary_cat":"cs.LG","authors_text":"Cl\\'ement Olalainty, Guillaume Couly, Heriberto Cuay\\'ahuitl","submitted_at":"2016-11-26T06:25:08Z","abstract_excerpt":"Training robots to perceive, act and communicate using multiple modalities still represents a challenging problem, particularly if robots are expected to learn efficiently from small sets of example interactions. We describe a learning approach as a step in this direction, where we teach a humanoid robot how to play the game of noughts and crosses. Given that multiple multimodal skills can be trained to play this game, we focus our attention to training the robot to perceive the game, and to interact in this game. Our multimodal deep reinforcement learning agent perceives multimodal features a"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.08666","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:56:37Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8xcqg6he1rvLurMTb+/8BhAoOZFtxMtRxmGb9yCrYbRGYkf0CGQQxoRcT7PpGlJOQHlsUMYnPU8SiPd5LvbhAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-10T21:15:51.323524Z"},"content_sha256":"b81299a8a051d58307751208970c83680a614c73fc9048f2470238a8fecdb6c1","schema_version":"1.0","event_id":"sha256:b81299a8a051d58307751208970c83680a614c73fc9048f2470238a8fecdb6c1"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/bundle.json","state_url":"https://pith.science/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-10T21:15:51Z","links":{"resolver":"https://pith.science/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4","bundle":"https://pith.science/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/bundle.json","state":"https://pith.science/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/4OMAO5DMTGY2YUSUEO6GSMCTN4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2016:4OMAO5DMTGY2YUSUEO6GSMCTN4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"31fab59f8e11c8d3d4d5b91053471a7feaa33a8618c1bf7282ead1c63cb1247e","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-26T06:25:08Z","title_canon_sha256":"ff440039ed5631300a2a881f52399208f4e8f2604dd804d6308b0d1173e92f5d"},"schema_version":"1.0","source":{"id":"1611.08666","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1611.08666","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"arxiv_version","alias_value":"1611.08666v1","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1611.08666","created_at":"2026-05-18T00:56:37Z"},{"alias_kind":"pith_short_12","alias_value":"4OMAO5DMTGY2","created_at":"2026-05-18T12:29:58Z"},{"alias_kind":"pith_short_16","alias_value":"4OMAO5DMTGY2YUSU","created_at":"2026-05-18T12:29:58Z"},{"alias_kind":"pith_short_8","alias_value":"4OMAO5DM","created_at":"2026-05-18T12:29:58Z"}],"graph_snapshots":[{"event_id":"sha256:b81299a8a051d58307751208970c83680a614c73fc9048f2470238a8fecdb6c1","target":"graph","created_at":"2026-05-18T00:56:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Training robots to perceive, act and communicate using multiple modalities still represents a challenging problem, particularly if robots are expected to learn efficiently from small sets of example interactions. We describe a learning approach as a step in this direction, where we teach a humanoid robot how to play the game of noughts and crosses. Given that multiple multimodal skills can be trained to play this game, we focus our attention to training the robot to perceive the game, and to interact in this game. Our multimodal deep reinforcement learning agent perceives multimodal features a","authors_text":"Cl\\'ement Olalainty, Guillaume Couly, Heriberto Cuay\\'ahuitl","cross_cats":["cs.AI","cs.RO"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-26T06:25:08Z","title":"Training an Interactive Humanoid Robot Using Multimodal Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1611.08666","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:32403388fc4ddc21c8556dcddb597d54f1da463491772f4a24a06675b320ece4","target":"record","created_at":"2026-05-18T00:56:37Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"31fab59f8e11c8d3d4d5b91053471a7feaa33a8618c1bf7282ead1c63cb1247e","cross_cats_sorted":["cs.AI","cs.RO"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2016-11-26T06:25:08Z","title_canon_sha256":"ff440039ed5631300a2a881f52399208f4e8f2604dd804d6308b0d1173e92f5d"},"schema_version":"1.0","source":{"id":"1611.08666","kind":"arxiv","version":1}},"canonical_sha256":"e39807746c99b1ac525423bc6930536f1d393cf51fe5977715cd9c23245896dc","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"e39807746c99b1ac525423bc6930536f1d393cf51fe5977715cd9c23245896dc","first_computed_at":"2026-05-18T00:56:37.174086Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:56:37.174086Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"tbn0lShVKRq66DM/80cZGvfqgs4MG8q3kWYXuwq6L1A6WfhS5Blkz0S92fHkqRZZbbpEIC7PgyGdV+BqB80sCw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:56:37.174773Z","signed_message":"canonical_sha256_bytes"},"source_id":"1611.08666","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:32403388fc4ddc21c8556dcddb597d54f1da463491772f4a24a06675b320ece4","sha256:b81299a8a051d58307751208970c83680a614c73fc9048f2470238a8fecdb6c1"],"state_sha256":"883fa6ba980bae37b56eb4b44b5c15f48c4da4fd01c3d3ed2df7850175e7467b"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"xvS6DJLHUkpuPDQry5ALEfBtHzTT+TzYv7ikxyq+QqNzu4IJPEfeq54pHuFzV2jHsCDVJvxQjRemSpVKd0eyBA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-10T21:15:51.325792Z","bundle_sha256":"ff89bac00d7b3d6fb2a34f485b64b0f0174cf4b4f7cb5a5860f9a22fbb8e743c"}}