{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:CGT4MQZA2QP5KCC3G25ZL3TG2T","short_pith_number":"pith:CGT4MQZA","canonical_record":{"source":{"id":"1810.05762","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-12T23:48:09Z","cross_cats_sorted":[],"title_canon_sha256":"99974912b39c93d62ea6f510e07214628408608f97dbde0e63ebd4b49ab6a652","abstract_canon_sha256":"a2e22d2eed588259ed2aedaf9678e082f8758e4c908c8236126be495f95a955b"},"schema_version":"1.0"},"canonical_sha256":"11a7c64320d41fd5085b36bb95ee66d4c87fb745dccd7409ea15f7528707eb88","source":{"kind":"arxiv","id":"1810.05762","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.05762","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"arxiv_version","alias_value":"1810.05762v2","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.05762","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"pith_short_12","alias_value":"CGT4MQZA2QP5","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"CGT4MQZA2QP5KCC3","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"CGT4MQZA","created_at":"2026-05-18T12:32:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:CGT4MQZA2QP5KCC3G25ZL3TG2T","target":"record","payload":{"canonical_record":{"source":{"id":"1810.05762","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-12T23:48:09Z","cross_cats_sorted":[],"title_canon_sha256":"99974912b39c93d62ea6f510e07214628408608f97dbde0e63ebd4b49ab6a652","abstract_canon_sha256":"a2e22d2eed588259ed2aedaf9678e082f8758e4c908c8236126be495f95a955b"},"schema_version":"1.0"},"canonical_sha256":"11a7c64320d41fd5085b36bb95ee66d4c87fb745dccd7409ea15f7528707eb88","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:02:24.601937Z","signature_b64":"LZ+jqFGkYawcFpCGWs0XncL6i6vdZxre1leecxq1PBJTVkHmaA8UbPVN+UrGV5Yj8WrB0BUP10zUwDEAB4Q+DQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"11a7c64320d41fd5085b36bb95ee66d4c87fb745dccd7409ea15f7528707eb88","last_reissued_at":"2026-05-18T00:02:24.601263Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:02:24.601263Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1810.05762","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"6O+yoYAXu2UMxUql3h6oCPDsxok3DIw6DwnGpL6Lxy9AdHz7LhZsWcZ8Q6a6TrZrvoF27mjwOLhB7e4TrFHaCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T02:41:49.721894Z"},"content_sha256":"8e96ce103a47f7651789a2a5a7d62a2cb6879024ce568e44ef600e8ccaa13ee4","schema_version":"1.0","event_id":"sha256:8e96ce103a47f7651789a2a5a7d62a2cb6879024ce568e44ef600e8ccaa13ee4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:CGT4MQZA2QP5KCC3G25ZL3TG2T","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"GPU-Accelerated Robotic Simulation for Distributed Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.RO","authors_text":"Ankur Handa, Dieter Fox, Jacky Liang, Miles Macklin, Nuttapong Chentanez, Viktor Makoviychuk","submitted_at":"2018-10-12T23:48:09Z","abstract_excerpt":"Most Deep Reinforcement Learning (Deep RL) algorithms require a prohibitively large number of training samples for learning complex tasks. Many recent works on speeding up Deep RL have focused on distributed training and simulation. While distributed training is often done on the GPU, simulation is not. In this work, we propose using GPU-accelerated RL simulations as an alternative to CPU ones. Using NVIDIA Flex, a GPU-based physics engine, we show promising speed-ups of learning various continuous-control, locomotion tasks. With one GPU and CPU core, we are able to train the Humanoid running "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.05762","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:02:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"bFPia0symxzANw3nyh5yKmJnNnMPmprCVETvVR4jyuxEsGgZYQYBD0//R8aj6YbzVWgOdbxBNUD4p+R0xn/SAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T02:41:49.722618Z"},"content_sha256":"f90efa6960a0f88acb8482fdb8a2cde8549fb8d1b556cf961bf8e676704e7178","schema_version":"1.0","event_id":"sha256:f90efa6960a0f88acb8482fdb8a2cde8549fb8d1b556cf961bf8e676704e7178"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/bundle.json","state_url":"https://pith.science/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T02:41:49Z","links":{"resolver":"https://pith.science/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T","bundle":"https://pith.science/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/bundle.json","state":"https://pith.science/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CGT4MQZA2QP5KCC3G25ZL3TG2T/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:CGT4MQZA2QP5KCC3G25ZL3TG2T","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"a2e22d2eed588259ed2aedaf9678e082f8758e4c908c8236126be495f95a955b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-12T23:48:09Z","title_canon_sha256":"99974912b39c93d62ea6f510e07214628408608f97dbde0e63ebd4b49ab6a652"},"schema_version":"1.0","source":{"id":"1810.05762","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1810.05762","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"arxiv_version","alias_value":"1810.05762v2","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1810.05762","created_at":"2026-05-18T00:02:24Z"},{"alias_kind":"pith_short_12","alias_value":"CGT4MQZA2QP5","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"CGT4MQZA2QP5KCC3","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"CGT4MQZA","created_at":"2026-05-18T12:32:16Z"}],"graph_snapshots":[{"event_id":"sha256:f90efa6960a0f88acb8482fdb8a2cde8549fb8d1b556cf961bf8e676704e7178","target":"graph","created_at":"2026-05-18T00:02:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Most Deep Reinforcement Learning (Deep RL) algorithms require a prohibitively large number of training samples for learning complex tasks. Many recent works on speeding up Deep RL have focused on distributed training and simulation. While distributed training is often done on the GPU, simulation is not. In this work, we propose using GPU-accelerated RL simulations as an alternative to CPU ones. Using NVIDIA Flex, a GPU-based physics engine, we show promising speed-ups of learning various continuous-control, locomotion tasks. With one GPU and CPU core, we are able to train the Humanoid running ","authors_text":"Ankur Handa, Dieter Fox, Jacky Liang, Miles Macklin, Nuttapong Chentanez, Viktor Makoviychuk","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-12T23:48:09Z","title":"GPU-Accelerated Robotic Simulation for Distributed Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1810.05762","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:8e96ce103a47f7651789a2a5a7d62a2cb6879024ce568e44ef600e8ccaa13ee4","target":"record","created_at":"2026-05-18T00:02:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"a2e22d2eed588259ed2aedaf9678e082f8758e4c908c8236126be495f95a955b","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-10-12T23:48:09Z","title_canon_sha256":"99974912b39c93d62ea6f510e07214628408608f97dbde0e63ebd4b49ab6a652"},"schema_version":"1.0","source":{"id":"1810.05762","kind":"arxiv","version":2}},"canonical_sha256":"11a7c64320d41fd5085b36bb95ee66d4c87fb745dccd7409ea15f7528707eb88","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"11a7c64320d41fd5085b36bb95ee66d4c87fb745dccd7409ea15f7528707eb88","first_computed_at":"2026-05-18T00:02:24.601263Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:02:24.601263Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"LZ+jqFGkYawcFpCGWs0XncL6i6vdZxre1leecxq1PBJTVkHmaA8UbPVN+UrGV5Yj8WrB0BUP10zUwDEAB4Q+DQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:02:24.601937Z","signed_message":"canonical_sha256_bytes"},"source_id":"1810.05762","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:8e96ce103a47f7651789a2a5a7d62a2cb6879024ce568e44ef600e8ccaa13ee4","sha256:f90efa6960a0f88acb8482fdb8a2cde8549fb8d1b556cf961bf8e676704e7178"],"state_sha256":"ae76abf5c389437dd75dfda9f93c6eaab5b3bdb1a11bf6c80945b5f3c0c147c3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"v5iPQOUYd4ppRVtmY1w/jXr2lS1t4GJqPcgXem2glCbqL/CER+pmMGzot9F/dWXYHuemvRmqV/DzFEivb1gYAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T02:41:49.726487Z","bundle_sha256":"240b826b0da378d721362410c940b99103c872b91e5036b5fa414a3dd60d64c4"}}