{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:CQ3BKGTDLUN4BXO7XILEQPMECW","short_pith_number":"pith:CQ3BKGTD","canonical_record":{"source":{"id":"1804.10332","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-04-27T03:42:55Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"99b1a8dedf87a7ad7589b1f49a45befdc58caad26c3d5872955939448777fdd1","abstract_canon_sha256":"99f3d7b91b95a3eb0cb59e80ede37584a5e8d18ae880e90b1e0af6a16261cce2"},"schema_version":"1.0"},"canonical_sha256":"1436151a635d1bc0dddfba16483d8415811ce85e3ae8887bf364a0f6864ed474","source":{"kind":"arxiv","id":"1804.10332","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.10332","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"arxiv_version","alias_value":"1804.10332v2","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.10332","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"pith_short_12","alias_value":"CQ3BKGTDLUN4","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"CQ3BKGTDLUN4BXO7","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"CQ3BKGTD","created_at":"2026-05-18T12:32:16Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:CQ3BKGTDLUN4BXO7XILEQPMECW","target":"record","payload":{"canonical_record":{"source":{"id":"1804.10332","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-04-27T03:42:55Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"99b1a8dedf87a7ad7589b1f49a45befdc58caad26c3d5872955939448777fdd1","abstract_canon_sha256":"99f3d7b91b95a3eb0cb59e80ede37584a5e8d18ae880e90b1e0af6a16261cce2"},"schema_version":"1.0"},"canonical_sha256":"1436151a635d1bc0dddfba16483d8415811ce85e3ae8887bf364a0f6864ed474","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:15:46.341017Z","signature_b64":"l01ZXoaOGfkdkALL2BS2K39AzKVfBUiTOL2NRtymxEFF2DxECZOby3f40UuW10cyxBTd+PCAx1ovnm3wJlOyAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1436151a635d1bc0dddfba16483d8415811ce85e3ae8887bf364a0f6864ed474","last_reissued_at":"2026-05-18T00:15:46.340345Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:15:46.340345Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1804.10332","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:46Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"uTflziXhroagNILLIBx6MbbdS6PV0JHq8QHi3o9F4zh51+zyZYnznsAn/NzUroEiry/NdYVEgYualVOWLX3ADw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T16:31:33.444991Z"},"content_sha256":"338126a296c30f7ecdd4060dbc776eb65cfce2f207e69963cadd83605c41af1d","schema_version":"1.0","event_id":"sha256:338126a296c30f7ecdd4060dbc776eb65cfce2f207e69963cadd83605c41af1d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:CQ3BKGTDLUN4BXO7XILEQPMECW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sim-to-Real: Learning Agile Locomotion For Quadruped Robots","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.RO","authors_text":"Atil Iscen, Danijar Hafner, Erwin Coumans, Jie Tan, Steven Bohez, Tingnan Zhang, Vincent Vanhoucke, Yunfei Bai","submitted_at":"2018-04-27T03:42:55Z","abstract_excerpt":"Designing agile locomotion for quadruped robots often requires extensive expertise and tedious manual tuning. In this paper, we present a system to automate this process by leveraging deep reinforcement learning techniques. Our system can learn quadruped locomotion from scratch using simple reward signals. In addition, users can provide an open loop reference to guide the learning process when more control over the learned gait is needed. The control policies are learned in a physics simulator and then deployed on real robots. In robotics, policies trained in simulation often do not transfer t"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.10332","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:15:46Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"qcNQ42p9GnlfhLDUY7cADqFTU/FYN2hUcG2ngW15F7dENi+uhRpRI7lYKiXy0TsT7E7Sz6xmrLFQn3c6j0X7Cw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-28T16:31:33.445663Z"},"content_sha256":"dc6cd3aec614326bff3f8f200190bb89bc3a8fb0856e8fbc9063e8385e083588","schema_version":"1.0","event_id":"sha256:dc6cd3aec614326bff3f8f200190bb89bc3a8fb0856e8fbc9063e8385e083588"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/bundle.json","state_url":"https://pith.science/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-28T16:31:33Z","links":{"resolver":"https://pith.science/pith/CQ3BKGTDLUN4BXO7XILEQPMECW","bundle":"https://pith.science/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/bundle.json","state":"https://pith.science/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/CQ3BKGTDLUN4BXO7XILEQPMECW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:CQ3BKGTDLUN4BXO7XILEQPMECW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"99f3d7b91b95a3eb0cb59e80ede37584a5e8d18ae880e90b1e0af6a16261cce2","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-04-27T03:42:55Z","title_canon_sha256":"99b1a8dedf87a7ad7589b1f49a45befdc58caad26c3d5872955939448777fdd1"},"schema_version":"1.0","source":{"id":"1804.10332","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1804.10332","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"arxiv_version","alias_value":"1804.10332v2","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1804.10332","created_at":"2026-05-18T00:15:46Z"},{"alias_kind":"pith_short_12","alias_value":"CQ3BKGTDLUN4","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_16","alias_value":"CQ3BKGTDLUN4BXO7","created_at":"2026-05-18T12:32:16Z"},{"alias_kind":"pith_short_8","alias_value":"CQ3BKGTD","created_at":"2026-05-18T12:32:16Z"}],"graph_snapshots":[{"event_id":"sha256:dc6cd3aec614326bff3f8f200190bb89bc3a8fb0856e8fbc9063e8385e083588","target":"graph","created_at":"2026-05-18T00:15:46Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Designing agile locomotion for quadruped robots often requires extensive expertise and tedious manual tuning. In this paper, we present a system to automate this process by leveraging deep reinforcement learning techniques. Our system can learn quadruped locomotion from scratch using simple reward signals. In addition, users can provide an open loop reference to guide the learning process when more control over the learned gait is needed. The control policies are learned in a physics simulator and then deployed on real robots. In robotics, policies trained in simulation often do not transfer t","authors_text":"Atil Iscen, Danijar Hafner, Erwin Coumans, Jie Tan, Steven Bohez, Tingnan Zhang, Vincent Vanhoucke, Yunfei Bai","cross_cats":["cs.AI"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-04-27T03:42:55Z","title":"Sim-to-Real: Learning Agile Locomotion For Quadruped Robots"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1804.10332","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:338126a296c30f7ecdd4060dbc776eb65cfce2f207e69963cadd83605c41af1d","target":"record","created_at":"2026-05-18T00:15:46Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"99f3d7b91b95a3eb0cb59e80ede37584a5e8d18ae880e90b1e0af6a16261cce2","cross_cats_sorted":["cs.AI"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-04-27T03:42:55Z","title_canon_sha256":"99b1a8dedf87a7ad7589b1f49a45befdc58caad26c3d5872955939448777fdd1"},"schema_version":"1.0","source":{"id":"1804.10332","kind":"arxiv","version":2}},"canonical_sha256":"1436151a635d1bc0dddfba16483d8415811ce85e3ae8887bf364a0f6864ed474","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1436151a635d1bc0dddfba16483d8415811ce85e3ae8887bf364a0f6864ed474","first_computed_at":"2026-05-18T00:15:46.340345Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:15:46.340345Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"l01ZXoaOGfkdkALL2BS2K39AzKVfBUiTOL2NRtymxEFF2DxECZOby3f40UuW10cyxBTd+PCAx1ovnm3wJlOyAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:15:46.341017Z","signed_message":"canonical_sha256_bytes"},"source_id":"1804.10332","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:338126a296c30f7ecdd4060dbc776eb65cfce2f207e69963cadd83605c41af1d","sha256:dc6cd3aec614326bff3f8f200190bb89bc3a8fb0856e8fbc9063e8385e083588"],"state_sha256":"5a816e45283148e8f6b433952196f40ec7d2065f06ffd084ea5053e24339f7b5"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"X5U31Es+NtkAvGxYW1kud6wLF3ncuL/7fMHvIhVJmNAAq1dbEco+Ptl0IKLNjIQV0OwYkU2LNEt/778ipgWHCw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-28T16:31:33.448415Z","bundle_sha256":"0a0417858f354cdc784bc4bc10e81b92957708ad850a13f2ae93a8109174b510"}}