{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:5U4RO7WOTWEPZINNWPAJ6DQ5LY","short_pith_number":"pith:5U4RO7WO","canonical_record":{"source":{"id":"1811.04624","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-11-12T09:44:50Z","cross_cats_sorted":["cs.LG","cs.NE"],"title_canon_sha256":"797118ad1fc9163f26a26cd87e2fb33547df17e1ec22d27e66a201625ab5039b","abstract_canon_sha256":"7b85fbef4d6fe0b3b5827bb5297cb62cca87e2793c84a4f465e055d18e34b111"},"schema_version":"1.0"},"canonical_sha256":"ed39177ece9d88fca1adb3c09f0e1d5e165591a9600eda433cdb6ee1e9dbf78d","source":{"kind":"arxiv","id":"1811.04624","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.04624","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"arxiv_version","alias_value":"1811.04624v1","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.04624","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"pith_short_12","alias_value":"5U4RO7WOTWEP","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"5U4RO7WOTWEPZINN","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"5U4RO7WO","created_at":"2026-05-18T12:32:08Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:5U4RO7WOTWEPZINNWPAJ6DQ5LY","target":"record","payload":{"canonical_record":{"source":{"id":"1811.04624","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-11-12T09:44:50Z","cross_cats_sorted":["cs.LG","cs.NE"],"title_canon_sha256":"797118ad1fc9163f26a26cd87e2fb33547df17e1ec22d27e66a201625ab5039b","abstract_canon_sha256":"7b85fbef4d6fe0b3b5827bb5297cb62cca87e2793c84a4f465e055d18e34b111"},"schema_version":"1.0"},"canonical_sha256":"ed39177ece9d88fca1adb3c09f0e1d5e165591a9600eda433cdb6ee1e9dbf78d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:04.552002Z","signature_b64":"3jb4ww9eb2STJWdeH/Z1Kv4DCP0zhJjYBC+iM4BqJQe5YbuTKGnrlTHzQGfg0D71a53MZ8mw/lxirAj1Jz16AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"ed39177ece9d88fca1adb3c09f0e1d5e165591a9600eda433cdb6ee1e9dbf78d","last_reissued_at":"2026-05-18T00:01:04.551397Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:04.551397Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1811.04624","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ArtQkJrVr70tC1jANQoOJ9f5gwFBT7/GCkDVz9aB1aoKIH70lRI1L/ux/wxuqUoAMG2HmMNv49ZqBEQ0xOBdAw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T20:32:12.121887Z"},"content_sha256":"c5146434340f12dfae0b1c794626e58bd2718a18c24bb0e40ad0e812645b89c7","schema_version":"1.0","event_id":"sha256:c5146434340f12dfae0b1c794626e58bd2718a18c24bb0e40ad0e812645b89c7"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:5U4RO7WOTWEPZINNWPAJ6DQ5LY","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Importance Weighted Evolution Strategies","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.LG","cs.NE"],"primary_cat":"stat.ML","authors_text":"Jordi Torres, V\\'ictor Campos, Xavier Giro-i-Nieto","submitted_at":"2018-11-12T09:44:50Z","abstract_excerpt":"Evolution Strategies (ES) emerged as a scalable alternative to popular Reinforcement Learning (RL) techniques, providing an almost perfect speedup when distributed across hundreds of CPU cores thanks to a reduced communication overhead. Despite providing large improvements in wall-clock time, ES is data inefficient when compared to competing RL methods. One of the main causes of such inefficiency is the collection of large batches of experience, which are discarded after each policy update. In this work, we study how to perform more than one update per batch of experience by means of Importanc"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.04624","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:04Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"WCVgsg7Ub3+MNojURelbfDI3VpTcq29qVAnmcV99Q9cNVny1gkc1puuabx2rmPqGjG7lKIsFj1ehDue5/dXwCQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-03T20:32:12.122224Z"},"content_sha256":"12338a6119bcd40e11c8febbab598e963566a6990616f31c9e7fe7cd48693548","schema_version":"1.0","event_id":"sha256:12338a6119bcd40e11c8febbab598e963566a6990616f31c9e7fe7cd48693548"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/bundle.json","state_url":"https://pith.science/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-03T20:32:12Z","links":{"resolver":"https://pith.science/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY","bundle":"https://pith.science/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/bundle.json","state":"https://pith.science/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/state.json","well_known_bundle":"https://pith.science/.well-known/pith/5U4RO7WOTWEPZINNWPAJ6DQ5LY/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:5U4RO7WOTWEPZINNWPAJ6DQ5LY","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"7b85fbef4d6fe0b3b5827bb5297cb62cca87e2793c84a4f465e055d18e34b111","cross_cats_sorted":["cs.LG","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-11-12T09:44:50Z","title_canon_sha256":"797118ad1fc9163f26a26cd87e2fb33547df17e1ec22d27e66a201625ab5039b"},"schema_version":"1.0","source":{"id":"1811.04624","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1811.04624","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"arxiv_version","alias_value":"1811.04624v1","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1811.04624","created_at":"2026-05-18T00:01:04Z"},{"alias_kind":"pith_short_12","alias_value":"5U4RO7WOTWEP","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_16","alias_value":"5U4RO7WOTWEPZINN","created_at":"2026-05-18T12:32:08Z"},{"alias_kind":"pith_short_8","alias_value":"5U4RO7WO","created_at":"2026-05-18T12:32:08Z"}],"graph_snapshots":[{"event_id":"sha256:12338a6119bcd40e11c8febbab598e963566a6990616f31c9e7fe7cd48693548","target":"graph","created_at":"2026-05-18T00:01:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Evolution Strategies (ES) emerged as a scalable alternative to popular Reinforcement Learning (RL) techniques, providing an almost perfect speedup when distributed across hundreds of CPU cores thanks to a reduced communication overhead. Despite providing large improvements in wall-clock time, ES is data inefficient when compared to competing RL methods. One of the main causes of such inefficiency is the collection of large batches of experience, which are discarded after each policy update. In this work, we study how to perform more than one update per batch of experience by means of Importanc","authors_text":"Jordi Torres, V\\'ictor Campos, Xavier Giro-i-Nieto","cross_cats":["cs.LG","cs.NE"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-11-12T09:44:50Z","title":"Importance Weighted Evolution Strategies"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1811.04624","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:c5146434340f12dfae0b1c794626e58bd2718a18c24bb0e40ad0e812645b89c7","target":"record","created_at":"2026-05-18T00:01:04Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"7b85fbef4d6fe0b3b5827bb5297cb62cca87e2793c84a4f465e055d18e34b111","cross_cats_sorted":["cs.LG","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"stat.ML","submitted_at":"2018-11-12T09:44:50Z","title_canon_sha256":"797118ad1fc9163f26a26cd87e2fb33547df17e1ec22d27e66a201625ab5039b"},"schema_version":"1.0","source":{"id":"1811.04624","kind":"arxiv","version":1}},"canonical_sha256":"ed39177ece9d88fca1adb3c09f0e1d5e165591a9600eda433cdb6ee1e9dbf78d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"ed39177ece9d88fca1adb3c09f0e1d5e165591a9600eda433cdb6ee1e9dbf78d","first_computed_at":"2026-05-18T00:01:04.551397Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:04.551397Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"3jb4ww9eb2STJWdeH/Z1Kv4DCP0zhJjYBC+iM4BqJQe5YbuTKGnrlTHzQGfg0D71a53MZ8mw/lxirAj1Jz16AA==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:04.552002Z","signed_message":"canonical_sha256_bytes"},"source_id":"1811.04624","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:c5146434340f12dfae0b1c794626e58bd2718a18c24bb0e40ad0e812645b89c7","sha256:12338a6119bcd40e11c8febbab598e963566a6990616f31c9e7fe7cd48693548"],"state_sha256":"1b831559ddb6007a68b0de3e6d077fc9765007af9a6c886da3836abd37c93c34"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yLDaZpv3fitp0g9475x7/wZXeVsbs9DH9yEVM8qJNgO/xOZZMiZW5iu8Av1yD1XbVaqBRb8R0FihR0hkkkp0AQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-03T20:32:12.124175Z","bundle_sha256":"eb701d088b3c7c882059823ca8d0e485c41058d953d73f01cb73b180263fc9d4"}}