{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:ST3GONLEYLNIJBDU52WCSUCS66","short_pith_number":"pith:ST3GONLE","canonical_record":{"source":{"id":"1802.05098","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T14:05:54Z","cross_cats_sorted":["cs.AI","cs.NE"],"title_canon_sha256":"eaff8be5d2834a124df15236f87c6afc083e816cda56518464a37843ed7bee49","abstract_canon_sha256":"e7e455a62d86dad82a2e611726e71cee3027f87a7c00d35c8568a0c2d1357095"},"schema_version":"1.0"},"canonical_sha256":"94f6673564c2da848474eeac295052f7b53c86eec25ab254c37e02a381328838","source":{"kind":"arxiv","id":"1802.05098","version":3},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.05098","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"arxiv_version","alias_value":"1802.05098v3","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.05098","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"pith_short_12","alias_value":"ST3GONLEYLNI","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"ST3GONLEYLNIJBDU","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"ST3GONLE","created_at":"2026-05-18T12:32:53Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:ST3GONLEYLNIJBDU52WCSUCS66","target":"record","payload":{"canonical_record":{"source":{"id":"1802.05098","kind":"arxiv","version":3},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T14:05:54Z","cross_cats_sorted":["cs.AI","cs.NE"],"title_canon_sha256":"eaff8be5d2834a124df15236f87c6afc083e816cda56518464a37843ed7bee49","abstract_canon_sha256":"e7e455a62d86dad82a2e611726e71cee3027f87a7c00d35c8568a0c2d1357095"},"schema_version":"1.0"},"canonical_sha256":"94f6673564c2da848474eeac295052f7b53c86eec25ab254c37e02a381328838","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:30.118156Z","signature_b64":"AIZYI7hZoEVY+IIYNUupXxbAA0gHiNyxxkWG2nnipQuqbiFdmK5q2EETvnI+SXdTT2944fDw1x4SYXwODrLQBQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"94f6673564c2da848474eeac295052f7b53c86eec25ab254c37e02a381328838","last_reissued_at":"2026-05-18T00:01:30.117570Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:30.117570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1802.05098","source_version":3,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"NCKHU4R6WXBLHHX8WG/sCUSymkir5OeJsRdN/Y7yEHuF6RFbB5DNjEovJA2aybM+l33/MHibXZshBnlMb0eZAA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T19:12:26.222486Z"},"content_sha256":"7bd4be56527526cd16f2010b3a68dad76cd0cfd74b92e57376b637dbdf36b6b9","schema_version":"1.0","event_id":"sha256:7bd4be56527526cd16f2010b3a68dad76cd0cfd74b92e57376b637dbdf36b6b9"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:ST3GONLEYLNIJBDU52WCSUCS66","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"DiCE: The Infinitely Differentiable Monte-Carlo Estimator","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.NE"],"primary_cat":"cs.LG","authors_text":"Eric P. Xing, Gregory Farquhar, Jakob Foerster, Maruan Al-Shedivat, Shimon Whiteson, Tim Rockt\\\"aschel","submitted_at":"2018-02-14T14:05:54Z","abstract_excerpt":"The score function estimator is widely used for estimating gradients of stochastic objectives in stochastic computation graphs (SCG), eg, in reinforcement learning and meta-learning. While deriving the first-order gradient estimators by differentiating a surrogate loss (SL) objective is computationally and conceptually simple, using the same approach for higher-order derivatives is more challenging. Firstly, analytically deriving and implementing such estimators is laborious and not compliant with automatic differentiation. Secondly, repeatedly applying SL to construct new objectives for each "},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.05098","kind":"arxiv","version":3},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:30Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"/VRa2lGuD/zaBjEWLS7hexc0FCWAjwYcXgtzcbIor9/WpBDdIwWam4LByhvije4O5blfQ4PSru5nykX/3E4ACA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T19:12:26.223169Z"},"content_sha256":"c57a447ae2a02509674c4027c30bc80426f88cf7293624428acec2c000b0346e","schema_version":"1.0","event_id":"sha256:c57a447ae2a02509674c4027c30bc80426f88cf7293624428acec2c000b0346e"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ST3GONLEYLNIJBDU52WCSUCS66/bundle.json","state_url":"https://pith.science/pith/ST3GONLEYLNIJBDU52WCSUCS66/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ST3GONLEYLNIJBDU52WCSUCS66/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T19:12:26Z","links":{"resolver":"https://pith.science/pith/ST3GONLEYLNIJBDU52WCSUCS66","bundle":"https://pith.science/pith/ST3GONLEYLNIJBDU52WCSUCS66/bundle.json","state":"https://pith.science/pith/ST3GONLEYLNIJBDU52WCSUCS66/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ST3GONLEYLNIJBDU52WCSUCS66/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ST3GONLEYLNIJBDU52WCSUCS66","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e7e455a62d86dad82a2e611726e71cee3027f87a7c00d35c8568a0c2d1357095","cross_cats_sorted":["cs.AI","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T14:05:54Z","title_canon_sha256":"eaff8be5d2834a124df15236f87c6afc083e816cda56518464a37843ed7bee49"},"schema_version":"1.0","source":{"id":"1802.05098","kind":"arxiv","version":3}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1802.05098","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"arxiv_version","alias_value":"1802.05098v3","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1802.05098","created_at":"2026-05-18T00:01:30Z"},{"alias_kind":"pith_short_12","alias_value":"ST3GONLEYLNI","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_16","alias_value":"ST3GONLEYLNIJBDU","created_at":"2026-05-18T12:32:53Z"},{"alias_kind":"pith_short_8","alias_value":"ST3GONLE","created_at":"2026-05-18T12:32:53Z"}],"graph_snapshots":[{"event_id":"sha256:c57a447ae2a02509674c4027c30bc80426f88cf7293624428acec2c000b0346e","target":"graph","created_at":"2026-05-18T00:01:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"The score function estimator is widely used for estimating gradients of stochastic objectives in stochastic computation graphs (SCG), eg, in reinforcement learning and meta-learning. While deriving the first-order gradient estimators by differentiating a surrogate loss (SL) objective is computationally and conceptually simple, using the same approach for higher-order derivatives is more challenging. Firstly, analytically deriving and implementing such estimators is laborious and not compliant with automatic differentiation. Secondly, repeatedly applying SL to construct new objectives for each ","authors_text":"Eric P. Xing, Gregory Farquhar, Jakob Foerster, Maruan Al-Shedivat, Shimon Whiteson, Tim Rockt\\\"aschel","cross_cats":["cs.AI","cs.NE"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T14:05:54Z","title":"DiCE: The Infinitely Differentiable Monte-Carlo Estimator"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1802.05098","kind":"arxiv","version":3},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7bd4be56527526cd16f2010b3a68dad76cd0cfd74b92e57376b637dbdf36b6b9","target":"record","created_at":"2026-05-18T00:01:30Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e7e455a62d86dad82a2e611726e71cee3027f87a7c00d35c8568a0c2d1357095","cross_cats_sorted":["cs.AI","cs.NE"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-02-14T14:05:54Z","title_canon_sha256":"eaff8be5d2834a124df15236f87c6afc083e816cda56518464a37843ed7bee49"},"schema_version":"1.0","source":{"id":"1802.05098","kind":"arxiv","version":3}},"canonical_sha256":"94f6673564c2da848474eeac295052f7b53c86eec25ab254c37e02a381328838","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"94f6673564c2da848474eeac295052f7b53c86eec25ab254c37e02a381328838","first_computed_at":"2026-05-18T00:01:30.117570Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:30.117570Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"AIZYI7hZoEVY+IIYNUupXxbAA0gHiNyxxkWG2nnipQuqbiFdmK5q2EETvnI+SXdTT2944fDw1x4SYXwODrLQBQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:30.118156Z","signed_message":"canonical_sha256_bytes"},"source_id":"1802.05098","source_kind":"arxiv","source_version":3}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7bd4be56527526cd16f2010b3a68dad76cd0cfd74b92e57376b637dbdf36b6b9","sha256:c57a447ae2a02509674c4027c30bc80426f88cf7293624428acec2c000b0346e"],"state_sha256":"a6a7fac301648267a5c38ae6366232b574ccf983a68586611f4e3e8f566c64c6"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"zdrzjMtaxc/Y0hs+rDY3CDPpxFsx/TQu2eP67Knp1f7nNS4A+n5H9ipKus8zumpb/6C8eDeHqjS/E0/LZvSyAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T19:12:26.226696Z","bundle_sha256":"528148b2c76b48b5ec8300ba530f6dd174f2d42197f1e5aaa30ba02262984c02"}}