{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:YDZLJE52OPNUUHWISG7RYMBQH6","short_pith_number":"pith:YDZLJE52","canonical_record":{"source":{"id":"1805.09360","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-23T18:06:10Z","cross_cats_sorted":["cs.SI","stat.ML"],"title_canon_sha256":"40b8a87c61ca2f1da6e708701e2f0a20af7fd8c9fa4e3ed4868a7d10381b3ff5","abstract_canon_sha256":"80ceffb0444fb15f997612b95c3fa56f03f9f9f5fe92b7b20dcc6100fdc3a614"},"schema_version":"1.0"},"canonical_sha256":"c0f2b493ba73db4a1ec891bf1c30303fb36a9ede599d67736b72e291e6dc2d2a","source":{"kind":"arxiv","id":"1805.09360","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.09360","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"arxiv_version","alias_value":"1805.09360v2","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.09360","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"pith_short_12","alias_value":"YDZLJE52OPNU","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_16","alias_value":"YDZLJE52OPNUUHWI","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_8","alias_value":"YDZLJE52","created_at":"2026-05-18T12:33:04Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:YDZLJE52OPNUUHWISG7RYMBQH6","target":"record","payload":{"canonical_record":{"source":{"id":"1805.09360","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-23T18:06:10Z","cross_cats_sorted":["cs.SI","stat.ML"],"title_canon_sha256":"40b8a87c61ca2f1da6e708701e2f0a20af7fd8c9fa4e3ed4868a7d10381b3ff5","abstract_canon_sha256":"80ceffb0444fb15f997612b95c3fa56f03f9f9f5fe92b7b20dcc6100fdc3a614"},"schema_version":"1.0"},"canonical_sha256":"c0f2b493ba73db4a1ec891bf1c30303fb36a9ede599d67736b72e291e6dc2d2a","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:01:29.520292Z","signature_b64":"n05iWHj1XDOL0/o2kCCD6qqP5GGTmQCkfjs1L1GjbeK5Up4RIzhGI7Er1Oh5k0NDe2jyUYiiaknOoJ+y7IF4BQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c0f2b493ba73db4a1ec891bf1c30303fb36a9ede599d67736b72e291e6dc2d2a","last_reissued_at":"2026-05-18T00:01:29.519846Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:01:29.519846Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1805.09360","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ItYOXMzM0TzJqJBbLCjxCG/NuE/4gqa5LjFRd2OWyndOc0q0UucXK8+6ukDHxRZxgxufQ5Oxt5Er/w3tFTpnDQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T12:26:30.088804Z"},"content_sha256":"d1e0a72ce4ea77d7db7c088759b84f73e0b68a3c5cb9c218ea7965bcf483ded0","schema_version":"1.0","event_id":"sha256:d1e0a72ce4ea77d7db7c088759b84f73e0b68a3c5cb9c218ea7965bcf483ded0"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:YDZLJE52OPNUUHWISG7RYMBQH6","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Deep Reinforcement Learning of Marked Temporal Point Processes","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.SI","stat.ML"],"primary_cat":"cs.LG","authors_text":"Abir De, Manuel Gomez-Rodriguez, Utkarsh Upadhyay","submitted_at":"2018-05-23T18:06:10Z","abstract_excerpt":"In a wide variety of applications, humans interact with a complex environment by means of asynchronous stochastic discrete events in continuous time. Can we design online interventions that will help humans achieve certain goals in such asynchronous setting? In this paper, we address the above problem from the perspective of deep reinforcement learning of marked temporal point processes, where both the actions taken by an agent and the feedback it receives from the environment are asynchronous stochastic discrete events characterized using marked temporal point processes. In doing so, we defin"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.09360","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:01:29Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3SYpkAaZnrXxz23HWKFcGdJYPZQF44BNCGVbQmLuu+8RARYvIQjkBGTIaqfNId9/klAEXzbDlY0wfoginG5ADw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-27T12:26:30.089165Z"},"content_sha256":"d0fedab831f55fd7ffd76085f6c965204fe8d9341e5644cbd5fc909c9c29bc89","schema_version":"1.0","event_id":"sha256:d0fedab831f55fd7ffd76085f6c965204fe8d9341e5644cbd5fc909c9c29bc89"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/YDZLJE52OPNUUHWISG7RYMBQH6/bundle.json","state_url":"https://pith.science/pith/YDZLJE52OPNUUHWISG7RYMBQH6/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/YDZLJE52OPNUUHWISG7RYMBQH6/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-27T12:26:30Z","links":{"resolver":"https://pith.science/pith/YDZLJE52OPNUUHWISG7RYMBQH6","bundle":"https://pith.science/pith/YDZLJE52OPNUUHWISG7RYMBQH6/bundle.json","state":"https://pith.science/pith/YDZLJE52OPNUUHWISG7RYMBQH6/state.json","well_known_bundle":"https://pith.science/.well-known/pith/YDZLJE52OPNUUHWISG7RYMBQH6/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:YDZLJE52OPNUUHWISG7RYMBQH6","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"80ceffb0444fb15f997612b95c3fa56f03f9f9f5fe92b7b20dcc6100fdc3a614","cross_cats_sorted":["cs.SI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-23T18:06:10Z","title_canon_sha256":"40b8a87c61ca2f1da6e708701e2f0a20af7fd8c9fa4e3ed4868a7d10381b3ff5"},"schema_version":"1.0","source":{"id":"1805.09360","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1805.09360","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"arxiv_version","alias_value":"1805.09360v2","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1805.09360","created_at":"2026-05-18T00:01:29Z"},{"alias_kind":"pith_short_12","alias_value":"YDZLJE52OPNU","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_16","alias_value":"YDZLJE52OPNUUHWI","created_at":"2026-05-18T12:33:04Z"},{"alias_kind":"pith_short_8","alias_value":"YDZLJE52","created_at":"2026-05-18T12:33:04Z"}],"graph_snapshots":[{"event_id":"sha256:d0fedab831f55fd7ffd76085f6c965204fe8d9341e5644cbd5fc909c9c29bc89","target":"graph","created_at":"2026-05-18T00:01:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"In a wide variety of applications, humans interact with a complex environment by means of asynchronous stochastic discrete events in continuous time. Can we design online interventions that will help humans achieve certain goals in such asynchronous setting? In this paper, we address the above problem from the perspective of deep reinforcement learning of marked temporal point processes, where both the actions taken by an agent and the feedback it receives from the environment are asynchronous stochastic discrete events characterized using marked temporal point processes. In doing so, we defin","authors_text":"Abir De, Manuel Gomez-Rodriguez, Utkarsh Upadhyay","cross_cats":["cs.SI","stat.ML"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-23T18:06:10Z","title":"Deep Reinforcement Learning of Marked Temporal Point Processes"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1805.09360","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:d1e0a72ce4ea77d7db7c088759b84f73e0b68a3c5cb9c218ea7965bcf483ded0","target":"record","created_at":"2026-05-18T00:01:29Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"80ceffb0444fb15f997612b95c3fa56f03f9f9f5fe92b7b20dcc6100fdc3a614","cross_cats_sorted":["cs.SI","stat.ML"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2018-05-23T18:06:10Z","title_canon_sha256":"40b8a87c61ca2f1da6e708701e2f0a20af7fd8c9fa4e3ed4868a7d10381b3ff5"},"schema_version":"1.0","source":{"id":"1805.09360","kind":"arxiv","version":2}},"canonical_sha256":"c0f2b493ba73db4a1ec891bf1c30303fb36a9ede599d67736b72e291e6dc2d2a","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c0f2b493ba73db4a1ec891bf1c30303fb36a9ede599d67736b72e291e6dc2d2a","first_computed_at":"2026-05-18T00:01:29.519846Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:01:29.519846Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"n05iWHj1XDOL0/o2kCCD6qqP5GGTmQCkfjs1L1GjbeK5Up4RIzhGI7Er1Oh5k0NDe2jyUYiiaknOoJ+y7IF4BQ==","signature_status":"signed_v1","signed_at":"2026-05-18T00:01:29.520292Z","signed_message":"canonical_sha256_bytes"},"source_id":"1805.09360","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:d1e0a72ce4ea77d7db7c088759b84f73e0b68a3c5cb9c218ea7965bcf483ded0","sha256:d0fedab831f55fd7ffd76085f6c965204fe8d9341e5644cbd5fc909c9c29bc89"],"state_sha256":"6dcbda3425673df21fd23705b42cbfd8210df27c1c1b3d467107057004b3d332"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"FkiHvix83/Dfv0UsqLuGgXpAvwVhSPpalr92DpWpJX3lYX34EH0xHZO6rmi1VRZ0/Ifl5i4ozD3z3GyMFL3DAw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-27T12:26:30.091665Z","bundle_sha256":"097c43b57977375886a2d2f962d4b079bff2564cfb7e74f0a4358a039a0619c8"}}