{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:TX2UO76WNS4Z75Q7NLCKH7W3EK","short_pith_number":"pith:TX2UO76W","canonical_record":{"source":{"id":"1709.05638","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-17T10:56:41Z","cross_cats_sorted":[],"title_canon_sha256":"124785db82bb83929c9306a024e9e027690c696f026d74883dcfef880a6e29b2","abstract_canon_sha256":"0074089eb690da15cdd62010c69c0d66f03288b80a7b5f4a2617f8368cfa7f0e"},"schema_version":"1.0"},"canonical_sha256":"9df5477fd66cb99ff61f6ac4a3fedb229e99da5e2c1bb29f651010cb99640249","source":{"kind":"arxiv","id":"1709.05638","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.05638","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"arxiv_version","alias_value":"1709.05638v2","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.05638","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"pith_short_12","alias_value":"TX2UO76WNS4Z","created_at":"2026-05-18T12:31:46Z"},{"alias_kind":"pith_short_16","alias_value":"TX2UO76WNS4Z75Q7","created_at":"2026-05-18T12:31:46Z"},{"alias_kind":"pith_short_8","alias_value":"TX2UO76W","created_at":"2026-05-18T12:31:46Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:TX2UO76WNS4Z75Q7NLCKH7W3EK","target":"record","payload":{"canonical_record":{"source":{"id":"1709.05638","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-17T10:56:41Z","cross_cats_sorted":[],"title_canon_sha256":"124785db82bb83929c9306a024e9e027690c696f026d74883dcfef880a6e29b2","abstract_canon_sha256":"0074089eb690da15cdd62010c69c0d66f03288b80a7b5f4a2617f8368cfa7f0e"},"schema_version":"1.0"},"canonical_sha256":"9df5477fd66cb99ff61f6ac4a3fedb229e99da5e2c1bb29f651010cb99640249","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:07:50.559983Z","signature_b64":"bUMiui34FNqyMNUHOtxEjrH2x+3bf73/qzC1jT2ZbhoPCt0i3hkvF46OLF4K6E1fht6HePOdm2Wt+fvHiJtwDg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"9df5477fd66cb99ff61f6ac4a3fedb229e99da5e2c1bb29f651010cb99640249","last_reissued_at":"2026-05-18T00:07:50.559307Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:07:50.559307Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1709.05638","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RJ1NgISowiRw2S8t/4UXLIfCgV5AoQ2QUUYS10Qv1pO1ia0Fdvxo7S71h7kCiJyaoI4UkcQglJbWJQ0uKszPDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T02:29:45.644738Z"},"content_sha256":"816eb1e1380ceaaa78349bff8320a0842ed646da9d4f2cdda38d180b9f272bc4","schema_version":"1.0","event_id":"sha256:816eb1e1380ceaaa78349bff8320a0842ed646da9d4f2cdda38d180b9f272bc4"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:TX2UO76WNS4Z75Q7NLCKH7W3EK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Improving Search through A3C Reinforcement Learning based Conversational Agent","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Aarushi Arora, Balaji Krishnamurthy, Milan Aggarwal, Shagun Sodhani","submitted_at":"2017-09-17T10:56:41Z","abstract_excerpt":"We develop a reinforcement learning based search assistant which can assist users through a set of actions and sequence of interactions to enable them realize their intent. Our approach caters to subjective search where the user is seeking digital assets such as images which is fundamentally different from the tasks which have objective and limited search modalities. Labeled conversational data is generally not available in such search tasks and training the agent through human interactions can be time consuming. We propose a stochastic virtual user which impersonates a real user and can be us"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.05638","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:07:50Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ozOMDRQFqGJ6MeXOFzz/Q1CC2uBWYQ6X+qWXPAF5kbmA2pm/+2XQvJebBAQIevP4RA9iCl1amKP078PteE9MAQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-08T02:29:45.645444Z"},"content_sha256":"2c0f2c0cbf55ac83fd2d59bfcc1e6a19a206c38f04c21ac7587275ca95764651","schema_version":"1.0","event_id":"sha256:2c0f2c0cbf55ac83fd2d59bfcc1e6a19a206c38f04c21ac7587275ca95764651"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/bundle.json","state_url":"https://pith.science/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-08T02:29:45Z","links":{"resolver":"https://pith.science/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK","bundle":"https://pith.science/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/bundle.json","state":"https://pith.science/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/TX2UO76WNS4Z75Q7NLCKH7W3EK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:TX2UO76WNS4Z75Q7NLCKH7W3EK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"0074089eb690da15cdd62010c69c0d66f03288b80a7b5f4a2617f8368cfa7f0e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-17T10:56:41Z","title_canon_sha256":"124785db82bb83929c9306a024e9e027690c696f026d74883dcfef880a6e29b2"},"schema_version":"1.0","source":{"id":"1709.05638","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1709.05638","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"arxiv_version","alias_value":"1709.05638v2","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1709.05638","created_at":"2026-05-18T00:07:50Z"},{"alias_kind":"pith_short_12","alias_value":"TX2UO76WNS4Z","created_at":"2026-05-18T12:31:46Z"},{"alias_kind":"pith_short_16","alias_value":"TX2UO76WNS4Z75Q7","created_at":"2026-05-18T12:31:46Z"},{"alias_kind":"pith_short_8","alias_value":"TX2UO76W","created_at":"2026-05-18T12:31:46Z"}],"graph_snapshots":[{"event_id":"sha256:2c0f2c0cbf55ac83fd2d59bfcc1e6a19a206c38f04c21ac7587275ca95764651","target":"graph","created_at":"2026-05-18T00:07:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"We develop a reinforcement learning based search assistant which can assist users through a set of actions and sequence of interactions to enable them realize their intent. Our approach caters to subjective search where the user is seeking digital assets such as images which is fundamentally different from the tasks which have objective and limited search modalities. Labeled conversational data is generally not available in such search tasks and training the agent through human interactions can be time consuming. We propose a stochastic virtual user which impersonates a real user and can be us","authors_text":"Aarushi Arora, Balaji Krishnamurthy, Milan Aggarwal, Shagun Sodhani","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-17T10:56:41Z","title":"Improving Search through A3C Reinforcement Learning based Conversational Agent"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1709.05638","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:816eb1e1380ceaaa78349bff8320a0842ed646da9d4f2cdda38d180b9f272bc4","target":"record","created_at":"2026-05-18T00:07:50Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"0074089eb690da15cdd62010c69c0d66f03288b80a7b5f4a2617f8368cfa7f0e","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2017-09-17T10:56:41Z","title_canon_sha256":"124785db82bb83929c9306a024e9e027690c696f026d74883dcfef880a6e29b2"},"schema_version":"1.0","source":{"id":"1709.05638","kind":"arxiv","version":2}},"canonical_sha256":"9df5477fd66cb99ff61f6ac4a3fedb229e99da5e2c1bb29f651010cb99640249","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"9df5477fd66cb99ff61f6ac4a3fedb229e99da5e2c1bb29f651010cb99640249","first_computed_at":"2026-05-18T00:07:50.559307Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:07:50.559307Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"bUMiui34FNqyMNUHOtxEjrH2x+3bf73/qzC1jT2ZbhoPCt0i3hkvF46OLF4K6E1fht6HePOdm2Wt+fvHiJtwDg==","signature_status":"signed_v1","signed_at":"2026-05-18T00:07:50.559983Z","signed_message":"canonical_sha256_bytes"},"source_id":"1709.05638","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:816eb1e1380ceaaa78349bff8320a0842ed646da9d4f2cdda38d180b9f272bc4","sha256:2c0f2c0cbf55ac83fd2d59bfcc1e6a19a206c38f04c21ac7587275ca95764651"],"state_sha256":"4e3a439343427ad426de88ef66c839e3d3c3349b5f76b5a8e89b978406bfd2f2"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"kfMuAfM4H0pXAdYpKRz3q+QECdXbI6ZWcNV41sz2Ir2RpSL/feY9+pFpH0BVWHevDGAyue4V8Zz8Gjurbcv9Cw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-08T02:29:45.649989Z","bundle_sha256":"4936024985c1b0ded8d61875d3821a5053ca5b7adc540b5d6925907d6c77cfe2"}}