{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2015:RLW6WDKTXUQPG5CP5OQ7BVCFTK","short_pith_number":"pith:RLW6WDKT","canonical_record":{"source":{"id":"1505.00284","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2015-05-01T21:13:00Z","cross_cats_sorted":[],"title_canon_sha256":"8300b509bd3c39462e85e8c3d1ec49bc78035757398358298d69c697bc85a28c","abstract_canon_sha256":"ff3af234fb5b0cb6d5bf6bbdbefc4c9ce46e846fe21342c649aa0f681805df83"},"schema_version":"1.0"},"canonical_sha256":"8aedeb0d53bd20f3744feba1f0d4459abfa767bc7a89c6cdf0088aa1d46013f8","source":{"kind":"arxiv","id":"1505.00284","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.00284","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"arxiv_version","alias_value":"1505.00284v2","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.00284","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"pith_short_12","alias_value":"RLW6WDKTXUQP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"RLW6WDKTXUQPG5CP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"RLW6WDKT","created_at":"2026-05-18T12:29:39Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2015:RLW6WDKTXUQPG5CP5OQ7BVCFTK","target":"record","payload":{"canonical_record":{"source":{"id":"1505.00284","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2015-05-01T21:13:00Z","cross_cats_sorted":[],"title_canon_sha256":"8300b509bd3c39462e85e8c3d1ec49bc78035757398358298d69c697bc85a28c","abstract_canon_sha256":"ff3af234fb5b0cb6d5bf6bbdbefc4c9ce46e846fe21342c649aa0f681805df83"},"schema_version":"1.0"},"canonical_sha256":"8aedeb0d53bd20f3744feba1f0d4459abfa767bc7a89c6cdf0088aa1d46013f8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T01:24:24.937735Z","signature_b64":"UGFeosI8TBuinoeLtNyV4VLs7JQ8moTzijRkslyZ9f/tL2staruQkObOusPA46gHInalSRbUfyeW73VgpCvfAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"8aedeb0d53bd20f3744feba1f0d4459abfa767bc7a89c6cdf0088aa1d46013f8","last_reissued_at":"2026-05-18T01:24:24.937091Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T01:24:24.937091Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1505.00284","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:24:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"eeMbvzVtvT6EUNE29xEu6ojsyOJqD5vb6FiB1PcsF7teewjVJ2NeRxSCpR8du79Ew4sAVVCV2rgz0POtKV/sCA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:30:15.195251Z"},"content_sha256":"833b801fbdfd5883f2f832e968aebda46e25999173eaaca8a8177f0b90cb3605","schema_version":"1.0","event_id":"sha256:833b801fbdfd5883f2f832e968aebda46e25999173eaaca8a8177f0b90cb3605"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2015:RLW6WDKTXUQPG5CP5OQ7BVCFTK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Bayesian Policy Reuse","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.AI","authors_text":"Benjamin Rosman, Majd Hawasly, Subramanian Ramamoorthy","submitted_at":"2015-05-01T21:13:00Z","abstract_excerpt":"A long-lived autonomous agent should be able to respond online to novel instances of tasks from a familiar domain. Acting online requires 'fast' responses, in terms of rapid convergence, especially when the task instance has a short duration, such as in applications involving interactions with humans. These requirements can be problematic for many established methods for learning to act. In domains where the agent knows that the task instance is drawn from a family of related tasks, albeit without access to the label of any given instance, it can choose to act through a process of policy reuse"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.00284","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T01:24:24Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ETO3leGpRIafnUoAndYEGbnkSdfT1Vu2rICsBh27n1ikRiHDQHL5ak82TrUENHL6qXy3XVGQHDPZER/v+8M4DA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-25T20:30:15.195897Z"},"content_sha256":"7d748e3414525244b8463a7caceafd615b71ad912e19d9e18e675b35ac4ab528","schema_version":"1.0","event_id":"sha256:7d748e3414525244b8463a7caceafd615b71ad912e19d9e18e675b35ac4ab528"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/bundle.json","state_url":"https://pith.science/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-25T20:30:15Z","links":{"resolver":"https://pith.science/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK","bundle":"https://pith.science/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/bundle.json","state":"https://pith.science/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/RLW6WDKTXUQPG5CP5OQ7BVCFTK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2015:RLW6WDKTXUQPG5CP5OQ7BVCFTK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ff3af234fb5b0cb6d5bf6bbdbefc4c9ce46e846fe21342c649aa0f681805df83","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2015-05-01T21:13:00Z","title_canon_sha256":"8300b509bd3c39462e85e8c3d1ec49bc78035757398358298d69c697bc85a28c"},"schema_version":"1.0","source":{"id":"1505.00284","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1505.00284","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"arxiv_version","alias_value":"1505.00284v2","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1505.00284","created_at":"2026-05-18T01:24:24Z"},{"alias_kind":"pith_short_12","alias_value":"RLW6WDKTXUQP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_16","alias_value":"RLW6WDKTXUQPG5CP","created_at":"2026-05-18T12:29:39Z"},{"alias_kind":"pith_short_8","alias_value":"RLW6WDKT","created_at":"2026-05-18T12:29:39Z"}],"graph_snapshots":[{"event_id":"sha256:7d748e3414525244b8463a7caceafd615b71ad912e19d9e18e675b35ac4ab528","target":"graph","created_at":"2026-05-18T01:24:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"A long-lived autonomous agent should be able to respond online to novel instances of tasks from a familiar domain. Acting online requires 'fast' responses, in terms of rapid convergence, especially when the task instance has a short duration, such as in applications involving interactions with humans. These requirements can be problematic for many established methods for learning to act. In domains where the agent knows that the task instance is drawn from a family of related tasks, albeit without access to the label of any given instance, it can choose to act through a process of policy reuse","authors_text":"Benjamin Rosman, Majd Hawasly, Subramanian Ramamoorthy","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2015-05-01T21:13:00Z","title":"Bayesian Policy Reuse"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1505.00284","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:833b801fbdfd5883f2f832e968aebda46e25999173eaaca8a8177f0b90cb3605","target":"record","created_at":"2026-05-18T01:24:24Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ff3af234fb5b0cb6d5bf6bbdbefc4c9ce46e846fe21342c649aa0f681805df83","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.AI","submitted_at":"2015-05-01T21:13:00Z","title_canon_sha256":"8300b509bd3c39462e85e8c3d1ec49bc78035757398358298d69c697bc85a28c"},"schema_version":"1.0","source":{"id":"1505.00284","kind":"arxiv","version":2}},"canonical_sha256":"8aedeb0d53bd20f3744feba1f0d4459abfa767bc7a89c6cdf0088aa1d46013f8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8aedeb0d53bd20f3744feba1f0d4459abfa767bc7a89c6cdf0088aa1d46013f8","first_computed_at":"2026-05-18T01:24:24.937091Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T01:24:24.937091Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"UGFeosI8TBuinoeLtNyV4VLs7JQ8moTzijRkslyZ9f/tL2staruQkObOusPA46gHInalSRbUfyeW73VgpCvfAQ==","signature_status":"signed_v1","signed_at":"2026-05-18T01:24:24.937735Z","signed_message":"canonical_sha256_bytes"},"source_id":"1505.00284","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:833b801fbdfd5883f2f832e968aebda46e25999173eaaca8a8177f0b90cb3605","sha256:7d748e3414525244b8463a7caceafd615b71ad912e19d9e18e675b35ac4ab528"],"state_sha256":"c81fea693ff1dd2d09cb506e6fa8de6c119b71c2493835590bec134f5e4b15f8"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"yV7RPk+204I6hJ58QaMB38gWA7dHwAsooi6CGJ/Ti998WhncChiBzVPTrMm0t5yXg3+hTj9f0ZjdSFF6VVVlDw==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-25T20:30:15.199296Z","bundle_sha256":"b46e8821579bf21ff13a4d5be83f34b2e5d7ba8143fabd9366fbbba29c7e3e44"}}