{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2011:ZPJTRYDOGBTFXFSMQX5CDU36DO","short_pith_number":"pith:ZPJTRYDO","schema_version":"1.0","canonical_sha256":"cbd338e06e30665b964c85fa21d37e1ba97b4348e44834ac4c79d928c2706e9b","source":{"kind":"arxiv","id":"1106.0681","version":1},"attestation_state":"computed","paper":{"title":"Accelerating Reinforcement Learning through Implicit Imitation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"B. Price, C. Boutilier","submitted_at":"2011-06-03T14:57:02Z","abstract_excerpt":"Imitation can be viewed as a means of enhancing learning in multiagent environments.  It augments an agent's ability to learn useful behaviors by making intelligent use of the knowledge implicit in behaviors demonstrated by cooperative teachers or other more experienced agents.  We propose and study a formal model of implicit imitation that can accelerate reinforcement learning dramatically in certain cases.  Roughly, by observing a mentor, a reinforcement-learning agent can extract information about its own capabilities in, and the relative value of, unvisited parts of the state space.  We st"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1106.0681","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.LG","submitted_at":"2011-06-03T14:57:02Z","cross_cats_sorted":["cs.AI"],"title_canon_sha256":"914366787b3cda9540a929cccfcc45bca28fa39e4ead3cffd2e0d269b39af394","abstract_canon_sha256":"e48e87034bb4ef48007bc2a6ee99c68f48835376797bdae9ff46951ce881ea56"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T04:20:39.715970Z","signature_b64":"Kq/LVKm3grNPum3E5Oi4sAunMv9ravQYQVpbAZ++yl59cy6eQYvBA2g97SxDLKwjl0ALcbtkDDpcMB35gybZCQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"cbd338e06e30665b964c85fa21d37e1ba97b4348e44834ac4c79d928c2706e9b","last_reissued_at":"2026-05-18T04:20:39.715113Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T04:20:39.715113Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Accelerating Reinforcement Learning through Implicit Imitation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI"],"primary_cat":"cs.LG","authors_text":"B. Price, C. Boutilier","submitted_at":"2011-06-03T14:57:02Z","abstract_excerpt":"Imitation can be viewed as a means of enhancing learning in multiagent environments.  It augments an agent's ability to learn useful behaviors by making intelligent use of the knowledge implicit in behaviors demonstrated by cooperative teachers or other more experienced agents.  We propose and study a formal model of implicit imitation that can accelerate reinforcement learning dramatically in certain cases.  Roughly, by observing a mentor, a reinforcement-learning agent can extract information about its own capabilities in, and the relative value of, unvisited parts of the state space.  We st"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1106.0681","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1106.0681","created_at":"2026-05-18T04:20:39.715253+00:00"},{"alias_kind":"arxiv_version","alias_value":"1106.0681v1","created_at":"2026-05-18T04:20:39.715253+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1106.0681","created_at":"2026-05-18T04:20:39.715253+00:00"},{"alias_kind":"pith_short_12","alias_value":"ZPJTRYDOGBTF","created_at":"2026-05-18T12:26:50.516681+00:00"},{"alias_kind":"pith_short_16","alias_value":"ZPJTRYDOGBTFXFSM","created_at":"2026-05-18T12:26:50.516681+00:00"},{"alias_kind":"pith_short_8","alias_value":"ZPJTRYDO","created_at":"2026-05-18T12:26:50.516681+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO","json":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO.json","graph_json":"https://pith.science/api/pith-number/ZPJTRYDOGBTFXFSMQX5CDU36DO/graph.json","events_json":"https://pith.science/api/pith-number/ZPJTRYDOGBTFXFSMQX5CDU36DO/events.json","paper":"https://pith.science/paper/ZPJTRYDO"},"agent_actions":{"view_html":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO","download_json":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO.json","view_paper":"https://pith.science/paper/ZPJTRYDO","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1106.0681&json=true","fetch_graph":"https://pith.science/api/pith-number/ZPJTRYDOGBTFXFSMQX5CDU36DO/graph.json","fetch_events":"https://pith.science/api/pith-number/ZPJTRYDOGBTFXFSMQX5CDU36DO/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO/action/timestamp_anchor","attest_storage":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO/action/storage_attestation","attest_author":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO/action/author_attestation","sign_citation":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO/action/citation_signature","submit_replication":"https://pith.science/pith/ZPJTRYDOGBTFXFSMQX5CDU36DO/action/replication_record"}},"created_at":"2026-05-18T04:20:39.715253+00:00","updated_at":"2026-05-18T04:20:39.715253+00:00"}