{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:ODXWLQUGPOGNC3ACYAHSXJRHOF","short_pith_number":"pith:ODXWLQUG","canonical_record":{"source":{"id":"1803.05752","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-03-15T14:00:24Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"8ecc28d22cc83b1edde69a42c930dfe82543c2187abfad27fd06d4bd59529ecb","abstract_canon_sha256":"5c7257a8b431c9593c91bd82dab08009a8f3441ac3b8a472d9aa799ee95a6dcc"},"schema_version":"1.0"},"canonical_sha256":"70ef65c2867b8cd16c02c00f2ba627716034055ff543f2c65ca3efa6fdab809b","source":{"kind":"arxiv","id":"1803.05752","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.05752","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"arxiv_version","alias_value":"1803.05752v1","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.05752","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"pith_short_12","alias_value":"ODXWLQUGPOGN","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"ODXWLQUGPOGNC3AC","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"ODXWLQUG","created_at":"2026-05-18T12:32:43Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:ODXWLQUGPOGNC3ACYAHSXJRHOF","target":"record","payload":{"canonical_record":{"source":{"id":"1803.05752","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-03-15T14:00:24Z","cross_cats_sorted":["cs.AI","cs.LG"],"title_canon_sha256":"8ecc28d22cc83b1edde69a42c930dfe82543c2187abfad27fd06d4bd59529ecb","abstract_canon_sha256":"5c7257a8b431c9593c91bd82dab08009a8f3441ac3b8a472d9aa799ee95a6dcc"},"schema_version":"1.0"},"canonical_sha256":"70ef65c2867b8cd16c02c00f2ba627716034055ff543f2c65ca3efa6fdab809b","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:05:19.429756Z","signature_b64":"wCfKS/Ldv/3OeXBHmky/kqHYh9b5pHL1XMLSVYnQBWrRgSdDvmClta0td3oeNFt6tkm8dsGHhDDm+kdJLR/0Dw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"70ef65c2867b8cd16c02c00f2ba627716034055ff543f2c65ca3efa6fdab809b","last_reissued_at":"2026-05-18T00:05:19.429188Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:05:19.429188Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1803.05752","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3Bbj6bD/sYLBr2tNsWCXT/foyQAogc9/ACTAtTPnCSHO4+npLmnvmYPHKzmZVRB7w+YIABhv8pVwQtDa66y3DQ==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T04:09:48.963888Z"},"content_sha256":"83197fa9bb6db3bf4c683a846c438d8ddd2ba9e118ed635ca22fc94777a46407","schema_version":"1.0","event_id":"sha256:83197fa9bb6db3bf4c683a846c438d8ddd2ba9e118ed635ca22fc94777a46407"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:ODXWLQUGPOGNC3ACYAHSXJRHOF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Rearrangement with Nonprehensile Manipulation Using Deep Reinforcement Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":["cs.AI","cs.LG"],"primary_cat":"cs.RO","authors_text":"Danica Kragic, Johannes A. Stork, Kaiyu Hang, Michael Y. Wang, Weihao Yuan","submitted_at":"2018-03-15T14:00:24Z","abstract_excerpt":"Rearranging objects on a tabletop surface by means of nonprehensile manipulation is a task which requires skillful interaction with the physical world. Usually, this is achieved by precisely modeling physical properties of the objects, robot, and the environment for explicit planning. In contrast, as explicitly modeling the physical environment is not always feasible and involves various uncertainties, we learn a nonprehensile rearrangement strategy with deep reinforcement learning based on only visual feedback. For this, we model the task with rewards and train a deep Q-network. Our potential"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.05752","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:05:19Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"gbaEerC0AEouJAv0NEJudX6OSdQD5BNrXZoX0G1O/j8ptnPBY10vXOPTvpU7Hm6H/Vzln/Kf/230AxIpGBNaAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-09T04:09:48.964653Z"},"content_sha256":"26abf94342c54567ff54668f6874714ae6a7d54a0809868e11252baa636f6189","schema_version":"1.0","event_id":"sha256:26abf94342c54567ff54668f6874714ae6a7d54a0809868e11252baa636f6189"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/bundle.json","state_url":"https://pith.science/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-09T04:09:48Z","links":{"resolver":"https://pith.science/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF","bundle":"https://pith.science/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/bundle.json","state":"https://pith.science/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/ODXWLQUGPOGNC3ACYAHSXJRHOF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:ODXWLQUGPOGNC3ACYAHSXJRHOF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"5c7257a8b431c9593c91bd82dab08009a8f3441ac3b8a472d9aa799ee95a6dcc","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-03-15T14:00:24Z","title_canon_sha256":"8ecc28d22cc83b1edde69a42c930dfe82543c2187abfad27fd06d4bd59529ecb"},"schema_version":"1.0","source":{"id":"1803.05752","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1803.05752","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"arxiv_version","alias_value":"1803.05752v1","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1803.05752","created_at":"2026-05-18T00:05:19Z"},{"alias_kind":"pith_short_12","alias_value":"ODXWLQUGPOGN","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_16","alias_value":"ODXWLQUGPOGNC3AC","created_at":"2026-05-18T12:32:43Z"},{"alias_kind":"pith_short_8","alias_value":"ODXWLQUG","created_at":"2026-05-18T12:32:43Z"}],"graph_snapshots":[{"event_id":"sha256:26abf94342c54567ff54668f6874714ae6a7d54a0809868e11252baa636f6189","target":"graph","created_at":"2026-05-18T00:05:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Rearranging objects on a tabletop surface by means of nonprehensile manipulation is a task which requires skillful interaction with the physical world. Usually, this is achieved by precisely modeling physical properties of the objects, robot, and the environment for explicit planning. In contrast, as explicitly modeling the physical environment is not always feasible and involves various uncertainties, we learn a nonprehensile rearrangement strategy with deep reinforcement learning based on only visual feedback. For this, we model the task with rewards and train a deep Q-network. Our potential","authors_text":"Danica Kragic, Johannes A. Stork, Kaiyu Hang, Michael Y. Wang, Weihao Yuan","cross_cats":["cs.AI","cs.LG"],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-03-15T14:00:24Z","title":"Rearrangement with Nonprehensile Manipulation Using Deep Reinforcement Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1803.05752","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:83197fa9bb6db3bf4c683a846c438d8ddd2ba9e118ed635ca22fc94777a46407","target":"record","created_at":"2026-05-18T00:05:19Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"5c7257a8b431c9593c91bd82dab08009a8f3441ac3b8a472d9aa799ee95a6dcc","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.RO","submitted_at":"2018-03-15T14:00:24Z","title_canon_sha256":"8ecc28d22cc83b1edde69a42c930dfe82543c2187abfad27fd06d4bd59529ecb"},"schema_version":"1.0","source":{"id":"1803.05752","kind":"arxiv","version":1}},"canonical_sha256":"70ef65c2867b8cd16c02c00f2ba627716034055ff543f2c65ca3efa6fdab809b","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"70ef65c2867b8cd16c02c00f2ba627716034055ff543f2c65ca3efa6fdab809b","first_computed_at":"2026-05-18T00:05:19.429188Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:05:19.429188Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"wCfKS/Ldv/3OeXBHmky/kqHYh9b5pHL1XMLSVYnQBWrRgSdDvmClta0td3oeNFt6tkm8dsGHhDDm+kdJLR/0Dw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:05:19.429756Z","signed_message":"canonical_sha256_bytes"},"source_id":"1803.05752","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:83197fa9bb6db3bf4c683a846c438d8ddd2ba9e118ed635ca22fc94777a46407","sha256:26abf94342c54567ff54668f6874714ae6a7d54a0809868e11252baa636f6189"],"state_sha256":"525d8be6b68714813c2264cff8bca33b5d592d58877745fc8cd2452d0b90fae5"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"76HdQe932ifXQblQ6LCTFvjcI3hXnZL6Py8RkiR+WOusDrOYZ+PsNDk/HVwoq8MODRAX5E4NNXzMVQoq4SzOCQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-09T04:09:48.968890Z","bundle_sha256":"8d6755225d47c611bad2126b9bdd4f0fc111394628e6abf3611e5cb269634bad"}}