{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2018:DJSLKS4HZYD6QD42VT5CBVBW4A","short_pith_number":"pith:DJSLKS4H","canonical_record":{"source":{"id":"1812.02619","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-12-06T15:48:54Z","cross_cats_sorted":[],"title_canon_sha256":"0e7c123ab12ae0cc3c7adef5456a559cd90a8b8c126ee6419ed131d572d603c0","abstract_canon_sha256":"adc60e64b027e27284e827a9add5749c7632c921d1e5000b96c70e090df86015"},"schema_version":"1.0"},"canonical_sha256":"1a64b54b87ce07e80f9aacfa20d436e01b146db147d4121c09cb625e9f5a51a1","source":{"kind":"arxiv","id":"1812.02619","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.02619","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"arxiv_version","alias_value":"1812.02619v1","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.02619","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"pith_short_12","alias_value":"DJSLKS4HZYD6","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"DJSLKS4HZYD6QD42","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"DJSLKS4H","created_at":"2026-05-18T12:32:19Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2018:DJSLKS4HZYD6QD42VT5CBVBW4A","target":"record","payload":{"canonical_record":{"source":{"id":"1812.02619","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-12-06T15:48:54Z","cross_cats_sorted":[],"title_canon_sha256":"0e7c123ab12ae0cc3c7adef5456a559cd90a8b8c126ee6419ed131d572d603c0","abstract_canon_sha256":"adc60e64b027e27284e827a9add5749c7632c921d1e5000b96c70e090df86015"},"schema_version":"1.0"},"canonical_sha256":"1a64b54b87ce07e80f9aacfa20d436e01b146db147d4121c09cb625e9f5a51a1","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:58:55.299254Z","signature_b64":"dwMvSWQfXiNRSbDC8ms6a0CwMiNQFNiuhd9Ji03jJhGflDuOQqs0ojzJsure3lhpDzgICmIyxVNNC3/mu2p+Bg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1a64b54b87ce07e80f9aacfa20d436e01b146db147d4121c09cb625e9f5a51a1","last_reissued_at":"2026-05-17T23:58:55.298788Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:58:55.298788Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1812.02619","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"ouaVIvpSMVqUGaIlQQjEtRIxhNniEnWtso5KhZzmE0skYa+DLljlpMd7JuUtppsEMgjAv3RhZRWHtKkP7XxyDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T23:36:33.431864Z"},"content_sha256":"18594a4182e1c5cc917bb990b4006969ac5102221016ebfd5cb864e1cb9967ec","schema_version":"1.0","event_id":"sha256:18594a4182e1c5cc917bb990b4006969ac5102221016ebfd5cb864e1cb9967ec"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2018:DJSLKS4HZYD6QD42VT5CBVBW4A","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Tube-CNN: Modeling temporal evolution of appearance for object detection in video","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Anton Osokin, Ivan Laptev, Tuan-Hung Vu","submitted_at":"2018-12-06T15:48:54Z","abstract_excerpt":"Object detection in video is crucial for many applications. Compared to images, video provides additional cues which can help to disambiguate the detection problem. Our goal in this paper is to learn discriminative models for the temporal evolution of object appearance and to use such models for object detection. To model temporal evolution, we introduce space-time tubes corresponding to temporal sequences of bounding boxes. We propose two CNN architectures for generating and classifying tubes, respectively. Our tube proposal network (TPN) first generates a large number of spatio-temporal tube"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.02619","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-17T23:58:55Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YfF0yTp1WWof4o1/RYaw36RlxS5NQ0xlGb+lQ1jXN7XnOL2ZzOldbkjqVGo5a8Gpr2Fx0BV4lHyZnj8lRICNAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-30T23:36:33.432215Z"},"content_sha256":"6c3917ce8afef7399909d26434fc1b53a85e80603c4307704c873888c462ed7d","schema_version":"1.0","event_id":"sha256:6c3917ce8afef7399909d26434fc1b53a85e80603c4307704c873888c462ed7d"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/bundle.json","state_url":"https://pith.science/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-30T23:36:33Z","links":{"resolver":"https://pith.science/pith/DJSLKS4HZYD6QD42VT5CBVBW4A","bundle":"https://pith.science/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/bundle.json","state":"https://pith.science/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/state.json","well_known_bundle":"https://pith.science/.well-known/pith/DJSLKS4HZYD6QD42VT5CBVBW4A/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2018:DJSLKS4HZYD6QD42VT5CBVBW4A","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"adc60e64b027e27284e827a9add5749c7632c921d1e5000b96c70e090df86015","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-12-06T15:48:54Z","title_canon_sha256":"0e7c123ab12ae0cc3c7adef5456a559cd90a8b8c126ee6419ed131d572d603c0"},"schema_version":"1.0","source":{"id":"1812.02619","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1812.02619","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"arxiv_version","alias_value":"1812.02619v1","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1812.02619","created_at":"2026-05-17T23:58:55Z"},{"alias_kind":"pith_short_12","alias_value":"DJSLKS4HZYD6","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_16","alias_value":"DJSLKS4HZYD6QD42","created_at":"2026-05-18T12:32:19Z"},{"alias_kind":"pith_short_8","alias_value":"DJSLKS4H","created_at":"2026-05-18T12:32:19Z"}],"graph_snapshots":[{"event_id":"sha256:6c3917ce8afef7399909d26434fc1b53a85e80603c4307704c873888c462ed7d","target":"graph","created_at":"2026-05-17T23:58:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Object detection in video is crucial for many applications. Compared to images, video provides additional cues which can help to disambiguate the detection problem. Our goal in this paper is to learn discriminative models for the temporal evolution of object appearance and to use such models for object detection. To model temporal evolution, we introduce space-time tubes corresponding to temporal sequences of bounding boxes. We propose two CNN architectures for generating and classifying tubes, respectively. Our tube proposal network (TPN) first generates a large number of spatio-temporal tube","authors_text":"Anton Osokin, Ivan Laptev, Tuan-Hung Vu","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-12-06T15:48:54Z","title":"Tube-CNN: Modeling temporal evolution of appearance for object detection in video"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1812.02619","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:18594a4182e1c5cc917bb990b4006969ac5102221016ebfd5cb864e1cb9967ec","target":"record","created_at":"2026-05-17T23:58:55Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"adc60e64b027e27284e827a9add5749c7632c921d1e5000b96c70e090df86015","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2018-12-06T15:48:54Z","title_canon_sha256":"0e7c123ab12ae0cc3c7adef5456a559cd90a8b8c126ee6419ed131d572d603c0"},"schema_version":"1.0","source":{"id":"1812.02619","kind":"arxiv","version":1}},"canonical_sha256":"1a64b54b87ce07e80f9aacfa20d436e01b146db147d4121c09cb625e9f5a51a1","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"1a64b54b87ce07e80f9aacfa20d436e01b146db147d4121c09cb625e9f5a51a1","first_computed_at":"2026-05-17T23:58:55.298788Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-17T23:58:55.298788Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"dwMvSWQfXiNRSbDC8ms6a0CwMiNQFNiuhd9Ji03jJhGflDuOQqs0ojzJsure3lhpDzgICmIyxVNNC3/mu2p+Bg==","signature_status":"signed_v1","signed_at":"2026-05-17T23:58:55.299254Z","signed_message":"canonical_sha256_bytes"},"source_id":"1812.02619","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:18594a4182e1c5cc917bb990b4006969ac5102221016ebfd5cb864e1cb9967ec","sha256:6c3917ce8afef7399909d26434fc1b53a85e80603c4307704c873888c462ed7d"],"state_sha256":"e39c18d2dab58e9a8af2ac64308df16d57184badb887ef4b4f4c9d6bf9eb896d"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"8Fn4QGtS9+tXgMAM6A/QQVL3CghFY4+Ax5xKjcaEqVmGG4WssPzUuDN80g4mEAnbfTxhRd9PNBGjMN0l0Gy0DA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-30T23:36:33.434350Z","bundle_sha256":"b178c0fbd7e1563b058b8a82c01df2c37ebe7018b55053d4e3638dc0c34412de"}}