{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2017:AEJYEAP6IWAFAFWWN6N6V7B2H4","short_pith_number":"pith:AEJYEAP6","canonical_record":{"source":{"id":"1708.05038","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-16T18:54:39Z","cross_cats_sorted":[],"title_canon_sha256":"9cd1b2da276f61b38ab57f14307cce39afb9c1c97658be7c0d5ea0454eef4e1c","abstract_canon_sha256":"ed4853802c1cca8eea6e9f5ee4e0244e59cb12820783933b72308ed46a7981fb"},"schema_version":"1.0"},"canonical_sha256":"01138201fe45805016d66f9beafc3a3f32f38b1d6c111ab551df01b25b6f6523","source":{"kind":"arxiv","id":"1708.05038","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.05038","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"arxiv_version","alias_value":"1708.05038v1","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.05038","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"pith_short_12","alias_value":"AEJYEAP6IWAF","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_16","alias_value":"AEJYEAP6IWAFAFWW","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_8","alias_value":"AEJYEAP6","created_at":"2026-05-18T12:31:05Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2017:AEJYEAP6IWAFAFWWN6N6V7B2H4","target":"record","payload":{"canonical_record":{"source":{"id":"1708.05038","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-16T18:54:39Z","cross_cats_sorted":[],"title_canon_sha256":"9cd1b2da276f61b38ab57f14307cce39afb9c1c97658be7c0d5ea0454eef4e1c","abstract_canon_sha256":"ed4853802c1cca8eea6e9f5ee4e0244e59cb12820783933b72308ed46a7981fb"},"schema_version":"1.0"},"canonical_sha256":"01138201fe45805016d66f9beafc3a3f32f38b1d6c111ab551df01b25b6f6523","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:37:54.041087Z","signature_b64":"GVy8r1giP4TEMfDSW8jpV5lGn4yukvfHgQLgrVQykIX9CfyWSMGqfUJpjVMVLWTB//wAOlIFNtNMhAG9a8XjAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"01138201fe45805016d66f9beafc3a3f32f38b1d6c111ab551df01b25b6f6523","last_reissued_at":"2026-05-18T00:37:54.040643Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:37:54.040643Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"1708.05038","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:37:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+g66jQerR08VNPFrbn/GfVbH+5sGZyNPNifikQEkPRMCOJLV34BPvLg00+e+IVCqcUAebVPOwT8CbFzGQi1/Cg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T15:49:33.690279Z"},"content_sha256":"cf48fbdc4517b3af3debe17e662eb541ae438b87d814994264d0f594006a867f","schema_version":"1.0","event_id":"sha256:cf48fbdc4517b3af3debe17e662eb541ae438b87d814994264d0f594006a867f"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2017:AEJYEAP6IWAFAFWWN6N6V7B2H4","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"ConvNet Architecture Search for Spatiotemporal Feature Learning","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Du Tran, Jamie Ray, Manohar Paluri, Shih-Fu Chang, Zheng Shou","submitted_at":"2017-08-16T18:54:39Z","abstract_excerpt":"Learning image representations with ConvNets by pre-training on ImageNet has proven useful across many visual understanding tasks including object detection, semantic segmentation, and image captioning. Although any image representation can be applied to video frames, a dedicated spatiotemporal representation is still vital in order to incorporate motion patterns that cannot be captured by appearance based models alone. This paper presents an empirical ConvNet architecture search for spatiotemporal feature learning, culminating in a deep 3-dimensional (3D) Residual ConvNet. Our proposed archit"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.05038","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-18T00:37:54Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"hEr2v1oS/V13RzAVZGOCcsvEn0j7Z7XiUc1QHPF85SqYC4baQ6L9C5mTHdCu4vc46izZjXZK/mySVAhk7vCjAg==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-26T15:49:33.690675Z"},"content_sha256":"84ef5ed21ce78d220d8a8b031b4a59b1633b25638412007c1c1ddfa06adbd5a4","schema_version":"1.0","event_id":"sha256:84ef5ed21ce78d220d8a8b031b4a59b1633b25638412007c1c1ddfa06adbd5a4"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/bundle.json","state_url":"https://pith.science/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-26T15:49:33Z","links":{"resolver":"https://pith.science/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4","bundle":"https://pith.science/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/bundle.json","state":"https://pith.science/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/state.json","well_known_bundle":"https://pith.science/.well-known/pith/AEJYEAP6IWAFAFWWN6N6V7B2H4/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2017:AEJYEAP6IWAFAFWWN6N6V7B2H4","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"ed4853802c1cca8eea6e9f5ee4e0244e59cb12820783933b72308ed46a7981fb","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-16T18:54:39Z","title_canon_sha256":"9cd1b2da276f61b38ab57f14307cce39afb9c1c97658be7c0d5ea0454eef4e1c"},"schema_version":"1.0","source":{"id":"1708.05038","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"1708.05038","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"arxiv_version","alias_value":"1708.05038v1","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1708.05038","created_at":"2026-05-18T00:37:54Z"},{"alias_kind":"pith_short_12","alias_value":"AEJYEAP6IWAF","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_16","alias_value":"AEJYEAP6IWAFAFWW","created_at":"2026-05-18T12:31:05Z"},{"alias_kind":"pith_short_8","alias_value":"AEJYEAP6","created_at":"2026-05-18T12:31:05Z"}],"graph_snapshots":[{"event_id":"sha256:84ef5ed21ce78d220d8a8b031b4a59b1633b25638412007c1c1ddfa06adbd5a4","target":"graph","created_at":"2026-05-18T00:37:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"paper":{"abstract_excerpt":"Learning image representations with ConvNets by pre-training on ImageNet has proven useful across many visual understanding tasks including object detection, semantic segmentation, and image captioning. Although any image representation can be applied to video frames, a dedicated spatiotemporal representation is still vital in order to incorporate motion patterns that cannot be captured by appearance based models alone. This paper presents an empirical ConvNet architecture search for spatiotemporal feature learning, culminating in a deep 3-dimensional (3D) Residual ConvNet. Our proposed archit","authors_text":"Du Tran, Jamie Ray, Manohar Paluri, Shih-Fu Chang, Zheng Shou","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-16T18:54:39Z","title":"ConvNet Architecture Search for Spatiotemporal Feature Learning"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1708.05038","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:cf48fbdc4517b3af3debe17e662eb541ae438b87d814994264d0f594006a867f","target":"record","created_at":"2026-05-18T00:37:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"ed4853802c1cca8eea6e9f5ee4e0244e59cb12820783933b72308ed46a7981fb","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2017-08-16T18:54:39Z","title_canon_sha256":"9cd1b2da276f61b38ab57f14307cce39afb9c1c97658be7c0d5ea0454eef4e1c"},"schema_version":"1.0","source":{"id":"1708.05038","kind":"arxiv","version":1}},"canonical_sha256":"01138201fe45805016d66f9beafc3a3f32f38b1d6c111ab551df01b25b6f6523","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"01138201fe45805016d66f9beafc3a3f32f38b1d6c111ab551df01b25b6f6523","first_computed_at":"2026-05-18T00:37:54.040643Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-18T00:37:54.040643Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"GVy8r1giP4TEMfDSW8jpV5lGn4yukvfHgQLgrVQykIX9CfyWSMGqfUJpjVMVLWTB//wAOlIFNtNMhAG9a8XjAw==","signature_status":"signed_v1","signed_at":"2026-05-18T00:37:54.041087Z","signed_message":"canonical_sha256_bytes"},"source_id":"1708.05038","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:cf48fbdc4517b3af3debe17e662eb541ae438b87d814994264d0f594006a867f","sha256:84ef5ed21ce78d220d8a8b031b4a59b1633b25638412007c1c1ddfa06adbd5a4"],"state_sha256":"ab14b26b62eb2df307821d6420be3c98410ed3118c816189bc09095efa678c12"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"az1zUOz7r5JYEeePT98b7vZMCLt/+fjLwUMxICL6A0Td5NynfSVDi/P9ICE4I90MQ5czCp6dhcmFDuj1rmfhAg==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-26T15:49:33.693109Z","bundle_sha256":"0cb496d1ec8d05cde400212e40170d2da7a0991d6044b3457a9ad7f30a18f90a"}}