{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2016:JYY5YQ3Y7QZ6WTYWLGH774SXWU","short_pith_number":"pith:JYY5YQ3Y","schema_version":"1.0","canonical_sha256":"4e31dc4378fc33eb4f16598ffff257b52d8833c1e2382afb6dbd2ee3228ff7f8","source":{"kind":"arxiv","id":"1609.00153","version":2},"attestation_state":"computed","paper":{"title":"Weakly Supervised PatchNets: Describing and Aggregating Local Patches for Scene Recognition","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bowen Zhang, Limin Wang, Yali Wang, Yu Qiao, Zhe Wang","submitted_at":"2016-09-01T09:15:41Z","abstract_excerpt":"Traditional feature encoding scheme (e.g., Fisher vector) with local descriptors (e.g., SIFT) and recent convolutional neural networks (CNNs) are two classes of successful methods for image recognition. In this paper, we propose a hybrid representation, which leverages the discriminative capacity of CNNs and the simplicity of descriptor encoding schema for image recognition, with a focus on scene recognition. To this end, we make three main contributions from the following aspects. First, we propose a patch-level and end-to-end architecture to model the appearance of local patches, called {\\em"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"1609.00153","kind":"arxiv","version":2},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2016-09-01T09:15:41Z","cross_cats_sorted":[],"title_canon_sha256":"9d538c6ad53ce45d612e02c897e97c141168f0c288b1e733c2b1cf63ba9a500e","abstract_canon_sha256":"09687ce2b0a4d4b7ba6b18c0515c913e2413ee98708dfab67ee98141ce330485"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-18T00:45:48.598746Z","signature_b64":"9xz6dZ5tW6qlttxIJwPR2wE/JgJ7zEwwx9WrOmg8WamtmBKwS5k1F2SBKy7xIPAkFYibFYugCJJ6GJo15Ox4AA==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"4e31dc4378fc33eb4f16598ffff257b52d8833c1e2382afb6dbd2ee3228ff7f8","last_reissued_at":"2026-05-18T00:45:48.598148Z","signature_status":"signed_v1","first_computed_at":"2026-05-18T00:45:48.598148Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Weakly Supervised PatchNets: Describing and Aggregating Local Patches for Scene Recognition","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bowen Zhang, Limin Wang, Yali Wang, Yu Qiao, Zhe Wang","submitted_at":"2016-09-01T09:15:41Z","abstract_excerpt":"Traditional feature encoding scheme (e.g., Fisher vector) with local descriptors (e.g., SIFT) and recent convolutional neural networks (CNNs) are two classes of successful methods for image recognition. In this paper, we propose a hybrid representation, which leverages the discriminative capacity of CNNs and the simplicity of descriptor encoding schema for image recognition, with a focus on scene recognition. To this end, we make three main contributions from the following aspects. First, we propose a patch-level and end-to-end architecture to model the appearance of local patches, called {\\em"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"1609.00153","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"1609.00153","created_at":"2026-05-18T00:45:48.598251+00:00"},{"alias_kind":"arxiv_version","alias_value":"1609.00153v2","created_at":"2026-05-18T00:45:48.598251+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.1609.00153","created_at":"2026-05-18T00:45:48.598251+00:00"},{"alias_kind":"pith_short_12","alias_value":"JYY5YQ3Y7QZ6","created_at":"2026-05-18T12:30:25.849896+00:00"},{"alias_kind":"pith_short_16","alias_value":"JYY5YQ3Y7QZ6WTYW","created_at":"2026-05-18T12:30:25.849896+00:00"},{"alias_kind":"pith_short_8","alias_value":"JYY5YQ3Y","created_at":"2026-05-18T12:30:25.849896+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU","json":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU.json","graph_json":"https://pith.science/api/pith-number/JYY5YQ3Y7QZ6WTYWLGH774SXWU/graph.json","events_json":"https://pith.science/api/pith-number/JYY5YQ3Y7QZ6WTYWLGH774SXWU/events.json","paper":"https://pith.science/paper/JYY5YQ3Y"},"agent_actions":{"view_html":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU","download_json":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU.json","view_paper":"https://pith.science/paper/JYY5YQ3Y","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=1609.00153&json=true","fetch_graph":"https://pith.science/api/pith-number/JYY5YQ3Y7QZ6WTYWLGH774SXWU/graph.json","fetch_events":"https://pith.science/api/pith-number/JYY5YQ3Y7QZ6WTYWLGH774SXWU/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU/action/timestamp_anchor","attest_storage":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU/action/storage_attestation","attest_author":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU/action/author_attestation","sign_citation":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU/action/citation_signature","submit_replication":"https://pith.science/pith/JYY5YQ3Y7QZ6WTYWLGH774SXWU/action/replication_record"}},"created_at":"2026-05-18T00:45:48.598251+00:00","updated_at":"2026-05-18T00:45:48.598251+00:00"}