{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:D3PUDUKIQDMJMDQU7EFHZCIKZF","short_pith_number":"pith:D3PUDUKI","schema_version":"1.0","canonical_sha256":"1edf41d14880d8960e14f90a7c890ac96c3ed30b083b3db70702eaf2c7377e81","source":{"kind":"arxiv","id":"2605.14923","version":1},"attestation_state":"computed","paper":{"title":"SceneParser: Hierarchical Scene Parsing for Visual Semantics Understanding","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Hao Fei, Luping Xiao, Meishan Zhang, Pengxin Xu, Qing Jiang, Shanghang Zhang, Xincheng Lin, Xingyu Chen","submitted_at":"2026-05-14T14:58:46Z","abstract_excerpt":"General scene perception has progressed from object recognition toward open-vocabulary grounding, part localization, and affordance prediction. Yet these capabilities are often realized as isolated predictions that localize objects, parts, or interaction points without capturing the structured dependencies needed for interaction-oriented scene understanding. To address this gap, we introduce Hierarchical Scene Parsing, an interaction-oriented parsing task that represents physical scenes as explicit scene -> object -> part -> affordance hierarchies with cross-level bindings. We instantiate this"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.14923","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-14T14:58:46Z","cross_cats_sorted":[],"title_canon_sha256":"f387f64abd612039af6b2716c76652b7439f75c4a667bf1a0e25a3481a3ae974","abstract_canon_sha256":"fcf42a77bde38058497805bc490578b5f80d4686933749fdc1e1f1837167699d"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-17T23:38:55.641114Z","signature_b64":"gsV+58ixEECG1Ei4cxPAWQYcFL+MOxE9m3XUcRnOtwJRn+LjP2DIkGvDpSky9djApTqZo47XgxAJjXX5CXv/DQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"1edf41d14880d8960e14f90a7c890ac96c3ed30b083b3db70702eaf2c7377e81","last_reissued_at":"2026-05-17T23:38:55.640469Z","signature_status":"signed_v1","first_computed_at":"2026-05-17T23:38:55.640469Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"SceneParser: Hierarchical Scene Parsing for Visual Semantics Understanding","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Hao Fei, Luping Xiao, Meishan Zhang, Pengxin Xu, Qing Jiang, Shanghang Zhang, Xincheng Lin, Xingyu Chen","submitted_at":"2026-05-14T14:58:46Z","abstract_excerpt":"General scene perception has progressed from object recognition toward open-vocabulary grounding, part localization, and affordance prediction. Yet these capabilities are often realized as isolated predictions that localize objects, parts, or interaction points without capturing the structured dependencies needed for interaction-oriented scene understanding. To address this gap, we introduce Hierarchical Scene Parsing, an interaction-oriented parsing task that represents physical scenes as explicit scene -> object -> part -> affordance hierarchies with cross-level bindings. We instantiate this"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.14923","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.14923","created_at":"2026-05-17T23:38:55.640576+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.14923v1","created_at":"2026-05-17T23:38:55.640576+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.14923","created_at":"2026-05-17T23:38:55.640576+00:00"},{"alias_kind":"pith_short_12","alias_value":"D3PUDUKIQDMJ","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_16","alias_value":"D3PUDUKIQDMJMDQU","created_at":"2026-05-18T12:33:37.589309+00:00"},{"alias_kind":"pith_short_8","alias_value":"D3PUDUKI","created_at":"2026-05-18T12:33:37.589309+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF","json":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF.json","graph_json":"https://pith.science/api/pith-number/D3PUDUKIQDMJMDQU7EFHZCIKZF/graph.json","events_json":"https://pith.science/api/pith-number/D3PUDUKIQDMJMDQU7EFHZCIKZF/events.json","paper":"https://pith.science/paper/D3PUDUKI"},"agent_actions":{"view_html":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF","download_json":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF.json","view_paper":"https://pith.science/paper/D3PUDUKI","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.14923&json=true","fetch_graph":"https://pith.science/api/pith-number/D3PUDUKIQDMJMDQU7EFHZCIKZF/graph.json","fetch_events":"https://pith.science/api/pith-number/D3PUDUKIQDMJMDQU7EFHZCIKZF/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF/action/timestamp_anchor","attest_storage":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF/action/storage_attestation","attest_author":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF/action/author_attestation","sign_citation":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF/action/citation_signature","submit_replication":"https://pith.science/pith/D3PUDUKIQDMJMDQU7EFHZCIKZF/action/replication_record"}},"created_at":"2026-05-17T23:38:55.640576+00:00","updated_at":"2026-05-17T23:38:55.640576+00:00"}