{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:6X4UWWREEHZLPHUIVCH7H4KECW","short_pith_number":"pith:6X4UWWRE","schema_version":"1.0","canonical_sha256":"f5f94b5a2421f2b79e88a88ff3f14415bd645b3a891ce41c31ecebd367129f32","source":{"kind":"arxiv","id":"2606.30124","version":1},"attestation_state":"computed","paper":{"title":"SciIR: A Large-scale Training Dataset and Benchmark for Scientific Image Reasoning Generation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bowen Zhou, Jiabao Wei, Jianjun Li, Junhao Xiao, Peize Li, Ruijie Li, Yuning An, Zhengfeng Shi, Zhiyuan Ma","submitted_at":"2026-06-29T10:59:10Z","abstract_excerpt":"While Text-to-Image (T2I) models have shown remarkable success in generating photorealistic visual content, they still struggle with the rigorous semantic alignment and logical reasoning required for scientific imagery. Inspired by Peirce's Semiotic Triad, we introduce Scientific Image Reasoning (SciIR), a comprehensive resource for training and evaluation of scientific image generation. We formalize scientific reasoning into three core dimensions: Entity Structure (Icon), Scientific Process (Index), and Scientific Law (Symbol). Specifically, to overcome the scarcity of training data in scient"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2606.30124","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CV","submitted_at":"2026-06-29T10:59:10Z","cross_cats_sorted":[],"title_canon_sha256":"081be0a158f412f944602d3f91bba1c763ad85a62fe2c23c1a05ac68ab39f70f","abstract_canon_sha256":"5599a5405d2ef175ef60bb1dbe528f3969a5caba02e2991e782d0fc196fb3aa0"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-30T02:17:50.654436Z","signature_b64":"8WDerifdS+1TmogVpJV9WxNTgmXBZ1DX/VnscEYYKK/rb9pVwwhGPtTULQ1wPWdOcZ1kr547fIoUa73+JIRTDQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"f5f94b5a2421f2b79e88a88ff3f14415bd645b3a891ce41c31ecebd367129f32","last_reissued_at":"2026-06-30T02:17:50.653919Z","signature_status":"signed_v1","first_computed_at":"2026-06-30T02:17:50.653919Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"SciIR: A Large-scale Training Dataset and Benchmark for Scientific Image Reasoning Generation","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Bowen Zhou, Jiabao Wei, Jianjun Li, Junhao Xiao, Peize Li, Ruijie Li, Yuning An, Zhengfeng Shi, Zhiyuan Ma","submitted_at":"2026-06-29T10:59:10Z","abstract_excerpt":"While Text-to-Image (T2I) models have shown remarkable success in generating photorealistic visual content, they still struggle with the rigorous semantic alignment and logical reasoning required for scientific imagery. Inspired by Peirce's Semiotic Triad, we introduce Scientific Image Reasoning (SciIR), a comprehensive resource for training and evaluation of scientific image generation. We formalize scientific reasoning into three core dimensions: Entity Structure (Icon), Scientific Process (Index), and Scientific Law (Symbol). Specifically, to overcome the scarcity of training data in scient"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.30124","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.30124/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2606.30124","created_at":"2026-06-30T02:17:50.653998+00:00"},{"alias_kind":"arxiv_version","alias_value":"2606.30124v1","created_at":"2026-06-30T02:17:50.653998+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.30124","created_at":"2026-06-30T02:17:50.653998+00:00"},{"alias_kind":"pith_short_12","alias_value":"6X4UWWREEHZL","created_at":"2026-06-30T02:17:50.653998+00:00"},{"alias_kind":"pith_short_16","alias_value":"6X4UWWREEHZLPHUI","created_at":"2026-06-30T02:17:50.653998+00:00"},{"alias_kind":"pith_short_8","alias_value":"6X4UWWRE","created_at":"2026-06-30T02:17:50.653998+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW","json":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW.json","graph_json":"https://pith.science/api/pith-number/6X4UWWREEHZLPHUIVCH7H4KECW/graph.json","events_json":"https://pith.science/api/pith-number/6X4UWWREEHZLPHUIVCH7H4KECW/events.json","paper":"https://pith.science/paper/6X4UWWRE"},"agent_actions":{"view_html":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW","download_json":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW.json","view_paper":"https://pith.science/paper/6X4UWWRE","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2606.30124&json=true","fetch_graph":"https://pith.science/api/pith-number/6X4UWWREEHZLPHUIVCH7H4KECW/graph.json","fetch_events":"https://pith.science/api/pith-number/6X4UWWREEHZLPHUIVCH7H4KECW/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW/action/timestamp_anchor","attest_storage":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW/action/storage_attestation","attest_author":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW/action/author_attestation","sign_citation":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW/action/citation_signature","submit_replication":"https://pith.science/pith/6X4UWWREEHZLPHUIVCH7H4KECW/action/replication_record"}},"created_at":"2026-06-30T02:17:50.653998+00:00","updated_at":"2026-06-30T02:17:50.653998+00:00"}