{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2022:GRQDQ4NHYFDUHLLTMFPJSMIBZK","short_pith_number":"pith:GRQDQ4NH","canonical_record":{"source":{"id":"2205.00159","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2022-04-30T04:37:01Z","cross_cats_sorted":[],"title_canon_sha256":"3916fb3a1cb77f65f428c60e2275b4a4beb7433b7ef756a0c52c33d93e1d50c8","abstract_canon_sha256":"e42eaade339853651172ef18d24916b1618d62accb790481a5b0985c44b1378b"},"schema_version":"1.0"},"canonical_sha256":"34603871a7c14743ad73615e993101caa6451246f22f7ebabc3b9c8925c3c54d","source":{"kind":"arxiv","id":"2205.00159","version":2},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2205.00159","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"arxiv_version","alias_value":"2205.00159v2","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2205.00159","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_12","alias_value":"GRQDQ4NHYFDU","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_16","alias_value":"GRQDQ4NHYFDUHLLT","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_8","alias_value":"GRQDQ4NH","created_at":"2026-07-05T04:25:17Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2022:GRQDQ4NHYFDUHLLTMFPJSMIBZK","target":"record","payload":{"canonical_record":{"source":{"id":"2205.00159","kind":"arxiv","version":2},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2022-04-30T04:37:01Z","cross_cats_sorted":[],"title_canon_sha256":"3916fb3a1cb77f65f428c60e2275b4a4beb7433b7ef756a0c52c33d93e1d50c8","abstract_canon_sha256":"e42eaade339853651172ef18d24916b1618d62accb790481a5b0985c44b1378b"},"schema_version":"1.0"},"canonical_sha256":"34603871a7c14743ad73615e993101caa6451246f22f7ebabc3b9c8925c3c54d","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-07-05T04:25:17.729394Z","signature_b64":"VzB1V3IIpJLZtyeSI0HvcfJfT+Nynk9yEVkqN5TwescPfM0XCja7Klo27tLCrB1tqkebtWsh5IYfA+/v+fWZAQ==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"34603871a7c14743ad73615e993101caa6451246f22f7ebabc3b9c8925c3c54d","last_reissued_at":"2026-07-05T04:25:17.728872Z","signature_status":"signed_v1","first_computed_at":"2026-07-05T04:25:17.728872Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2205.00159","source_version":2,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T04:25:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"E1uFozJN9M6yMMn65/YfpGCpkAcNSIyG9hN2svi1y7eGIeOAztWEgsAsGZJS2qI9Ra/oBTHyOT6Tkna5L4EzBA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:37:21.254878Z"},"content_sha256":"133e10b0e3dcb7cc1e3c951da353be3fb240fac9d428cdd713b1126528edcddd","schema_version":"1.0","event_id":"sha256:133e10b0e3dcb7cc1e3c951da353be3fb240fac9d428cdd713b1126528edcddd"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2022:GRQDQ4NHYFDUHLLTMFPJSMIBZK","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"SVTR: Scene Text Recognition with a Single Visual Model","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":[],"primary_cat":"cs.CV","authors_text":"Caiyan Jia, Chenxia Li, Tianlun Zheng, Xiaoting Yin, Yongkun Du, Yu-Gang Jiang, Yuning Du, Zhineng Chen","submitted_at":"2022-04-30T04:37:01Z","abstract_excerpt":"Dominant scene text recognition models commonly contain two building blocks, a visual model for feature extraction and a sequence model for text transcription. This hybrid architecture, although accurate, is complex and less efficient. In this study, we propose a Single Visual model for Scene Text recognition within the patch-wise image tokenization framework, which dispenses with the sequential modeling entirely. The method, termed SVTR, firstly decomposes an image text into small patches named character components. Afterward, hierarchical stages are recurrently carried out by component-level"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2205.00159","kind":"arxiv","version":2},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2205.00159/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-07-05T04:25:17Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"9NaMe4UzTUgwkog14EeQe78Yk/DvUVsxFoEAx/nlAwC/JvO5VDzBO5Gt2Z8IsuPF3AAYHkqlQNP+90AqvWE+Aw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-07-05T15:37:21.255506Z"},"content_sha256":"ceca36bf292e3ce1ba6f0ffce4cf6b70735c7875d3de9eae354a89a73a497579","schema_version":"1.0","event_id":"sha256:ceca36bf292e3ce1ba6f0ffce4cf6b70735c7875d3de9eae354a89a73a497579"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/bundle.json","state_url":"https://pith.science/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-07-05T15:37:21Z","links":{"resolver":"https://pith.science/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK","bundle":"https://pith.science/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/bundle.json","state":"https://pith.science/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/state.json","well_known_bundle":"https://pith.science/.well-known/pith/GRQDQ4NHYFDUHLLTMFPJSMIBZK/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2022:GRQDQ4NHYFDUHLLTMFPJSMIBZK","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e42eaade339853651172ef18d24916b1618d62accb790481a5b0985c44b1378b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2022-04-30T04:37:01Z","title_canon_sha256":"3916fb3a1cb77f65f428c60e2275b4a4beb7433b7ef756a0c52c33d93e1d50c8"},"schema_version":"1.0","source":{"id":"2205.00159","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2205.00159","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"arxiv_version","alias_value":"2205.00159v2","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2205.00159","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_12","alias_value":"GRQDQ4NHYFDU","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_16","alias_value":"GRQDQ4NHYFDUHLLT","created_at":"2026-07-05T04:25:17Z"},{"alias_kind":"pith_short_8","alias_value":"GRQDQ4NH","created_at":"2026-07-05T04:25:17Z"}],"graph_snapshots":[{"event_id":"sha256:ceca36bf292e3ce1ba6f0ffce4cf6b70735c7875d3de9eae354a89a73a497579","target":"graph","created_at":"2026-07-05T04:25:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2205.00159/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Dominant scene text recognition models commonly contain two building blocks, a visual model for feature extraction and a sequence model for text transcription. This hybrid architecture, although accurate, is complex and less efficient. In this study, we propose a Single Visual model for Scene Text recognition within the patch-wise image tokenization framework, which dispenses with the sequential modeling entirely. The method, termed SVTR, firstly decomposes an image text into small patches named character components. Afterward, hierarchical stages are recurrently carried out by component-level","authors_text":"Caiyan Jia, Chenxia Li, Tianlun Zheng, Xiaoting Yin, Yongkun Du, Yu-Gang Jiang, Yuning Du, Zhineng Chen","cross_cats":[],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2022-04-30T04:37:01Z","title":"SVTR: Scene Text Recognition with a Single Visual Model"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2205.00159","kind":"arxiv","version":2},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:133e10b0e3dcb7cc1e3c951da353be3fb240fac9d428cdd713b1126528edcddd","target":"record","created_at":"2026-07-05T04:25:17Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e42eaade339853651172ef18d24916b1618d62accb790481a5b0985c44b1378b","cross_cats_sorted":[],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2022-04-30T04:37:01Z","title_canon_sha256":"3916fb3a1cb77f65f428c60e2275b4a4beb7433b7ef756a0c52c33d93e1d50c8"},"schema_version":"1.0","source":{"id":"2205.00159","kind":"arxiv","version":2}},"canonical_sha256":"34603871a7c14743ad73615e993101caa6451246f22f7ebabc3b9c8925c3c54d","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"34603871a7c14743ad73615e993101caa6451246f22f7ebabc3b9c8925c3c54d","first_computed_at":"2026-07-05T04:25:17.728872Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-07-05T04:25:17.728872Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"VzB1V3IIpJLZtyeSI0HvcfJfT+Nynk9yEVkqN5TwescPfM0XCja7Klo27tLCrB1tqkebtWsh5IYfA+/v+fWZAQ==","signature_status":"signed_v1","signed_at":"2026-07-05T04:25:17.729394Z","signed_message":"canonical_sha256_bytes"},"source_id":"2205.00159","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:133e10b0e3dcb7cc1e3c951da353be3fb240fac9d428cdd713b1126528edcddd","sha256:ceca36bf292e3ce1ba6f0ffce4cf6b70735c7875d3de9eae354a89a73a497579"],"state_sha256":"c9fa14915decd32b1e91fa79d25f1056fc79bd7d212e08ccb8b85ec98d75f9e7"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"KrczrvPlStbVaEIYHeKgtkOjzL2PojXQw4mrCj7bC0gS7aXkXHc+OjsXmRCJxqYBUsPuDWYVepR18u8Jt+GHAA==","signed_message":"bundle_sha256_bytes","signed_at":"2026-07-05T15:37:21.258504Z","bundle_sha256":"cb4d46c6e93264083355611d1366e3e2374683ff9095aac8cb0f2efabe6a7d84"}}