{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:RYU2AZN2J4GJBV7FJ36RS2QDRT","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"726b24e809aaa247419cb7f83c5b70ac863540f8dae7ce5eb02dd72042ce4754","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T12:35:51Z","title_canon_sha256":"c0f93b20d4d316c033d21025403c3291911464f9820096acfba8790f40f8fbff"},"schema_version":"1.0","source":{"id":"2605.06137","kind":"arxiv","version":2}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.06137","created_at":"2026-06-01T01:03:54Z"},{"alias_kind":"arxiv_version","alias_value":"2605.06137v2","created_at":"2026-06-01T01:03:54Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.06137","created_at":"2026-06-01T01:03:54Z"},{"alias_kind":"pith_short_12","alias_value":"RYU2AZN2J4GJ","created_at":"2026-06-01T01:03:54Z"},{"alias_kind":"pith_short_16","alias_value":"RYU2AZN2J4GJBV7F","created_at":"2026-06-01T01:03:54Z"},{"alias_kind":"pith_short_8","alias_value":"RYU2AZN2","created_at":"2026-06-01T01:03:54Z"}],"graph_snapshots":[{"event_id":"sha256:9e49854de8e74d3d205050e2f5e56f4bbbeb6568b6da7217968569695c0f19f9","target":"graph","created_at":"2026-06-01T01:03:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":4,"items":[{"attestation":"unclaimed","claim_id":"C1","kind":"strongest_claim","source":"verdict.strongest_claim","status":"machine_extracted","text":"On ImageNet 256x256, Prologue-Base reduces gFID from 21.01 to 10.75 without classifier-free guidance while keeping reconstruction almost unchanged; Prologue-Large reaches a competitive rFID of 0.99 and gFID of 1.46 using a standard AR model without auxiliary semantic supervision."},{"attestation":"unclaimed","claim_id":"C2","kind":"weakest_assumption","source":"verdict.weakest_assumption","status":"machine_extracted","text":"The assumption that training prologue tokens exclusively with AR CE loss will not interfere with the visual tokens' reconstruction quality and that the ELBO formalization supports the decoupled optimization."},{"attestation":"unclaimed","claim_id":"C3","kind":"one_line_summary","source":"verdict.one_line_summary","status":"machine_extracted","text":"Prologue introduces dedicated prologue tokens to decouple generation and reconstruction in AR visual models, significantly improving generation FID scores on ImageNet while maintaining reconstruction quality."},{"attestation":"unclaimed","claim_id":"C4","kind":"headline","source":"verdict.pith_extraction.headline","status":"machine_extracted","text":"Prepending a small set of prologue tokens trained only on AR loss decouples generation from reconstruction in autoregressive image models."}],"snapshot_sha256":"17cd00dc84d509e17b769798e8d02715ae78bff4d23bbeb090398f84f84f0029"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[{"findings_count":0,"name":"claim_evidence","ran_at":"2026-05-20T13:02:04.297997Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"ai_meta_artifact","ran_at":"2026-05-20T08:36:43.479893Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_title_agreement","ran_at":"2026-05-19T19:01:19.381010Z","status":"completed","version":"1.0.0"},{"findings_count":0,"name":"doi_compliance","ran_at":"2026-05-19T12:55:47.107759Z","status":"completed","version":"1.0.0"}],"endpoint":"/pith/2605.06137/integrity.json","findings":[],"snapshot_sha256":"d33aa7f6baebfeac59e11662ddca406cd367af12d49edde56d32af5c3b118fc8","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"In this work, we propose Prologue, an approach to bridging the reconstruction-generation gap in autoregressive (AR) image generation. Instead of modifying visual tokens to satisfy both reconstruction and generation, Prologue generates a small set of prologue tokens prepended to the visual token sequence. These prologue tokens are trained exclusively with the AR cross-entropy (CE) loss, while visual tokens remain dedicated to reconstruction. This decoupled design lets us optimize generation through the AR model's true distribution without affecting reconstruction quality, which we further forma","authors_text":"Bowen Zheng, Colin Zhang, Guang Yang, Tianyang Hu, Weijian Luo","cross_cats":["cs.AI","cs.LG"],"headline":"Prepending a small set of prologue tokens trained only on AR loss decouples generation from reconstruction in autoregressive image models.","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T12:35:51Z","title":"Autoregressive Visual Generation Needs a Prologue"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.06137","kind":"arxiv","version":2},"verdict":{"created_at":"2026-05-08T13:48:32.689247Z","id":"4387a6b6-6f87-4b83-ace2-889d7f4e7849","model_set":{"reader":"grok-4.3"},"one_line_summary":"Prologue introduces dedicated prologue tokens to decouple generation and reconstruction in AR visual models, significantly improving generation FID scores on ImageNet while maintaining reconstruction quality.","pipeline_version":"pith-pipeline@v0.9.0","pith_extraction_headline":"Prepending a small set of prologue tokens trained only on AR loss decouples generation from reconstruction in autoregressive image models.","strongest_claim":"On ImageNet 256x256, Prologue-Base reduces gFID from 21.01 to 10.75 without classifier-free guidance while keeping reconstruction almost unchanged; Prologue-Large reaches a competitive rFID of 0.99 and gFID of 1.46 using a standard AR model without auxiliary semantic supervision.","weakest_assumption":"The assumption that training prologue tokens exclusively with AR CE loss will not interfere with the visual tokens' reconstruction quality and that the ELBO formalization supports the decoupled optimization."}},"verdict_id":"4387a6b6-6f87-4b83-ace2-889d7f4e7849"}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:f8d3c207c227fa1635fa7abe5414990dde4e57969ff63da74a045b2bf2160975","target":"record","created_at":"2026-06-01T01:03:54Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"726b24e809aaa247419cb7f83c5b70ac863540f8dae7ce5eb02dd72042ce4754","cross_cats_sorted":["cs.AI","cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.CV","submitted_at":"2026-05-07T12:35:51Z","title_canon_sha256":"c0f93b20d4d316c033d21025403c3291911464f9820096acfba8790f40f8fbff"},"schema_version":"1.0","source":{"id":"2605.06137","kind":"arxiv","version":2}},"canonical_sha256":"8e29a065ba4f0c90d7e54efd196a038cf99ad4c7f7658b6b29ad57588600595e","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"8e29a065ba4f0c90d7e54efd196a038cf99ad4c7f7658b6b29ad57588600595e","first_computed_at":"2026-06-01T01:03:54.500915Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-01T01:03:54.500915Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"3qX9e4HIzZBJpC4Is3DfaY0mf0kaDrSniTrhUjhQLax0F6vP+JFubClMnX5fh7Skq4b7HAtECUiM9MztZyt4AA==","signature_status":"signed_v1","signed_at":"2026-06-01T01:03:54.501675Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.06137","source_kind":"arxiv","source_version":2}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:f8d3c207c227fa1635fa7abe5414990dde4e57969ff63da74a045b2bf2160975","sha256:9e49854de8e74d3d205050e2f5e56f4bbbeb6568b6da7217968569695c0f19f9"],"state_sha256":"cfab09a32e12e8e06ee759ba332a8bc728d3e1a8fe400998818652f303c34852"}