{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:Y4GW2JWNSWT3LT5ADT7RESI4XF","short_pith_number":"pith:Y4GW2JWN","canonical_record":{"source":{"id":"2606.01479","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-31T22:39:45Z","cross_cats_sorted":[],"title_canon_sha256":"e2d6abf27b3667b00a9fff85d6001fa722630ddfba9a446a156c4d3ec23fc063","abstract_canon_sha256":"e5995b1f30d04f17ea0445f42c145e6e519c33104f196c463e910d574bd48f32"},"schema_version":"1.0"},"canonical_sha256":"c70d6d26cd95a7b5cfa01cff12491cb94f9b8dee50f8710d05c5f8fe9d63ebf8","source":{"kind":"arxiv","id":"2606.01479","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.01479","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"arxiv_version","alias_value":"2606.01479v1","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.01479","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_12","alias_value":"Y4GW2JWNSWT3","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_16","alias_value":"Y4GW2JWNSWT3LT5A","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_8","alias_value":"Y4GW2JWN","created_at":"2026-06-02T02:04:34Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:Y4GW2JWNSWT3LT5ADT7RESI4XF","target":"record","payload":{"canonical_record":{"source":{"id":"2606.01479","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-31T22:39:45Z","cross_cats_sorted":[],"title_canon_sha256":"e2d6abf27b3667b00a9fff85d6001fa722630ddfba9a446a156c4d3ec23fc063","abstract_canon_sha256":"e5995b1f30d04f17ea0445f42c145e6e519c33104f196c463e910d574bd48f32"},"schema_version":"1.0"},"canonical_sha256":"c70d6d26cd95a7b5cfa01cff12491cb94f9b8dee50f8710d05c5f8fe9d63ebf8","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-06-02T02:04:34.451093Z","signature_b64":"24nKHURU5138wOuxNcjS4X15kn3c6MwA6dyyryjM2K4iJqYhJb1drmgoaoeX1up0vXXp6znFg1m0yWefQ+/YAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"c70d6d26cd95a7b5cfa01cff12491cb94f9b8dee50f8710d05c5f8fe9d63ebf8","last_reissued_at":"2026-06-02T02:04:34.450679Z","signature_status":"signed_v1","first_computed_at":"2026-06-02T02:04:34.450679Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2606.01479","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T02:04:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"3RLN1Fx0ycT6rR1TfMkSQkXpkBuIK2xaQz5qsJ+p9PP7yegBCQBJzSvn4Ix5aPTz0iaJZ1pC6v6sJX0VKCKrDw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T13:14:06.223923Z"},"content_sha256":"7ab76fab472322c3d6dc71d5bc2ee64a63e4bcaceec73dae3df6738bacb50d0d","schema_version":"1.0","event_id":"sha256:7ab76fab472322c3d6dc71d5bc2ee64a63e4bcaceec73dae3df6738bacb50d0d"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:Y4GW2JWNSWT3LT5ADT7RESI4XF","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Sparse Autoencoders for Interpretable Emotion Control in Text-to-Speech","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.CL","authors_text":"Gang Zhou, Hongfei Du, Jiacheng Shi, Sidi Lu, Ye Gao","submitted_at":"2026-05-31T22:39:45Z","abstract_excerpt":"Integrating large language models (LLMs) into text-to-speech (TTS) systems has improved speech expressiveness, yet interpretable emotional control remains challenging. Existing approaches primarily rely on external conditioning or global activation steering, offering limited insight into the internal representations underlying emotional control. In this work, we analyze emotion-related variation in the semantic hidden states of LLM-based TTS models using sparse autoencoders (SAEs) to identify sparse latent features. Our analysis shows that emotional variation is distributed across multiple spa"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.01479","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2606.01479/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-06-02T02:04:34Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"MuVz3+mb5oElBQh98nTmzBvbeOp7QwFeLQGpbnG/YlwyQbqLQwIuIA/MwI+mR6hmXwY6r9KayfTQBr2RAlb9Dw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-06-02T13:14:06.224307Z"},"content_sha256":"7ca616772cb1974f693de7e23a41ba06fa8bb9196b2fbcdff2edecfc71180555","schema_version":"1.0","event_id":"sha256:7ca616772cb1974f693de7e23a41ba06fa8bb9196b2fbcdff2edecfc71180555"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/bundle.json","state_url":"https://pith.science/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-06-02T13:14:06Z","links":{"resolver":"https://pith.science/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF","bundle":"https://pith.science/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/bundle.json","state":"https://pith.science/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/state.json","well_known_bundle":"https://pith.science/.well-known/pith/Y4GW2JWNSWT3LT5ADT7RESI4XF/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:Y4GW2JWNSWT3LT5ADT7RESI4XF","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"e5995b1f30d04f17ea0445f42c145e6e519c33104f196c463e910d574bd48f32","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-31T22:39:45Z","title_canon_sha256":"e2d6abf27b3667b00a9fff85d6001fa722630ddfba9a446a156c4d3ec23fc063"},"schema_version":"1.0","source":{"id":"2606.01479","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2606.01479","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"arxiv_version","alias_value":"2606.01479v1","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2606.01479","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_12","alias_value":"Y4GW2JWNSWT3","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_16","alias_value":"Y4GW2JWNSWT3LT5A","created_at":"2026-06-02T02:04:34Z"},{"alias_kind":"pith_short_8","alias_value":"Y4GW2JWN","created_at":"2026-06-02T02:04:34Z"}],"graph_snapshots":[{"event_id":"sha256:7ca616772cb1974f693de7e23a41ba06fa8bb9196b2fbcdff2edecfc71180555","target":"graph","created_at":"2026-06-02T02:04:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2606.01479/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Integrating large language models (LLMs) into text-to-speech (TTS) systems has improved speech expressiveness, yet interpretable emotional control remains challenging. Existing approaches primarily rely on external conditioning or global activation steering, offering limited insight into the internal representations underlying emotional control. In this work, we analyze emotion-related variation in the semantic hidden states of LLM-based TTS models using sparse autoencoders (SAEs) to identify sparse latent features. Our analysis shows that emotional variation is distributed across multiple spa","authors_text":"Gang Zhou, Hongfei Du, Jiacheng Shi, Sidi Lu, Ye Gao","cross_cats":[],"headline":"","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-31T22:39:45Z","title":"Sparse Autoencoders for Interpretable Emotion Control in Text-to-Speech"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2606.01479","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:7ab76fab472322c3d6dc71d5bc2ee64a63e4bcaceec73dae3df6738bacb50d0d","target":"record","created_at":"2026-06-02T02:04:34Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"e5995b1f30d04f17ea0445f42c145e6e519c33104f196c463e910d574bd48f32","cross_cats_sorted":[],"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.CL","submitted_at":"2026-05-31T22:39:45Z","title_canon_sha256":"e2d6abf27b3667b00a9fff85d6001fa722630ddfba9a446a156c4d3ec23fc063"},"schema_version":"1.0","source":{"id":"2606.01479","kind":"arxiv","version":1}},"canonical_sha256":"c70d6d26cd95a7b5cfa01cff12491cb94f9b8dee50f8710d05c5f8fe9d63ebf8","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"c70d6d26cd95a7b5cfa01cff12491cb94f9b8dee50f8710d05c5f8fe9d63ebf8","first_computed_at":"2026-06-02T02:04:34.450679Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-02T02:04:34.450679Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"24nKHURU5138wOuxNcjS4X15kn3c6MwA6dyyryjM2K4iJqYhJb1drmgoaoeX1up0vXXp6znFg1m0yWefQ+/YAg==","signature_status":"signed_v1","signed_at":"2026-06-02T02:04:34.451093Z","signed_message":"canonical_sha256_bytes"},"source_id":"2606.01479","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:7ab76fab472322c3d6dc71d5bc2ee64a63e4bcaceec73dae3df6738bacb50d0d","sha256:7ca616772cb1974f693de7e23a41ba06fa8bb9196b2fbcdff2edecfc71180555"],"state_sha256":"cfcaf86f4d36fc5958797356a0fffe7b5a834c6454e36243d998a7bd5a40f9e3"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"tSHJMiJU5nvXL94t02IaF6wVIeFD1FOXexiqvZwkAQlUaNoukCG/CfPpRpbLYttX6oQF53e+XDYo83yzB89IDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-06-02T13:14:06.226614Z","bundle_sha256":"6f727cd25221573d893ff8c571466f366b6774925f6e9c9744b096bcfe43ed86"}}