{"bundle_type":"pith_open_graph_bundle","bundle_version":"1.0","pith_number":"pith:2026:2YCCGMFATOWEQSTO3WGTZL76OW","short_pith_number":"pith:2YCCGMFA","canonical_record":{"source":{"id":"2605.19101","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-05-18T20:41:08Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"d2f2e869dc92de286a551168ed387533eb25a8faf9779ce8384f5eaa6413fea8","abstract_canon_sha256":"79d9153a9b0e8b5f00aefc628daf6f29878fe2746437d5d79f14336c38035998"},"schema_version":"1.0"},"canonical_sha256":"d6042330a09bac484a6edd8d3caffe75b1ed852529c5405ec73bde6fc858a950","source":{"kind":"arxiv","id":"2605.19101","version":1},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19101","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19101v1","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19101","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_12","alias_value":"2YCCGMFATOWE","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_16","alias_value":"2YCCGMFATOWEQSTO","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_8","alias_value":"2YCCGMFA","created_at":"2026-05-20T01:05:27Z"}],"events":[{"event_type":"record_created","subject_pith_number":"pith:2026:2YCCGMFATOWEQSTO3WGTZL76OW","target":"record","payload":{"canonical_record":{"source":{"id":"2605.19101","kind":"arxiv","version":1},"metadata":{"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-05-18T20:41:08Z","cross_cats_sorted":["cs.LG"],"title_canon_sha256":"d2f2e869dc92de286a551168ed387533eb25a8faf9779ce8384f5eaa6413fea8","abstract_canon_sha256":"79d9153a9b0e8b5f00aefc628daf6f29878fe2746437d5d79f14336c38035998"},"schema_version":"1.0"},"canonical_sha256":"d6042330a09bac484a6edd8d3caffe75b1ed852529c5405ec73bde6fc858a950","receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-20T01:05:27.185960Z","signature_b64":"zmpsnZGAVswbeUaQHF0m4OZQXJfIsfrk6xY9QOpxzWVqXCvrEUmyXlUpk68Sgcr5wQAXSDtuGiE4p4YpZNQYAg==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"d6042330a09bac484a6edd8d3caffe75b1ed852529c5405ec73bde6fc858a950","last_reissued_at":"2026-05-20T01:05:27.185203Z","signature_status":"signed_v1","first_computed_at":"2026-05-20T01:05:27.185203Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"source_kind":"arxiv","source_id":"2605.19101","source_version":1,"attestation_state":"computed"},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"RqmhCuSQ7XfrueVF8/IcJOggTjJtN81NyXNhRHqp8ohmm7bQoWDkwhmuJBvZ6fhhIBrsEgg4ueAD3FRzpXXXDA==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T16:14:21.374583Z"},"content_sha256":"1e79ae0ef3a1e711e07b6cd720e2eded37a5446cc42ba9c5efb7f0fe9f7e8910","schema_version":"1.0","event_id":"sha256:1e79ae0ef3a1e711e07b6cd720e2eded37a5446cc42ba9c5efb7f0fe9f7e8910"},{"event_type":"graph_snapshot","subject_pith_number":"pith:2026:2YCCGMFATOWEQSTO3WGTZL76OW","target":"graph","payload":{"graph_snapshot":{"paper":{"title":"Heterogeneity-Aware Dataset Scheduling for Efficient Audio Large Language Model Training","license":"http://creativecommons.org/licenses/by/4.0/","headline":"","cross_cats":["cs.LG"],"primary_cat":"cs.SD","authors_text":"Chongxin Gan, Jianning Wang, Yang Li, Yanru Wu","submitted_at":"2026-05-18T20:41:08Z","abstract_excerpt":"Training general-purpose Audio Large Language Models (ALLMs) across diverse datasets is essential for holistic audio understanding, yet it faces significant challenges due to dataset heterogeneity, which often leads to conflicting gradients and slow convergence. Despite its impact, how to explicitly manage this heterogeneity during training remains underexplored, with current practices relying primarily on uniform mixture. In this work, we analyze multi-dataset AudioQA training from a convergence perspective and propose Grouped Sequential Training (GST). GST strategically organizes datasets in"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19101","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.19101/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"verdict_id":null},"signer":{"signer_id":"pith.science","signer_type":"pith_registry","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"created_at":"2026-05-20T01:05:27Z","supersedes":[],"prev_event":null,"signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"YL01LhC+zo3iRhuxe+/x5MLSS7XH2fd9HN41iRq+1dHBi0LwYU+o95joQRe8JkFx0VqJe8iiIuD/AMMOyvFOCw==","signed_message":"open_graph_event_sha256_bytes","signed_at":"2026-05-21T16:14:21.374961Z"},"content_sha256":"307a08194ed413612fce038a59dcd342624847922f6848222eeafc488ba798ae","schema_version":"1.0","event_id":"sha256:307a08194ed413612fce038a59dcd342624847922f6848222eeafc488ba798ae"}],"timestamp_proofs":[],"mirror_hints":[{"mirror_type":"https","name":"Pith Resolver","base_url":"https://pith.science","bundle_url":"https://pith.science/pith/2YCCGMFATOWEQSTO3WGTZL76OW/bundle.json","state_url":"https://pith.science/pith/2YCCGMFATOWEQSTO3WGTZL76OW/state.json","well_known_bundle_url":"https://pith.science/.well-known/pith/2YCCGMFATOWEQSTO3WGTZL76OW/bundle.json","status":"primary"}],"public_keys":[{"key_id":"pith-v1-2026-05","algorithm":"ed25519","format":"raw","public_key_b64":"stVStoiQhXFxp4s2pdzPNoqVNBMojDU/fJ2db5S3CbM=","public_key_hex":"b2d552b68890857171a78b36a5dccf368a953413288c353f7c9d9d6f94b709b3","fingerprint_sha256_b32_first128bits":"RVFV5Z2OI2J3ZUO7ERDEBCYNKS","fingerprint_sha256_hex":"8d4b5ee74e4693bcd1df2446408b0d54","rotates_at":null,"url":"https://pith.science/pith-signing-key.json","notes":"Pith uses this Ed25519 key to sign canonical record SHA-256 digests. Verify with: ed25519_verify(public_key, message=canonical_sha256_bytes, signature=base64decode(signature_b64))."}],"merge_version":"pith-open-graph-merge-v1","built_at":"2026-05-21T16:14:21Z","links":{"resolver":"https://pith.science/pith/2YCCGMFATOWEQSTO3WGTZL76OW","bundle":"https://pith.science/pith/2YCCGMFATOWEQSTO3WGTZL76OW/bundle.json","state":"https://pith.science/pith/2YCCGMFATOWEQSTO3WGTZL76OW/state.json","well_known_bundle":"https://pith.science/.well-known/pith/2YCCGMFATOWEQSTO3WGTZL76OW/bundle.json"},"state":{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2026:2YCCGMFATOWEQSTO3WGTZL76OW","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"79d9153a9b0e8b5f00aefc628daf6f29878fe2746437d5d79f14336c38035998","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-05-18T20:41:08Z","title_canon_sha256":"d2f2e869dc92de286a551168ed387533eb25a8faf9779ce8384f5eaa6413fea8"},"schema_version":"1.0","source":{"id":"2605.19101","kind":"arxiv","version":1}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2605.19101","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"arxiv_version","alias_value":"2605.19101v1","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.19101","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_12","alias_value":"2YCCGMFATOWE","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_16","alias_value":"2YCCGMFATOWEQSTO","created_at":"2026-05-20T01:05:27Z"},{"alias_kind":"pith_short_8","alias_value":"2YCCGMFA","created_at":"2026-05-20T01:05:27Z"}],"graph_snapshots":[{"event_id":"sha256:307a08194ed413612fce038a59dcd342624847922f6848222eeafc488ba798ae","target":"graph","created_at":"2026-05-20T01:05:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2605.19101/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"Training general-purpose Audio Large Language Models (ALLMs) across diverse datasets is essential for holistic audio understanding, yet it faces significant challenges due to dataset heterogeneity, which often leads to conflicting gradients and slow convergence. Despite its impact, how to explicitly manage this heterogeneity during training remains underexplored, with current practices relying primarily on uniform mixture. In this work, we analyze multi-dataset AudioQA training from a convergence perspective and propose Grouped Sequential Training (GST). GST strategically organizes datasets in","authors_text":"Chongxin Gan, Jianning Wang, Yang Li, Yanru Wu","cross_cats":["cs.LG"],"headline":"","license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-05-18T20:41:08Z","title":"Heterogeneity-Aware Dataset Scheduling for Efficient Audio Large Language Model Training"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.19101","kind":"arxiv","version":1},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:1e79ae0ef3a1e711e07b6cd720e2eded37a5446cc42ba9c5efb7f0fe9f7e8910","target":"record","created_at":"2026-05-20T01:05:27Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"79d9153a9b0e8b5f00aefc628daf6f29878fe2746437d5d79f14336c38035998","cross_cats_sorted":["cs.LG"],"license":"http://creativecommons.org/licenses/by/4.0/","primary_cat":"cs.SD","submitted_at":"2026-05-18T20:41:08Z","title_canon_sha256":"d2f2e869dc92de286a551168ed387533eb25a8faf9779ce8384f5eaa6413fea8"},"schema_version":"1.0","source":{"id":"2605.19101","kind":"arxiv","version":1}},"canonical_sha256":"d6042330a09bac484a6edd8d3caffe75b1ed852529c5405ec73bde6fc858a950","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"d6042330a09bac484a6edd8d3caffe75b1ed852529c5405ec73bde6fc858a950","first_computed_at":"2026-05-20T01:05:27.185203Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-05-20T01:05:27.185203Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"zmpsnZGAVswbeUaQHF0m4OZQXJfIsfrk6xY9QOpxzWVqXCvrEUmyXlUpk68Sgcr5wQAXSDtuGiE4p4YpZNQYAg==","signature_status":"signed_v1","signed_at":"2026-05-20T01:05:27.185960Z","signed_message":"canonical_sha256_bytes"},"source_id":"2605.19101","source_kind":"arxiv","source_version":1}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:1e79ae0ef3a1e711e07b6cd720e2eded37a5446cc42ba9c5efb7f0fe9f7e8910","sha256:307a08194ed413612fce038a59dcd342624847922f6848222eeafc488ba798ae"],"state_sha256":"c76a5082f77deb241008a326a60ade6a675ad5eaf74e999c3069498ce7bc3260"},"bundle_signature":{"signature_status":"signed_v1","algorithm":"ed25519","key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signature_b64":"+a1JRPdO9QHNK4V27aUiC1s29kqWEB2FS/dNabI1oMot4QdrPfEMgIi5vtYvYAPpApj1SDYD6DgdNlF9ToFCDQ==","signed_message":"bundle_sha256_bytes","signed_at":"2026-05-21T16:14:21.378015Z","bundle_sha256":"a62005d199c2c7fbac60072517cdcbe672db6bb6b27a8a165ca7ea4dab41cf37"}}