{"state_type":"pith_open_graph_state","state_version":"1.0","pith_number":"pith:2025:JYYPWID2MWKFIELS225R7LV3SN","merge_version":"pith-open-graph-merge-v1","event_count":2,"valid_event_count":2,"invalid_event_count":0,"equivocation_count":0,"current":{"canonical_record":{"metadata":{"abstract_canon_sha256":"af10d4298fdfe9fb503c8170ec6a1cbbf2ae97db8c4accd3460c049a4d5b8465","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2025-02-19T13:28:20Z","title_canon_sha256":"0ddf3e411228dd802c98f669104577bb5a728e6ae6cd522243991ea4dddab108"},"schema_version":"1.0","source":{"id":"2502.13713","kind":"arxiv","version":5}},"source_aliases":[{"alias_kind":"arxiv","alias_value":"2502.13713","created_at":"2026-06-03T01:05:43Z"},{"alias_kind":"arxiv_version","alias_value":"2502.13713v5","created_at":"2026-06-03T01:05:43Z"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2502.13713","created_at":"2026-06-03T01:05:43Z"},{"alias_kind":"pith_short_12","alias_value":"JYYPWID2MWKF","created_at":"2026-06-03T01:05:43Z"},{"alias_kind":"pith_short_16","alias_value":"JYYPWID2MWKFIELS","created_at":"2026-06-03T01:05:43Z"},{"alias_kind":"pith_short_8","alias_value":"JYYPWID2","created_at":"2026-06-03T01:05:43Z"}],"graph_snapshots":[{"event_id":"sha256:2feb3b013eb6d369f768d15858095790f7e1b88aa0114b7c27ee9aafbbc433c2","target":"graph","created_at":"2026-06-03T01:05:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"graph_snapshot":{"author_claims":{"count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","strong_count":0},"builder_version":"pith-number-builder-2026-05-17-v1","claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"integrity":{"available":true,"clean":true,"detectors_run":[],"endpoint":"/pith/2502.13713/integrity.json","findings":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938","summary":{"advisory":0,"by_detector":{},"critical":0,"informational":0}},"paper":{"abstract_excerpt":"We present TALKPLAY, a novel multimodal music recommendation system that reformulates recommendation as a token generation problem using large language models (LLMs). By leveraging the instruction-following and natural language generation capabilities of LLMs, our system effectively recommends music from diverse user queries while generating contextually relevant responses. While pretrained LLMs are primarily designed for text modality, TALKPLAY extends their scope through two key innovations: a multimodal music tokenizer that encodes audio features, lyrics, metadata, semantic tags, and playli","authors_text":"Juhan Nam, Keunwoo Choi, Seungheon Doh","cross_cats":["cs.SD","eess.AS"],"headline":"","license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2025-02-19T13:28:20Z","title":"TALKPLAY: Multimodal Music Recommendation with Large Language Models"},"references":{"count":0,"internal_anchors":0,"resolved_work":0,"sample":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2502.13713","kind":"arxiv","version":5},"verdict":{"created_at":null,"id":null,"model_set":{},"one_line_summary":"","pipeline_version":null,"pith_extraction_headline":"","strongest_claim":"","weakest_assumption":""}},"verdict_id":null}}],"author_attestations":[],"timestamp_anchors":[],"storage_attestations":[],"citation_signatures":[],"replication_records":[],"corrections":[],"mirror_hints":[],"record_created":{"event_id":"sha256:3a5a6a0ca51537f007316536829386880c8ab6735bb154986c23f909c5340503","target":"record","created_at":"2026-06-03T01:05:43Z","signer":{"key_id":"pith-v1-2026-05","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","signer_id":"pith.science","signer_type":"pith_registry"},"payload":{"attestation_state":"computed","canonical_record":{"metadata":{"abstract_canon_sha256":"af10d4298fdfe9fb503c8170ec6a1cbbf2ae97db8c4accd3460c049a4d5b8465","cross_cats_sorted":["cs.SD","eess.AS"],"license":"http://creativecommons.org/licenses/by-nc-sa/4.0/","primary_cat":"cs.IR","submitted_at":"2025-02-19T13:28:20Z","title_canon_sha256":"0ddf3e411228dd802c98f669104577bb5a728e6ae6cd522243991ea4dddab108"},"schema_version":"1.0","source":{"id":"2502.13713","kind":"arxiv","version":5}},"canonical_sha256":"4e30fb207a6594541172d6bb1faebb937d0611d10cb316dcb2fbd9d5cf22d0f4","receipt":{"algorithm":"ed25519","builder_version":"pith-number-builder-2026-05-17-v1","canonical_sha256":"4e30fb207a6594541172d6bb1faebb937d0611d10cb316dcb2fbd9d5cf22d0f4","first_computed_at":"2026-06-03T01:05:43.566413Z","key_id":"pith-v1-2026-05","kind":"pith_receipt","last_reissued_at":"2026-06-03T01:05:43.566413Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54","receipt_version":"0.3","signature_b64":"tRaFArQvPx0S+afzJxn0s9MxDb+DHy5XVbSaHeqQv/7c1DvGW0L/3VI9l7ITkH5sD2y+wHEsSTR9uEshOPboBA==","signature_status":"signed_v1","signed_at":"2026-06-03T01:05:43.566846Z","signed_message":"canonical_sha256_bytes"},"source_id":"2502.13713","source_kind":"arxiv","source_version":5}}},"equivocations":[],"invalid_events":[],"applied_event_ids":["sha256:3a5a6a0ca51537f007316536829386880c8ab6735bb154986c23f909c5340503","sha256:2feb3b013eb6d369f768d15858095790f7e1b88aa0114b7c27ee9aafbbc433c2"],"state_sha256":"41764be3b0f152c0d1b4a8a62174795b15b98331fa13cd5a1078c6ea1150f74b"}