{"record_type":"pith_number_record","schema_url":"https://pith.science/schemas/pith-number/v1.json","pith_number":"pith:2026:H4IELT26RZSIVSDPZZL3ZEVLQH","short_pith_number":"pith:H4IELT26","schema_version":"1.0","canonical_sha256":"3f1045cf5e8e648ac86fce57bc92ab81cfede55745571ff7fd565beacb5de59d","source":{"kind":"arxiv","id":"2605.21967","version":1},"attestation_state":"computed","paper":{"title":"Reinforced Preference Optimization for Reasoning-Augmented Recommendations","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Chi Lu, Derong Xu, Jingtong Gao, Kun Gai, Maolin Wang, Peng Jiang, Qingpeng Cai, Xiangyu Zhao, Xiaopeng Li, Zeyu Song","submitted_at":"2026-05-21T03:56:42Z","abstract_excerpt":"Recommender systems are critical for delivering personalized content across digital platforms, and recent advances in Large Language Models (LLMs) offer new opportunities to enhance them with richer world knowledge and explicit reasoning capabilities. With the help of reasoning knowledge, recommendations can better infer users' underlying intents, adapt to evolving preferences, and leverage semantic relationships for improved accuracy and interpretability. However, existing reasoning-based recommendation methods often fail to fully align the LLM's reasoning process with recommendation-specific"},"verification_status":{"content_addressed":true,"pith_receipt":true,"author_attested":false,"weak_author_claims":0,"strong_author_claims":0,"externally_anchored":false,"storage_verified":false,"citation_signatures":0,"replication_records":0,"graph_snapshot":true,"references_resolved":false,"formal_links_present":false},"canonical_record":{"source":{"id":"2605.21967","kind":"arxiv","version":1},"metadata":{"license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","primary_cat":"cs.IR","submitted_at":"2026-05-21T03:56:42Z","cross_cats_sorted":[],"title_canon_sha256":"cd9d34e396ce55c0cc5765741ec66f439fefc4f3d7539986910249e5242b9e64","abstract_canon_sha256":"c8fcd440f7f3227ae4bde0375425cc79bcc8b8466890fa2c48b267ee5b89238a"},"schema_version":"1.0"},"receipt":{"kind":"pith_receipt","key_id":"pith-v1-2026-05","algorithm":"ed25519","signed_at":"2026-05-22T01:04:17.623101Z","signature_b64":"64ltYamKjpKWsBL3Mm/g0Z1mDboT1n5hYPrp3HaSAluLtNq42hpCIASuMEvGbgVNcw/gzu8hwepxAboDMDpxAw==","signed_message":"canonical_sha256_bytes","builder_version":"pith-number-builder-2026-05-17-v1","receipt_version":"0.3","canonical_sha256":"3f1045cf5e8e648ac86fce57bc92ab81cfede55745571ff7fd565beacb5de59d","last_reissued_at":"2026-05-22T01:04:17.622280Z","signature_status":"signed_v1","first_computed_at":"2026-05-22T01:04:17.622280Z","public_key_fingerprint":"8d4b5ee74e4693bcd1df2446408b0d54"},"graph_snapshot":{"paper":{"title":"Reinforced Preference Optimization for Reasoning-Augmented Recommendations","license":"http://arxiv.org/licenses/nonexclusive-distrib/1.0/","headline":"","cross_cats":[],"primary_cat":"cs.IR","authors_text":"Chi Lu, Derong Xu, Jingtong Gao, Kun Gai, Maolin Wang, Peng Jiang, Qingpeng Cai, Xiangyu Zhao, Xiaopeng Li, Zeyu Song","submitted_at":"2026-05-21T03:56:42Z","abstract_excerpt":"Recommender systems are critical for delivering personalized content across digital platforms, and recent advances in Large Language Models (LLMs) offer new opportunities to enhance them with richer world knowledge and explicit reasoning capabilities. With the help of reasoning knowledge, recommendations can better infer users' underlying intents, adapt to evolving preferences, and leverage semantic relationships for improved accuracy and interpretability. However, existing reasoning-based recommendation methods often fail to fully align the LLM's reasoning process with recommendation-specific"},"claims":{"count":0,"items":[],"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"source":{"id":"2605.21967","kind":"arxiv","version":1},"verdict":{"id":null,"model_set":{},"created_at":null,"strongest_claim":"","one_line_summary":"","pipeline_version":null,"weakest_assumption":"","pith_extraction_headline":""},"integrity":{"clean":true,"summary":{"advisory":0,"critical":0,"by_detector":{},"informational":0},"endpoint":"/pith/2605.21967/integrity.json","findings":[],"available":true,"detectors_run":[],"snapshot_sha256":"c28c3603d3b5d939e8dc4c7e95fa8dfce3d595e45f758748cecf8e644a296938"},"references":{"count":0,"sample":[],"resolved_work":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57","internal_anchors":0},"formal_canon":{"evidence_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"author_claims":{"count":0,"strong_count":0,"snapshot_sha256":"258153158e38e3291e3d48162225fcdb2d5a3ed65a07baac614ab91432fd4f57"},"builder_version":"pith-number-builder-2026-05-17-v1"},"aliases":[{"alias_kind":"arxiv","alias_value":"2605.21967","created_at":"2026-05-22T01:04:17.622421+00:00"},{"alias_kind":"arxiv_version","alias_value":"2605.21967v1","created_at":"2026-05-22T01:04:17.622421+00:00"},{"alias_kind":"doi","alias_value":"10.48550/arxiv.2605.21967","created_at":"2026-05-22T01:04:17.622421+00:00"},{"alias_kind":"pith_short_12","alias_value":"H4IELT26RZSI","created_at":"2026-05-22T01:04:17.622421+00:00"},{"alias_kind":"pith_short_16","alias_value":"H4IELT26RZSIVSDP","created_at":"2026-05-22T01:04:17.622421+00:00"},{"alias_kind":"pith_short_8","alias_value":"H4IELT26","created_at":"2026-05-22T01:04:17.622421+00:00"}],"events":[],"event_summary":{},"paper_claims":[],"inbound_citations":{"count":0,"internal_anchor_count":0,"sample":[]},"formal_canon":{"evidence_count":0,"sample":[],"anchors":[]},"links":{"html":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH","json":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH.json","graph_json":"https://pith.science/api/pith-number/H4IELT26RZSIVSDPZZL3ZEVLQH/graph.json","events_json":"https://pith.science/api/pith-number/H4IELT26RZSIVSDPZZL3ZEVLQH/events.json","paper":"https://pith.science/paper/H4IELT26"},"agent_actions":{"view_html":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH","download_json":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH.json","view_paper":"https://pith.science/paper/H4IELT26","resolve_alias":"https://pith.science/api/pith-number/resolve?arxiv=2605.21967&json=true","fetch_graph":"https://pith.science/api/pith-number/H4IELT26RZSIVSDPZZL3ZEVLQH/graph.json","fetch_events":"https://pith.science/api/pith-number/H4IELT26RZSIVSDPZZL3ZEVLQH/events.json","actions":{"anchor_timestamp":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH/action/timestamp_anchor","attest_storage":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH/action/storage_attestation","attest_author":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH/action/author_attestation","sign_citation":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH/action/citation_signature","submit_replication":"https://pith.science/pith/H4IELT26RZSIVSDPZZL3ZEVLQH/action/replication_record"}},"created_at":"2026-05-22T01:04:17.622421+00:00","updated_at":"2026-05-22T01:04:17.622421+00:00"}