{"work":{"id":"75e19688-9dee-43d2-b058-3cd127182dbd","openalex_id":null,"doi":null,"arxiv_id":"2402.01391","raw_key":null,"title":"Stepcoder: Improve code generation with reinforcement learning from compiler feedback.arXiv preprint arXiv:2402.01391,","authors":null,"authors_text":"Shihan Dou, Yan Liu, Haoxiang Jia, Limao Xiong, Enyu Zhou, Wei Shen, Junjie Shan, Caishuang Huang, Xiao Wang, Xiaoran Fan, Zhiheng Xi, Yuhao Zhou, Tao Ji, Rui Zheng, Qi Zhang, Xuanjing Huang, and Tao Gui","year":2024,"venue":null,"abstract":null,"external_url":"https://arxiv.org/abs/2402.01391","cited_by_count":null,"metadata_source":"arxiv_reference","metadata_fetched_at":"2026-05-23T22:18:31.312659+00:00","pith_arxiv_id":null,"created_at":"2026-05-10T00:19:46.688552+00:00","updated_at":"2026-05-23T22:18:31.312659+00:00","title_quality_ok":true,"display_title":"Stepcoder: Improve code generation with reinforcement learning from compiler feedback","render_title":"Stepcoder: Improve code generation with reinforcement learning from compiler feedback"},"hub":{"state":{"work_id":"75e19688-9dee-43d2-b058-3cd127182dbd","tier":"hub","tier_reason":"10+ Pith inbound or 1,000+ external citations","pith_inbound_count":12,"external_cited_by_count":null,"distinct_field_count":5,"first_pith_cited_at":"2024-06-01T17:48:15+00:00","last_pith_cited_at":"2026-05-16T22:18:04+00:00","author_build_status":"not_needed","summary_status":"needed","contexts_status":"needed","graph_status":"needed","ask_index_status":"not_needed","reader_status":"not_needed","recognition_status":"not_needed","updated_at":"2026-05-31T02:31:54.198470+00:00","tier_text":"hub"},"tier":"hub","role_counts":[{"context_role":"background","n":7}],"polarity_counts":[{"context_polarity":"background","n":6},{"context_polarity":"unclear","n":1}],"runs":{},"summary":{},"graph":{},"authors":[]}}