{"work":{"id":"7ffab50f-285e-4804-b3fe-167071264d7d","openalex_id":null,"doi":null,"arxiv_id":"2511.18397","raw_key":null,"title":"Natural Emergent Misalignment from Reward Hacking in Production RL , 2025","authors":null,"authors_text":"Monte MacDiarmid, Benjamin Wright, Jonathan Uesato, Joe Benton, Jon Kutasov, Sara Price, Naia Bouscal, Sam Bowman, Trenton Bricken, Alex Cloud, Carson Denison, Johannes Gasteiger, Ryan Greenblatt, Jan Leike, Jack Lindsey, Vlad Mikulik, Etha","year":2025,"venue":null,"abstract":null,"external_url":"https://arxiv.org/abs/2511.18397","cited_by_count":null,"metadata_source":"arxiv_reference","metadata_fetched_at":"2026-05-25T04:50:20.768555+00:00","pith_arxiv_id":null,"created_at":"2026-05-09T06:25:39.792955+00:00","updated_at":"2026-06-05T21:23:00.469572+00:00","title_quality_ok":true,"display_title":"Natural Emergent Misalignment from Reward Hacking in Production RL","render_title":"Natural Emergent Misalignment from Reward Hacking in Production RL"},"hub":{"state":{"work_id":"7ffab50f-285e-4804-b3fe-167071264d7d","tier":"hub","tier_reason":"10+ Pith inbound or 1,000+ external citations","pith_inbound_count":19,"external_cited_by_count":null,"distinct_field_count":6,"first_pith_cited_at":"2026-04-07T17:43:18+00:00","last_pith_cited_at":"2026-05-22T12:31:18+00:00","author_build_status":"not_needed","summary_status":"needed","contexts_status":"needed","graph_status":"needed","ask_index_status":"not_needed","reader_status":"not_needed","recognition_status":"not_needed","updated_at":"2026-06-07T08:41:27.473584+00:00","tier_text":"hub"},"tier":"hub","role_counts":[{"context_role":"background","n":3},{"context_role":"other","n":2}],"polarity_counts":[{"context_polarity":"background","n":3},{"context_polarity":"unclear","n":2}],"runs":{},"summary":{},"graph":{},"authors":[]}}