[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"branding":3,"analytics":7,"article-openai-releases-open-weight-models-tuned-for-policy-based-labeling":10},{"siteName":4,"siteTagline":5,"publisherName":4,"contactEmail":6},"The Revision","Tech news, decoded.","editor@therevision.news",{"gaMeasurementId":8,"adsenseClientId":9},"G-ZW2MV82GYR","ca-pub-8533917693782264",{"article":11},{"id":12,"slug":13,"title":14,"dek":15,"body_md":16,"tags_json":17,"published_at":18,"created_at":19,"updated_at":20,"status":21,"review_note":22,"review_notes":23,"image_url":22,"persona_id":22,"persona_name":22,"section":22,"tags":38,"sources":42,"feedback":46,"feedback_at":22,"cost_usd":46,"total_tokens":46},1102,"openai-releases-open-weight-models-tuned-for-policy-based-labeling","OpenAI releases open-weight models tuned for policy-based labeling","OpenAI unveiled two open-weight models, gpt-oss-safeguard-120b and -20b, designed to apply a given policy when tagging content.","- OpenAI announced two new open-weight reasoning models, gpt-oss-safeguard-120b and gpt-oss-safeguard-20b, that are fine‑tuned to follow a supplied policy for content labeling.\n\nThe models are built on the earlier gpt-oss series and undergo an extra post‑training stage that teaches them to reason from a policy description. The technical report compares these safeguards against the base gpt-oss models using OpenAI’s standard safety benchmarks. It notes modest gains in policy adherence but also highlights remaining gaps in edge cases.\n\nFor researchers, the release offers a rare glimpse into how large language models can be steered by explicit rules without a closed‑source black box. \nThe open weights mean anyone can test, tweak, or benchmark the approach, potentially accelerating work on controllable AI.\n\nThe announcement signals OpenAI’s move toward more transparent safety tooling, though practical impact will depend on how quickly the community can build on the baseline results.","[\"openai\",\"language-models\",\"ai-safety\"]","2025-10-29T00:00:00.000Z","2026-06-16T10:03:34.076Z","2026-06-16T10:03:36.878Z","published",null,[24,30,34],{"id":25,"reviewer":26,"round":27,"reason":28,"status":29},"editor-r1","editor",1,"Add a concise concluding paragraph summarizing the news and its implications to give the article a clear ending.","resolved",{"id":31,"reviewer":26,"round":32,"reason":33,"status":29},"editor-r2",2,"Add a concise concluding paragraph that summarizes the news and its implications to give the article a clear ending.",{"id":35,"reviewer":26,"round":36,"reason":37,"status":29},"editor-r3",3,"Add a concise concluding paragraph that summarizes the announcement and its implications for the research community.",[39,40,41],"openai","language-models","ai-safety",[43],{"name":44,"url":45},"OpenAI","https:\u002F\u002Fopenai.com\u002Findex\u002Fgpt-oss-safeguard-technical-report",0]