{"schema_version":"onlylabs.public_signal.v1","title":"OpenAI Writing: Detecting misbehavior in frontier reasoning models","description":"OpenAI writing signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a","json_url":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a/signal.json","generated_at":"2026-06-08T15:45:48.912+00:00","org":{"slug":"openai","name":"OpenAI","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/openai","dossier_json_url":"https://onlylabs.fyi/labs/openai/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a","signal_json":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a/signal.json","source":"https://openai.com/index/chain-of-thought-monitoring","lab_dossier":"https://onlylabs.fyi/labs/openai","lab_dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis":"https://onlylabs.fyi/analysis/openai","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":"https://onlylabs.fyi/topics/talking","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","data_business":null},"answer_pack":{"answer":"OpenAI published Detecting misbehavior in frontier reasoning models. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: OpenAI safety research on frontier models · Detecting misbehavior in frontier reasoning models | OpenAI March 10, 2025 Detecting misbehavior in frontier reasoning models Frontier reasoning models exploit loopholes.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","signal_desk":"talking","source_context":{"source_url":"https://openai.com/index/chain-of-thought-monitoring","source_host":"openai.com","occurred_at":"2025-03-10T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","context":null},"context_markers":[{"label":"Lab","value":"OpenAI","source":"signal"},{"label":"Signal desk","value":"talking","source":"signal"},{"label":"Source host","value":"openai.com","source":"source"},{"label":"Notability","value":"OpenAI safety research on frontier models","source":"signal"},{"label":"Watch term","value":"RL environments","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/chain-of-thought-monitoring"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-08T15:45:48.912+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a/signal.json","dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","evidence_focus":["post title","source URL","captured page text","HN traction","linked model or paper references","publication date"],"extraction_questions":["Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which writing reframes a recent release, model, hiring wave, or policy stance?","Which posts mention data, evals, infrastructure, safety, or deployment workflows?"],"signal_questions":["What public theme, launch framing, or research direction does this writing signal expose?","Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Do the 6 related writing signals show a repeated pattern?"],"output_fields":["org","theme","public_framing","traction","data_business_lane","evidence_url"],"data_business_relevance":"Public writing supplies the narrative layer over raw signals and helps identify which frontier-lab priorities are becoming externally legible.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a/signal.json","required":true},{"label":"source","url":"https://openai.com/index/chain-of-thought-monitoring","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/openai/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/openai/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/talking/signals.json","required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze OpenAI's writing signal \"Detecting misbehavior in frontier reasoning models\" for frontier lab strategy."},"semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Detecting misbehavior in frontier reasoning models","text":"OpenAI published Detecting misbehavior in frontier reasoning models."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"is classified as","object":"writing signal","text":"Detecting misbehavior in frontier reasoning models is classified as writing signal."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"belongs to","object":"talking desk","text":"Detecting misbehavior in frontier reasoning models belongs to talking desk."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Detecting misbehavior in frontier reasoning models has evidence coverage 1 captured evidence page."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has captured page count","object":"1","text":"Detecting misbehavior in frontier reasoning models has captured page count 1."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has readable page count","object":"1","text":"Detecting misbehavior in frontier reasoning models has readable page count 1."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has related signal count","object":"6","text":"Detecting misbehavior in frontier reasoning models has related signal count 6."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has analysis playbook objective","object":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","text":"Detecting misbehavior in frontier reasoning models has analysis playbook objective Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has source host","object":"openai.com","text":"Detecting misbehavior in frontier reasoning models has source host openai.com."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has lab","object":"OpenAI","text":"Detecting misbehavior in frontier reasoning models has lab OpenAI."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has signal desk","object":"talking","text":"Detecting misbehavior in frontier reasoning models has signal desk talking."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has source host","object":"openai.com","text":"Detecting misbehavior in frontier reasoning models has source host openai.com."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has notability","object":"OpenAI safety research on frontier models","text":"Detecting misbehavior in frontier reasoning models has notability OpenAI safety research on frontier models."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has watch term","object":"RL environments","text":"Detecting misbehavior in frontier reasoning models has watch term RL environments."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has watch term","object":"Infrastructure","text":"Detecting misbehavior in frontier reasoning models has watch term Infrastructure."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has watch term","object":"Safety and alignment","text":"Detecting misbehavior in frontier reasoning models has watch term Safety and alignment."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has watch term","object":"Agents and tool use","text":"Detecting misbehavior in frontier reasoning models has watch term Agents and tool use."}]},"intelligence":{"signal_desk":"talking","answer":"OpenAI published Detecting misbehavior in frontier reasoning models. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: OpenAI safety research on frontier models · Detecting misbehavior in frontier reasoning models | OpenAI March 10, 2025 Detecting misbehavior in frontier reasoning models Frontier reasoning models exploit loopholes.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Detecting misbehavior in frontier reasoning models","text":"OpenAI published Detecting misbehavior in frontier reasoning models."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"is classified as","object":"writing signal","text":"Detecting misbehavior in frontier reasoning models is classified as writing signal."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"belongs to","object":"talking desk","text":"Detecting misbehavior in frontier reasoning models belongs to talking desk."},{"subject":"Detecting misbehavior in frontier reasoning models","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Detecting misbehavior in frontier reasoning models has evidence coverage 1 captured evidence page."}]},"signal":{"id":"9e7bef74-3ad8-4683-a99d-8ff219bae25a","url":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a","json_url":"https://onlylabs.fyi/signals/9e7bef74-3ad8-4683-a99d-8ff219bae25a/signal.json","source_url":"https://openai.com/index/chain-of-thought-monitoring","title":"Detecting misbehavior in frontier reasoning models","summary":"OpenAI published a writing signal. onlylabs watches public writing for research themes, product direction, and model-launch context.","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2025-03-10T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/chain-of-thought-monitoring"]},"facets":{},"traction":{"github_stars":null,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://openai.com/index/chain-of-thought-monitoring","final_url":"https://openai.com/index/chain-of-thought-monitoring","title":"Detecting misbehavior in frontier reasoning models","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:45:48.912+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Detecting misbehavior in frontier reasoning models | OpenAI March 10, 2025 Detecting misbehavior in frontier reasoning models Frontier reasoning models exploit loopholes when given the chance. We show we can detect exploits using an LLM to monitor their chains-of-thought. Penalizing their “bad thoughts” doesn’t stop the majority of misbehavior—it makes them hide their intent. Listen to article Share Chain-of-thought (CoT) reasoning models “think” in natural language understandable by humans. Monitoring their “thinking” has allowed us to detect misbehavior such as subverting tests in coding tasks, deceiving users, or giving up when a problem is too hard. We believe that CoT monitoring may be one of few tools we will have to oversee superhuman models of the future. We have further found that directly optimizing the CoT to adhere to specific criteria (e.g. to not think about reward hacking) may boost performance in the short run; however, it does not eliminate all misbehavior and can cause a model to hide its intent. We hope future research will find ways to directly optimize CoTs without this drawback, but until then We recommend against applying strong optimization pressure..."},"evidence_pages":[{"url":"https://openai.com/index/chain-of-thought-monitoring","final_url":"https://openai.com/index/chain-of-thought-monitoring","title":"Detecting misbehavior in frontier reasoning models","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:45:48.912+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Detecting misbehavior in frontier reasoning models | OpenAI March 10, 2025 Detecting misbehavior in frontier reasoning models Frontier reasoning models exploit loopholes when given the chance. We show we can detect exploits using an LLM to monitor their chains-of-thought. Penalizing their “bad thoughts” doesn’t stop the majority of misbehavior—it makes them hide their intent. Listen to article Share Chain-of-thought (CoT) reasoning models “think” in natural language understandable by humans. Monitoring their “thinking” has allowed us to detect misbehavior such as subverting tests in coding tasks, deceiving users, or giving up when a problem is too hard. We believe that CoT monitoring may be one of few tools we will have to oversee superhuman models of the future. We have further found that directly optimizing the CoT to adhere to specific criteria (e.g. to not think about reward hacking) may boost performance in the short run; however, it does not eliminate all misbehavior and can cause a model to hide its intent. We hope future research will find ways to directly optimize CoTs without this drawback, but until then We recommend against applying strong optimization pressure..."}],"related_signals":[{"id":"b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","url":"https://onlylabs.fyi/signals/b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","source_url":"https://openai.com/index/supporting-eu-trustworthy-ai-ecosystem","title":"Supporting Europe’s work in ensuring a trustworthy AI ecosystem ","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T08:00:56.140796+00:00","date_source":"rss.item_date"},{"id":"2638c0a7-b372-409c-ac72-f6d81d6464dc","url":"https://onlylabs.fyi/signals/2638c0a7-b372-409c-ac72-f6d81d6464dc","source_url":"https://openai.com/index/using-codex-to-simulate-black-holes","title":"How an astrophysicist uses Codex to help simulate black holes","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"509ea784-51ec-4ede-855b-5a4d1b27d3be","url":"https://onlylabs.fyi/signals/509ea784-51ec-4ede-855b-5a4d1b27d3be","source_url":"https://openai.com/index/openai-on-oracle-cloud","title":"Access OpenAI models and Codex through your Oracle cloud commitment","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T20:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4f051449-87f2-466e-941e-b5918381a8fe","url":"https://onlylabs.fyi/signals/4f051449-87f2-466e-941e-b5918381a8fe","source_url":"https://openai.com/index/prc-linked-influence-operations-ai-debates","title":"PRC-linked influence operations are targeting AI debates in the US","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T12:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","url":"https://onlylabs.fyi/signals/4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","source_url":"https://openai.com/index/lseg","title":"From data to decisions: how LSEG is scaling trusted AI","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T00:00:00+00:00","first_seen_at":"2026-06-10T09:18:54.26094+00:00","date_source":"rss.item_date"},{"id":"fb16aa7a-c4ef-4859-b514-0839c2f1330d","url":"https://onlylabs.fyi/signals/fb16aa7a-c4ef-4859-b514-0839c2f1330d","source_url":"https://openai.com/index/nextdoor","title":"How engineers at Nextdoor use Codex to build without limits","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-09T12:00:00+00:00","first_seen_at":"2026-06-10T07:01:28.700378+00:00","date_source":"rss.item_date"}]}