{"schema_version":"onlylabs.public_signal.v1","title":"OpenAI Writing: Finding GPT-4’s mistakes with GPT-4","description":"OpenAI writing signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457","json_url":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457/signal.json","generated_at":"2026-06-08T15:46:01.326+00:00","org":{"slug":"openai","name":"OpenAI","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/openai","dossier_json_url":"https://onlylabs.fyi/labs/openai/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457","signal_json":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457/signal.json","source":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","lab_dossier":"https://onlylabs.fyi/labs/openai","lab_dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis":"https://onlylabs.fyi/analysis/openai","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":"https://onlylabs.fyi/topics/talking","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","data_business":null},"answer_pack":{"answer":"OpenAI published Finding GPT-4’s mistakes with GPT-4. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Finding GPT-4’s mistakes with GPT-4 | OpenAI June 27, 2024 Publication Finding GPT‑4’s mistakes with GPT‑4 CriticGPT, a model based on GPT‑4, writes critiques of ChatGPT.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","signal_desk":"talking","source_context":{"source_url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","source_host":"openai.com","occurred_at":"2024-06-27T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","context":null},"context_markers":[{"label":"Lab","value":"OpenAI","source":"signal"},{"label":"Signal desk","value":"talking","source":"signal"},{"label":"Source host","value":"openai.com","source":"source"},{"label":"Watch term","value":"RL environments","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-08T15:46:01.326+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457/signal.json","dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","evidence_focus":["post title","source URL","captured page text","HN traction","linked model or paper references","publication date"],"extraction_questions":["Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which writing reframes a recent release, model, hiring wave, or policy stance?","Which posts mention data, evals, infrastructure, safety, or deployment workflows?"],"signal_questions":["What public theme, launch framing, or research direction does this writing signal expose?","Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Do the 6 related writing signals show a repeated pattern?"],"output_fields":["org","theme","public_framing","traction","data_business_lane","evidence_url"],"data_business_relevance":"Public writing supplies the narrative layer over raw signals and helps identify which frontier-lab priorities are becoming externally legible.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457/signal.json","required":true},{"label":"source","url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/openai/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/openai/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/talking/signals.json","required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze OpenAI's writing signal \"Finding GPT-4’s mistakes with GPT-4\" for frontier lab strategy."},"semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Finding GPT-4’s mistakes with GPT-4","text":"OpenAI published Finding GPT-4’s mistakes with GPT-4."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"is classified as","object":"writing signal","text":"Finding GPT-4’s mistakes with GPT-4 is classified as writing signal."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"belongs to","object":"talking desk","text":"Finding GPT-4’s mistakes with GPT-4 belongs to talking desk."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Finding GPT-4’s mistakes with GPT-4 has evidence coverage 1 captured evidence page."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has captured page count","object":"1","text":"Finding GPT-4’s mistakes with GPT-4 has captured page count 1."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has readable page count","object":"1","text":"Finding GPT-4’s mistakes with GPT-4 has readable page count 1."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has related signal count","object":"6","text":"Finding GPT-4’s mistakes with GPT-4 has related signal count 6."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has analysis playbook objective","object":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","text":"Finding GPT-4’s mistakes with GPT-4 has analysis playbook objective Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has source host","object":"openai.com","text":"Finding GPT-4’s mistakes with GPT-4 has source host openai.com."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has lab","object":"OpenAI","text":"Finding GPT-4’s mistakes with GPT-4 has lab OpenAI."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has signal desk","object":"talking","text":"Finding GPT-4’s mistakes with GPT-4 has signal desk talking."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has source host","object":"openai.com","text":"Finding GPT-4’s mistakes with GPT-4 has source host openai.com."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has watch term","object":"RL environments","text":"Finding GPT-4’s mistakes with GPT-4 has watch term RL environments."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has watch term","object":"Data pipeline","text":"Finding GPT-4’s mistakes with GPT-4 has watch term Data pipeline."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has watch term","object":"Safety and alignment","text":"Finding GPT-4’s mistakes with GPT-4 has watch term Safety and alignment."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has watch term","object":"Agents and tool use","text":"Finding GPT-4’s mistakes with GPT-4 has watch term Agents and tool use."}]},"intelligence":{"signal_desk":"talking","answer":"OpenAI published Finding GPT-4’s mistakes with GPT-4. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Finding GPT-4’s mistakes with GPT-4 | OpenAI June 27, 2024 Publication Finding GPT‑4’s mistakes with GPT‑4 CriticGPT, a model based on GPT‑4, writes critiques of ChatGPT.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Finding GPT-4’s mistakes with GPT-4","text":"OpenAI published Finding GPT-4’s mistakes with GPT-4."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"is classified as","object":"writing signal","text":"Finding GPT-4’s mistakes with GPT-4 is classified as writing signal."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"belongs to","object":"talking desk","text":"Finding GPT-4’s mistakes with GPT-4 belongs to talking desk."},{"subject":"Finding GPT-4’s mistakes with GPT-4","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Finding GPT-4’s mistakes with GPT-4 has evidence coverage 1 captured evidence page."}]},"signal":{"id":"e4a9a82d-04a2-4c65-b72d-75c8cbe87457","url":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457","json_url":"https://onlylabs.fyi/signals/e4a9a82d-04a2-4c65-b72d-75c8cbe87457/signal.json","source_url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","title":"Finding GPT-4’s mistakes with GPT-4","summary":"OpenAI published a writing signal. onlylabs watches public writing for research themes, product direction, and model-launch context.","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2024-06-27T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4"]},"facets":{},"traction":{"github_stars":null,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","final_url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","title":"Finding GPT-4’s mistakes with GPT-4","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:46:01.326+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Finding GPT-4’s mistakes with GPT-4 | OpenAI June 27, 2024 Publication Finding GPT‑4’s mistakes with GPT‑4 CriticGPT, a model based on GPT‑4, writes critiques of ChatGPT responses to help human trainers spot mistakes during RLHF Read paper Loading… Share We've trained a model, based on GPT‑4, called CriticGPT to catch errors in ChatGPT's code output. We found that when people get help from CriticGPT to review ChatGPT code they outperform those without help 60% of the time. We are beginning the work to integrate CriticGPT‑like models into our RLHF labeling pipeline, providing our trainers with explicit AI assistance. This is a step towards being able to evaluate outputs from advanced AI systems that can be difficult for people to rate without better tools. The GPT‑4 series of models, which powers ChatGPT, is aligned to be helpful and interactive through “Reinforcement Learning from Human Feedback”(RLHF⁠). A key part of RLHF is collecting comparisons in which people, called AI trainers, rate different ChatGPT responses against each other. As we make advances in reasoning and model behavior, ChatGPT becomes more accurate and its mistakes become more subtle. This can make it hard for..."},"evidence_pages":[{"url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","final_url":"https://openai.com/index/finding-gpt4s-mistakes-with-gpt-4","title":"Finding GPT-4’s mistakes with GPT-4","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:46:01.326+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Finding GPT-4’s mistakes with GPT-4 | OpenAI June 27, 2024 Publication Finding GPT‑4’s mistakes with GPT‑4 CriticGPT, a model based on GPT‑4, writes critiques of ChatGPT responses to help human trainers spot mistakes during RLHF Read paper Loading… Share We've trained a model, based on GPT‑4, called CriticGPT to catch errors in ChatGPT's code output. We found that when people get help from CriticGPT to review ChatGPT code they outperform those without help 60% of the time. We are beginning the work to integrate CriticGPT‑like models into our RLHF labeling pipeline, providing our trainers with explicit AI assistance. This is a step towards being able to evaluate outputs from advanced AI systems that can be difficult for people to rate without better tools. The GPT‑4 series of models, which powers ChatGPT, is aligned to be helpful and interactive through “Reinforcement Learning from Human Feedback”(RLHF⁠). A key part of RLHF is collecting comparisons in which people, called AI trainers, rate different ChatGPT responses against each other. As we make advances in reasoning and model behavior, ChatGPT becomes more accurate and its mistakes become more subtle. This can make it hard for..."}],"related_signals":[{"id":"b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","url":"https://onlylabs.fyi/signals/b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","source_url":"https://openai.com/index/supporting-eu-trustworthy-ai-ecosystem","title":"Supporting Europe’s work in ensuring a trustworthy AI ecosystem ","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T08:00:56.140796+00:00","date_source":"rss.item_date"},{"id":"2638c0a7-b372-409c-ac72-f6d81d6464dc","url":"https://onlylabs.fyi/signals/2638c0a7-b372-409c-ac72-f6d81d6464dc","source_url":"https://openai.com/index/using-codex-to-simulate-black-holes","title":"How an astrophysicist uses Codex to help simulate black holes","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"509ea784-51ec-4ede-855b-5a4d1b27d3be","url":"https://onlylabs.fyi/signals/509ea784-51ec-4ede-855b-5a4d1b27d3be","source_url":"https://openai.com/index/openai-on-oracle-cloud","title":"Access OpenAI models and Codex through your Oracle cloud commitment","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T20:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4f051449-87f2-466e-941e-b5918381a8fe","url":"https://onlylabs.fyi/signals/4f051449-87f2-466e-941e-b5918381a8fe","source_url":"https://openai.com/index/prc-linked-influence-operations-ai-debates","title":"PRC-linked influence operations are targeting AI debates in the US","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T12:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","url":"https://onlylabs.fyi/signals/4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","source_url":"https://openai.com/index/lseg","title":"From data to decisions: how LSEG is scaling trusted AI","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T00:00:00+00:00","first_seen_at":"2026-06-10T09:18:54.26094+00:00","date_source":"rss.item_date"},{"id":"fb16aa7a-c4ef-4859-b514-0839c2f1330d","url":"https://onlylabs.fyi/signals/fb16aa7a-c4ef-4859-b514-0839c2f1330d","source_url":"https://openai.com/index/nextdoor","title":"How engineers at Nextdoor use Codex to build without limits","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-09T12:00:00+00:00","first_seen_at":"2026-06-10T07:01:28.700378+00:00","date_source":"rss.item_date"}]}