{"schema_version":"onlylabs.public_signal.v1","title":"Google (DeepMind / Gemini) Repo: google-deepmind/bbeh","description":"Google (DeepMind / Gemini) repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29","json_url":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29/signal.json","generated_at":"2026-06-11T04:00:37.326762+00:00","org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/google-deepmind","dossier_json_url":"https://onlylabs.fyi/labs/google-deepmind/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29","signal_json":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29/signal.json","source":"https://github.com/google-deepmind/bbeh","lab_dossier":"https://onlylabs.fyi/labs/google-deepmind","lab_dossier_json":"https://onlylabs.fyi/labs/google-deepmind/dossier.json","analysis":"https://onlylabs.fyi/analysis/google-deepmind","analysis_json":"https://onlylabs.fyi/analysis/google-deepmind/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/google-deepmind/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":null},"answer_pack":{"answer":"Google (DeepMind / Gemini) published google-deepmind/bbeh (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo google-deepmind/bbeh · language Python · New repo from DeepMind, low stars. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","signal_desk":"repos","source_context":{"source_url":"https://github.com/google-deepmind/bbeh","source_host":"github.com","occurred_at":"2025-02-25T19:47:19+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Google (DeepMind / Gemini)","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"google-deepmind/bbeh","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Stars","value":"120","source":"traction"},{"label":"Notability","value":"New repo from DeepMind, low stars","source":"signal"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/google-deepmind/bbeh"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T04:00:37.326762+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29/signal.json","dossier_json":"https://onlylabs.fyi/labs/google-deepmind/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/google-deepmind/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/google-deepmind/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29/signal.json","required":true},{"label":"source","url":"https://github.com/google-deepmind/bbeh","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/google-deepmind/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/google-deepmind/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Google (DeepMind / Gemini)'s repo signal \"google-deepmind/bbeh\" for frontier lab strategy."},"semantic_triples":[{"subject":"Google (DeepMind / Gemini)","predicate":"published repo","object":"google-deepmind/bbeh","text":"Google (DeepMind / Gemini) published repo google-deepmind/bbeh."},{"subject":"google-deepmind/bbeh","predicate":"is classified as","object":"repo signal","text":"google-deepmind/bbeh is classified as repo signal."},{"subject":"google-deepmind/bbeh","predicate":"belongs to","object":"repos desk","text":"google-deepmind/bbeh belongs to repos desk."},{"subject":"google-deepmind/bbeh","predicate":"has context","object":"Python","text":"google-deepmind/bbeh has context Python."},{"subject":"google-deepmind/bbeh","predicate":"has evidence coverage","object":"1 captured evidence page","text":"google-deepmind/bbeh has evidence coverage 1 captured evidence page."},{"subject":"google-deepmind/bbeh","predicate":"has captured page count","object":"1","text":"google-deepmind/bbeh has captured page count 1."},{"subject":"google-deepmind/bbeh","predicate":"has readable page count","object":"1","text":"google-deepmind/bbeh has readable page count 1."},{"subject":"google-deepmind/bbeh","predicate":"has related signal count","object":"6","text":"google-deepmind/bbeh has related signal count 6."},{"subject":"google-deepmind/bbeh","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"google-deepmind/bbeh has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"google-deepmind/bbeh","predicate":"has source host","object":"github.com","text":"google-deepmind/bbeh has source host github.com."},{"subject":"google-deepmind/bbeh","predicate":"has lab","object":"Google (DeepMind / Gemini)","text":"google-deepmind/bbeh has lab Google (DeepMind / Gemini)."},{"subject":"google-deepmind/bbeh","predicate":"has signal desk","object":"repos","text":"google-deepmind/bbeh has signal desk repos."},{"subject":"google-deepmind/bbeh","predicate":"has source host","object":"github.com","text":"google-deepmind/bbeh has source host github.com."},{"subject":"google-deepmind/bbeh","predicate":"has repository","object":"google-deepmind/bbeh","text":"google-deepmind/bbeh has repository google-deepmind/bbeh."},{"subject":"google-deepmind/bbeh","predicate":"has language","object":"Python","text":"google-deepmind/bbeh has language Python."},{"subject":"google-deepmind/bbeh","predicate":"has stars","object":"120","text":"google-deepmind/bbeh has stars 120."},{"subject":"google-deepmind/bbeh","predicate":"has notability","object":"New repo from DeepMind, low stars","text":"google-deepmind/bbeh has notability New repo from DeepMind, low stars."},{"subject":"google-deepmind/bbeh","predicate":"has watch term","object":"Eval methodology","text":"google-deepmind/bbeh has watch term Eval methodology."}]},"intelligence":{"signal_desk":"repos","answer":"Google (DeepMind / Gemini) published google-deepmind/bbeh (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo google-deepmind/bbeh · language Python · New repo from DeepMind, low stars. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","semantic_triples":[{"subject":"Google (DeepMind / Gemini)","predicate":"published repo","object":"google-deepmind/bbeh","text":"Google (DeepMind / Gemini) published repo google-deepmind/bbeh."},{"subject":"google-deepmind/bbeh","predicate":"is classified as","object":"repo signal","text":"google-deepmind/bbeh is classified as repo signal."},{"subject":"google-deepmind/bbeh","predicate":"belongs to","object":"repos desk","text":"google-deepmind/bbeh belongs to repos desk."},{"subject":"google-deepmind/bbeh","predicate":"has context","object":"Python","text":"google-deepmind/bbeh has context Python."},{"subject":"google-deepmind/bbeh","predicate":"has evidence coverage","object":"1 captured evidence page","text":"google-deepmind/bbeh has evidence coverage 1 captured evidence page."}]},"signal":{"id":"05319577-9fdc-4f35-918a-9aa6918bbd29","url":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29","json_url":"https://onlylabs.fyi/signals/05319577-9fdc-4f35-918a-9aa6918bbd29/signal.json","source_url":"https://github.com/google-deepmind/bbeh","title":"google-deepmind/bbeh","summary":"Google (DeepMind / Gemini) published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2025-02-25T19:47:19+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/google-deepmind/bbeh"]},"facets":{"repo":"google-deepmind/bbeh","language":"Python"},"traction":{"github_stars":120,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://github.com/google-deepmind/bbeh","final_url":"https://github.com/google-deepmind/bbeh","title":"google-deepmind/bbeh repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T04:00:37.326762+00:00","bytes":15483,"raw_path":"93216a8cc1a2f30fbe41d563510a631209231ef01a8fd7d96d3ed767170035db.json","content_hash":"c4355ef44be519b147886dce1b8728390ffd119c43f579e5c8eae9018539bdf8","excerpt_chars":1200,"truncated":true,"excerpt":"google-deepmind/bbeh Language: Python License: Apache-2.0 Stars: 121 Forks: 9 Open issues: 5 Created: 2025-02-25T19:47:19Z Pushed: 2025-05-07T14:25:47Z Default branch: main Fork: no Archived: no README: <!-- mdlint off(SNIPPET_INVALID_LANGUAGE) --> <!-- mdlint off(LINE_OVER_80) --> BIG-Bench Extra Hard ![BBEH_LOGO](images/bbeh_logo.png) Large language models (LLMs) are increasingly deployed in everyday applications, demanding robust general reasoning capabilities and diverse reasoning skillset. However, current LLM reasoning benchmarks predominantly focus on mathematical and coding abilities, leaving a gap in evaluating broader reasoning proficiencies. One particular exception is the BIG-Bench dataset, which has served as a crucial benchmark for evaluating the general reasoning capabilities of LLMs, thanks to its diverse set of challenging tasks that allowed for a comprehensive assessment of general reasoning across various skills within a unified framework. However, recent advances in LLMs have led to saturation on BIG-Bench, and its harder version BIG-Bench Hard (BBH). State-of-the-art models achieve near-perfect scores on many tasks in BBH, thus diminishing its utility. To..."},"evidence_pages":[{"url":"https://github.com/google-deepmind/bbeh","final_url":"https://github.com/google-deepmind/bbeh","title":"google-deepmind/bbeh repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T04:00:37.326762+00:00","bytes":15483,"raw_path":"93216a8cc1a2f30fbe41d563510a631209231ef01a8fd7d96d3ed767170035db.json","content_hash":"c4355ef44be519b147886dce1b8728390ffd119c43f579e5c8eae9018539bdf8","excerpt_chars":1200,"truncated":true,"excerpt":"google-deepmind/bbeh Language: Python License: Apache-2.0 Stars: 121 Forks: 9 Open issues: 5 Created: 2025-02-25T19:47:19Z Pushed: 2025-05-07T14:25:47Z Default branch: main Fork: no Archived: no README: <!-- mdlint off(SNIPPET_INVALID_LANGUAGE) --> <!-- mdlint off(LINE_OVER_80) --> BIG-Bench Extra Hard ![BBEH_LOGO](images/bbeh_logo.png) Large language models (LLMs) are increasingly deployed in everyday applications, demanding robust general reasoning capabilities and diverse reasoning skillset. However, current LLM reasoning benchmarks predominantly focus on mathematical and coding abilities, leaving a gap in evaluating broader reasoning proficiencies. One particular exception is the BIG-Bench dataset, which has served as a crucial benchmark for evaluating the general reasoning capabilities of LLMs, thanks to its diverse set of challenging tasks that allowed for a comprehensive assessment of general reasoning across various skills within a unified framework. However, recent advances in LLMs have led to saturation on BIG-Bench, and its harder version BIG-Bench Hard (BBH). State-of-the-art models achieve near-perfect scores on many tasks in BBH, thus diminishing its utility. To..."}],"related_signals":[{"id":"02f8701d-7bfd-41b5-aabe-1ad72a880dfb","url":"https://onlylabs.fyi/signals/02f8701d-7bfd-41b5-aabe-1ad72a880dfb","source_url":"https://github.com/google-deepmind/unpic","title":"google-deepmind/unpic","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-06-04T14:37:24+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"},{"id":"35320cac-ddbe-4f25-a3b5-384a0ca0030b","url":"https://onlylabs.fyi/signals/35320cac-ddbe-4f25-a3b5-384a0ca0030b","source_url":"https://github.com/google-deepmind/seeing_without_pixels","title":"google-deepmind/seeing_without_pixels","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-06-03T04:04:52+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"},{"id":"62f799ef-bf1d-4aee-9f87-fa0de8bb5e81","url":"https://onlylabs.fyi/signals/62f799ef-bf1d-4aee-9f87-fa0de8bb5e81","source_url":"https://github.com/google-deepmind/nested","title":"google-deepmind/nested","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-05-18T16:16:42+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"},{"id":"e67b1d5f-ef62-4574-80df-a72a4bded705","url":"https://onlylabs.fyi/signals/e67b1d5f-ef62-4574-80df-a72a4bded705","source_url":"https://github.com/google-deepmind/science-skills","title":"google-deepmind/science-skills","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-05-13T16:17:41+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"},{"id":"7b714793-a56e-495b-8d57-85fd2850555a","url":"https://onlylabs.fyi/signals/7b714793-a56e-495b-8d57-85fd2850555a","source_url":"https://github.com/google-deepmind/alphaproof-nexus-results","title":"google-deepmind/alphaproof-nexus-results","context":"Lean","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-05-13T09:59:21+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"},{"id":"dab748d2-53d6-4972-a594-eb6bfbf727ea","url":"https://onlylabs.fyi/signals/dab748d2-53d6-4972-a594-eb6bfbf727ea","source_url":"https://github.com/google-deepmind/tecci","title":"google-deepmind/tecci","context":"JavaScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"google-deepmind","name":"Google (DeepMind / Gemini)","category":"frontier-lab"},"occurred_at":"2026-05-05T12:22:40+00:00","first_seen_at":"2026-06-05T05:42:58.453363+00:00","date_source":"source"}]}