{"schema_version":"onlylabs.public_signal.v1","title":"Microsoft Repo: microsoft/OdysseyBench","description":"Microsoft repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606","json_url":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606/signal.json","generated_at":"2026-06-11T03:56:32.820228+00:00","org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/microsoft","dossier_json_url":"https://onlylabs.fyi/labs/microsoft/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606","signal_json":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606/signal.json","source":"https://github.com/microsoft/OdysseyBench","lab_dossier":"https://onlylabs.fyi/labs/microsoft","lab_dossier_json":"https://onlylabs.fyi/labs/microsoft/dossier.json","analysis":"https://onlylabs.fyi/analysis/microsoft","analysis_json":"https://onlylabs.fyi/analysis/microsoft/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/microsoft/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"},{"key":"product","label":"Product and customer","url":"https://onlylabs.fyi/data-radar/product","json_url":"https://onlylabs.fyi/data-radar/product/signals.json"}]}},"answer_pack":{"answer":"Microsoft published microsoft/OdysseyBench (Jupyter Notebook). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo microsoft/OdysseyBench · language Jupyter Notebook · New repo with only 10 stars.. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality, Product and customer in the data-business radar.","signal_desk":"repos","source_context":{"source_url":"https://github.com/microsoft/OdysseyBench","source_host":"github.com","occurred_at":"2025-10-10T11:22:39+00:00","first_seen_at":"2026-06-06T01:49:41.740219+00:00","date_source":"source","context":"Jupyter Notebook"},"context_markers":[{"label":"Lab","value":"Microsoft","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"microsoft/OdysseyBench","source":"source"},{"label":"Language","value":"Jupyter Notebook","source":"source"},{"label":"Stars","value":"10","source":"traction"},{"label":"Notability","value":"New repo with only 10 stars.","source":"signal"},{"label":"Radar lane","value":"Evals and quality","source":"radar"},{"label":"Radar lane","value":"Product and customer","source":"radar"},{"label":"Matched term","value":"eval","source":"radar"},{"label":"Matched term","value":"benchmark","source":"radar"},{"label":"Matched term","value":"product","source":"radar"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/microsoft/OdysseyBench"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:56:32.820228+00:00"},"data_business":{"matches":true,"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"},{"key":"product","label":"Product and customer","url":"https://onlylabs.fyi/data-radar/product","json_url":"https://onlylabs.fyi/data-radar/product/signals.json"}],"matched_terms":["eval","benchmark","product"],"score":28,"reason":"Microsoft has a repo signal matching evals and quality, product and customer."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606/signal.json","dossier_json":"https://onlylabs.fyi/labs/microsoft/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/microsoft/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/microsoft/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Which data-business lane explains this signal: Evals and quality, Product and customer?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606/signal.json","required":true},{"label":"source","url":"https://github.com/microsoft/OdysseyBench","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/microsoft/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/microsoft/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Microsoft's repo signal \"microsoft/OdysseyBench\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"Microsoft","predicate":"published repo","object":"microsoft/OdysseyBench","text":"Microsoft published repo microsoft/OdysseyBench."},{"subject":"microsoft/OdysseyBench","predicate":"is classified as","object":"repo signal","text":"microsoft/OdysseyBench is classified as repo signal."},{"subject":"microsoft/OdysseyBench","predicate":"belongs to","object":"repos desk","text":"microsoft/OdysseyBench belongs to repos desk."},{"subject":"microsoft/OdysseyBench","predicate":"has context","object":"Jupyter Notebook","text":"microsoft/OdysseyBench has context Jupyter Notebook."},{"subject":"microsoft/OdysseyBench","predicate":"has evidence coverage","object":"1 captured evidence page","text":"microsoft/OdysseyBench has evidence coverage 1 captured evidence page."},{"subject":"microsoft/OdysseyBench","predicate":"matches data-business lanes","object":"Evals and quality, Product and customer","text":"microsoft/OdysseyBench matches data-business lanes Evals and quality, Product and customer."},{"subject":"microsoft/OdysseyBench","predicate":"has captured page count","object":"1","text":"microsoft/OdysseyBench has captured page count 1."},{"subject":"microsoft/OdysseyBench","predicate":"has readable page count","object":"1","text":"microsoft/OdysseyBench has readable page count 1."},{"subject":"microsoft/OdysseyBench","predicate":"has related signal count","object":"6","text":"microsoft/OdysseyBench has related signal count 6."},{"subject":"microsoft/OdysseyBench","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"microsoft/OdysseyBench has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"microsoft/OdysseyBench","predicate":"has source host","object":"github.com","text":"microsoft/OdysseyBench has source host github.com."},{"subject":"microsoft/OdysseyBench","predicate":"has lab","object":"Microsoft","text":"microsoft/OdysseyBench has lab Microsoft."},{"subject":"microsoft/OdysseyBench","predicate":"has signal desk","object":"repos","text":"microsoft/OdysseyBench has signal desk repos."},{"subject":"microsoft/OdysseyBench","predicate":"has source host","object":"github.com","text":"microsoft/OdysseyBench has source host github.com."},{"subject":"microsoft/OdysseyBench","predicate":"has repository","object":"microsoft/OdysseyBench","text":"microsoft/OdysseyBench has repository microsoft/OdysseyBench."},{"subject":"microsoft/OdysseyBench","predicate":"has language","object":"Jupyter Notebook","text":"microsoft/OdysseyBench has language Jupyter Notebook."},{"subject":"microsoft/OdysseyBench","predicate":"has stars","object":"10","text":"microsoft/OdysseyBench has stars 10."},{"subject":"microsoft/OdysseyBench","predicate":"has notability","object":"New repo with only 10 stars.","text":"microsoft/OdysseyBench has notability New repo with only 10 stars.."},{"subject":"microsoft/OdysseyBench","predicate":"has radar lane","object":"Evals and quality","text":"microsoft/OdysseyBench has radar lane Evals and quality."}]},"intelligence":{"signal_desk":"repos","answer":"Microsoft published microsoft/OdysseyBench (Jupyter Notebook). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo microsoft/OdysseyBench · language Jupyter Notebook · New repo with only 10 stars.. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality, Product and customer in the data-business radar.","semantic_triples":[{"subject":"Microsoft","predicate":"published repo","object":"microsoft/OdysseyBench","text":"Microsoft published repo microsoft/OdysseyBench."},{"subject":"microsoft/OdysseyBench","predicate":"is classified as","object":"repo signal","text":"microsoft/OdysseyBench is classified as repo signal."},{"subject":"microsoft/OdysseyBench","predicate":"belongs to","object":"repos desk","text":"microsoft/OdysseyBench belongs to repos desk."},{"subject":"microsoft/OdysseyBench","predicate":"has context","object":"Jupyter Notebook","text":"microsoft/OdysseyBench has context Jupyter Notebook."},{"subject":"microsoft/OdysseyBench","predicate":"has evidence coverage","object":"1 captured evidence page","text":"microsoft/OdysseyBench has evidence coverage 1 captured evidence page."},{"subject":"microsoft/OdysseyBench","predicate":"matches data-business lanes","object":"Evals and quality, Product and customer","text":"microsoft/OdysseyBench matches data-business lanes Evals and quality, Product and customer."}]},"signal":{"id":"0fef14a8-0b64-43b9-bc0d-75b8cb461606","url":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606","json_url":"https://onlylabs.fyi/signals/0fef14a8-0b64-43b9-bc0d-75b8cb461606/signal.json","source_url":"https://github.com/microsoft/OdysseyBench","title":"microsoft/OdysseyBench","summary":"Microsoft published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Jupyter Notebook","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2025-10-10T11:22:39+00:00","first_seen_at":"2026-06-06T01:49:41.740219+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/microsoft/OdysseyBench"]},"facets":{"repo":"microsoft/OdysseyBench","language":"Jupyter Notebook"},"traction":{"github_stars":10,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals"},{"key":"product","label":"Product and customer","url":"https://onlylabs.fyi/data-radar/product"}],"score":28,"matched_terms":["eval","benchmark","product"],"reason":"Microsoft has a repo signal matching evals and quality, product and customer."}},"primary_evidence_page":{"url":"https://github.com/microsoft/OdysseyBench","final_url":"https://github.com/microsoft/OdysseyBench","title":"microsoft/OdysseyBench repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:56:32.820228+00:00","bytes":11896,"raw_path":"7ece5a73c754eea5e566511f90bb65a6e31bc74d180d8f342fc5359927592e78.json","content_hash":"b3d149d8cacd4ef4e5c6fd3c6f19d0d0d163f831cc094747d4452fee3a2f60e2","excerpt_chars":1200,"truncated":true,"excerpt":"microsoft/OdysseyBench Description: Repo for the OdysseyBench Benchmark for Evaluating Agent Memory on Long-horizon Productivity Workflows Language: Jupyter Notebook License: MIT Stars: 10 Forks: 0 Open issues: 22 Created: 2025-10-10T11:22:39Z Pushed: 2026-06-11T00:11:52Z Default branch: main Fork: no Archived: no README: OdysseyBench: Evaluating LLM Agents on Long-Horizon Complex Office Application Workflows OdysseyBench is a comprehensive benchmark and evaluation suite for task-oriented agent systems, supporting both the OdysseyBench+ and OdysseyBench-Neo tracks. This project provides tools for task generation, execution, validation, and in-depth evaluation of agent performance, with a focus on memory and retrieval-augmented generation (RAG) capabilities. 💼 Preparation ``` git clone https://github.com/microsoft/OdysseyBench.git git clone https://github.com/zlwang-cs/OfficeBench.git /tmp/OfficeBench find /tmp/OfficeBench/tasks/ -type d -name testbed -exec bash -c 'dest=\"OdysseyBench/tasks/${1#*/tasks/}\"; mkdir -p \"$dest\"; cp -r \"$1\" \"$dest/../\"' _ {} \\; rm -rf /tmp/OfficeBench ``` 🛠️ Setup ``` conda create -n odysseybench python=3.10 pip install -r requirements.txt export..."},"evidence_pages":[{"url":"https://github.com/microsoft/OdysseyBench","final_url":"https://github.com/microsoft/OdysseyBench","title":"microsoft/OdysseyBench repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:56:32.820228+00:00","bytes":11896,"raw_path":"7ece5a73c754eea5e566511f90bb65a6e31bc74d180d8f342fc5359927592e78.json","content_hash":"b3d149d8cacd4ef4e5c6fd3c6f19d0d0d163f831cc094747d4452fee3a2f60e2","excerpt_chars":1200,"truncated":true,"excerpt":"microsoft/OdysseyBench Description: Repo for the OdysseyBench Benchmark for Evaluating Agent Memory on Long-horizon Productivity Workflows Language: Jupyter Notebook License: MIT Stars: 10 Forks: 0 Open issues: 22 Created: 2025-10-10T11:22:39Z Pushed: 2026-06-11T00:11:52Z Default branch: main Fork: no Archived: no README: OdysseyBench: Evaluating LLM Agents on Long-Horizon Complex Office Application Workflows OdysseyBench is a comprehensive benchmark and evaluation suite for task-oriented agent systems, supporting both the OdysseyBench+ and OdysseyBench-Neo tracks. This project provides tools for task generation, execution, validation, and in-depth evaluation of agent performance, with a focus on memory and retrieval-augmented generation (RAG) capabilities. 💼 Preparation ``` git clone https://github.com/microsoft/OdysseyBench.git git clone https://github.com/zlwang-cs/OfficeBench.git /tmp/OfficeBench find /tmp/OfficeBench/tasks/ -type d -name testbed -exec bash -c 'dest=\"OdysseyBench/tasks/${1#*/tasks/}\"; mkdir -p \"$dest\"; cp -r \"$1\" \"$dest/../\"' _ {} \\; rm -rf /tmp/OfficeBench ``` 🛠️ Setup ``` conda create -n odysseybench python=3.10 pip install -r requirements.txt export..."}],"related_signals":[{"id":"8afe79f4-378b-4748-9e2a-3cf5e3253fdb","url":"https://onlylabs.fyi/signals/8afe79f4-378b-4748-9e2a-3cf5e3253fdb","source_url":"https://github.com/microsoft/Dev-Trio","title":"microsoft/Dev-Trio","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-08T03:41:01+00:00","first_seen_at":"2026-06-08T07:01:04.198092+00:00","date_source":"source"},{"id":"9e75fa50-dba7-4b77-9faf-166c323e3dff","url":"https://onlylabs.fyi/signals/9e75fa50-dba7-4b77-9faf-166c323e3dff","source_url":"https://github.com/microsoft/amplifier-app-paperclip","title":"microsoft/amplifier-app-paperclip","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T21:13:41+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"76cacf33-54b2-4074-bec0-23944d8fb67c","url":"https://onlylabs.fyi/signals/76cacf33-54b2-4074-bec0-23944d8fb67c","source_url":"https://github.com/microsoft/create-github-app-token-via-key-vault","title":"microsoft/create-github-app-token-via-key-vault","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T18:22:49+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"b2f7bcbd-9db3-4785-8a2a-2e0e0cb22ed2","url":"https://onlylabs.fyi/signals/b2f7bcbd-9db3-4785-8a2a-2e0e0cb22ed2","source_url":"https://github.com/microsoft/Enterprise-AI-Analytics-Pipeline","title":"microsoft/Enterprise-AI-Analytics-Pipeline","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T16:48:58+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"51a9ec5d-5f14-45d9-b57a-db362b5d1ace","url":"https://onlylabs.fyi/signals/51a9ec5d-5f14-45d9-b57a-db362b5d1ace","source_url":"https://github.com/microsoft/fabric-org-app-template","title":"microsoft/fabric-org-app-template","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-03T18:26:42+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"f26025da-153f-4d27-851c-7b4892602810","url":"https://onlylabs.fyi/signals/f26025da-153f-4d27-851c-7b4892602810","source_url":"https://github.com/microsoft/amplifier-bundle-amplifier-online","title":"microsoft/amplifier-bundle-amplifier-online","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-03T17:26:20+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"}]}