{"schema_version":"onlylabs.public_signal.v1","title":"Sarvam AI Repo: sarvamai/llm_wer","description":"Sarvam AI repo signal with public source context, captured evidence pages, related signals, and category-scoped analysis context.","url":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0","json_url":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0/signal.json","generated_at":"2026-06-11T03:20:47.596116+00:00","org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab","category_label":"Neolab","dossier_url":"https://onlylabs.fyi/labs/sarvam","dossier_json_url":"https://onlylabs.fyi/labs/sarvam/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0","signal_json":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0/signal.json","source":"https://github.com/sarvamai/llm_wer","lab_dossier":"https://onlylabs.fyi/labs/sarvam","lab_dossier_json":"https://onlylabs.fyi/labs/sarvam/dossier.json","analysis":"https://onlylabs.fyi/analysis/sarvam","analysis_json":"https://onlylabs.fyi/analysis/sarvam/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/sarvam/evidence.json","category":"https://onlylabs.fyi/neolabs","category_json":"https://onlylabs.fyi/neolabs.json","category_feed":"https://onlylabs.fyi/neolabs/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json?category=neolab","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":null},"answer_pack":{"answer":"Sarvam AI published sarvamai/llm_wer (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo sarvamai/llm_wer · language Python · New repo, low stars. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","signal_desk":"repos","source_context":{"source_url":"https://github.com/sarvamai/llm_wer","source_host":"github.com","occurred_at":"2025-07-08T06:39:43+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Sarvam AI","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"sarvamai/llm_wer","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Stars","value":"26","source":"traction"},{"label":"Notability","value":"New repo, low stars","source":"signal"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/sarvamai/llm_wer"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:20:47.596116+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0/signal.json","dossier_json":"https://onlylabs.fyi/labs/sarvam/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/sarvam/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/sarvam/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json?category=neolab","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","evidence_url"],"data_business_relevance":"Data-business lane extraction is scoped to frontier labs; for this category, interpret the repository as source-grounded category strategy evidence.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0/signal.json","required":true},{"label":"source","url":"https://github.com/sarvamai/llm_wer","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/sarvam/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/sarvam/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Sarvam AI's repo signal \"sarvamai/llm_wer\" for neolab strategy."},"semantic_triples":[{"subject":"Sarvam AI","predicate":"published repo","object":"sarvamai/llm_wer","text":"Sarvam AI published repo sarvamai/llm_wer."},{"subject":"sarvamai/llm_wer","predicate":"is classified as","object":"repo signal","text":"sarvamai/llm_wer is classified as repo signal."},{"subject":"sarvamai/llm_wer","predicate":"belongs to","object":"repos desk","text":"sarvamai/llm_wer belongs to repos desk."},{"subject":"sarvamai/llm_wer","predicate":"has context","object":"Python","text":"sarvamai/llm_wer has context Python."},{"subject":"sarvamai/llm_wer","predicate":"has evidence coverage","object":"1 captured evidence page","text":"sarvamai/llm_wer has evidence coverage 1 captured evidence page."},{"subject":"sarvamai/llm_wer","predicate":"has captured page count","object":"1","text":"sarvamai/llm_wer has captured page count 1."},{"subject":"sarvamai/llm_wer","predicate":"has readable page count","object":"1","text":"sarvamai/llm_wer has readable page count 1."},{"subject":"sarvamai/llm_wer","predicate":"has related signal count","object":"6","text":"sarvamai/llm_wer has related signal count 6."},{"subject":"sarvamai/llm_wer","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"sarvamai/llm_wer has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"sarvamai/llm_wer","predicate":"has source host","object":"github.com","text":"sarvamai/llm_wer has source host github.com."},{"subject":"sarvamai/llm_wer","predicate":"has lab","object":"Sarvam AI","text":"sarvamai/llm_wer has lab Sarvam AI."},{"subject":"sarvamai/llm_wer","predicate":"has signal desk","object":"repos","text":"sarvamai/llm_wer has signal desk repos."},{"subject":"sarvamai/llm_wer","predicate":"has source host","object":"github.com","text":"sarvamai/llm_wer has source host github.com."},{"subject":"sarvamai/llm_wer","predicate":"has repository","object":"sarvamai/llm_wer","text":"sarvamai/llm_wer has repository sarvamai/llm_wer."},{"subject":"sarvamai/llm_wer","predicate":"has language","object":"Python","text":"sarvamai/llm_wer has language Python."},{"subject":"sarvamai/llm_wer","predicate":"has stars","object":"26","text":"sarvamai/llm_wer has stars 26."},{"subject":"sarvamai/llm_wer","predicate":"has notability","object":"New repo, low stars","text":"sarvamai/llm_wer has notability New repo, low stars."},{"subject":"sarvamai/llm_wer","predicate":"has watch term","object":"Eval methodology","text":"sarvamai/llm_wer has watch term Eval methodology."}]},"intelligence":{"signal_desk":"repos","answer":"Sarvam AI published sarvamai/llm_wer (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo sarvamai/llm_wer · language Python · New repo, low stars. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","semantic_triples":[{"subject":"Sarvam AI","predicate":"published repo","object":"sarvamai/llm_wer","text":"Sarvam AI published repo sarvamai/llm_wer."},{"subject":"sarvamai/llm_wer","predicate":"is classified as","object":"repo signal","text":"sarvamai/llm_wer is classified as repo signal."},{"subject":"sarvamai/llm_wer","predicate":"belongs to","object":"repos desk","text":"sarvamai/llm_wer belongs to repos desk."},{"subject":"sarvamai/llm_wer","predicate":"has context","object":"Python","text":"sarvamai/llm_wer has context Python."},{"subject":"sarvamai/llm_wer","predicate":"has evidence coverage","object":"1 captured evidence page","text":"sarvamai/llm_wer has evidence coverage 1 captured evidence page."}]},"signal":{"id":"495f5bb8-10b1-41c4-8486-4047477767b0","url":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0","json_url":"https://onlylabs.fyi/signals/495f5bb8-10b1-41c4-8486-4047477767b0/signal.json","source_url":"https://github.com/sarvamai/llm_wer","title":"sarvamai/llm_wer","summary":"Sarvam AI published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2025-07-08T06:39:43+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/sarvamai/llm_wer"]},"facets":{"repo":"sarvamai/llm_wer","language":"Python"},"traction":{"github_stars":26,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://github.com/sarvamai/llm_wer","final_url":"https://github.com/sarvamai/llm_wer","title":"sarvamai/llm_wer repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:20:47.596116+00:00","bytes":11647,"raw_path":"7d7668e2b1c5430b48064f58f0bbdbfc6158ba95240495c5614c4751a6bee328.json","content_hash":"755d888f960cc871ea924f39eac2f3cd1bd801b8cb6fe5c6ccc449372415137f","excerpt_chars":1200,"truncated":true,"excerpt":"sarvamai/llm_wer Language: Python Stars: 26 Forks: 9 Open issues: 3 Created: 2025-07-08T06:39:43Z Pushed: 2026-04-02T14:00:43Z Default branch: main Fork: no Archived: no README: Background and Motivation To evaluate Automatic Speech Recognition, we traditionally use metrics like Word Error Rate (WER) and Character Error Rate (CER). These metrics work by strictly comparing the ASR's transcribed text to a perfect, human-verified reference text, word for word. However, human language, especially in a multilingual context like India, is fluid and filled with nuances. A rigid, word-for-word comparison often penalizes ASR models for making stylistic or formatting choices that are perfectly acceptable and do not change the meaning of the text. This leads to an inflated error rate and an inaccurate assessment of the ASR's true performance. Why Standard WER is Insufficient for Indic Languages Standard WER can be misleading because it fails to understand context and semantic equivalence. It flags any textual difference as an error, even when no actual mistake in understanding has occurred. Here are a few cases where the WER would be high, but the transcription is functionally correct: -..."},"evidence_pages":[{"url":"https://github.com/sarvamai/llm_wer","final_url":"https://github.com/sarvamai/llm_wer","title":"sarvamai/llm_wer repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:20:47.596116+00:00","bytes":11647,"raw_path":"7d7668e2b1c5430b48064f58f0bbdbfc6158ba95240495c5614c4751a6bee328.json","content_hash":"755d888f960cc871ea924f39eac2f3cd1bd801b8cb6fe5c6ccc449372415137f","excerpt_chars":1200,"truncated":true,"excerpt":"sarvamai/llm_wer Language: Python Stars: 26 Forks: 9 Open issues: 3 Created: 2025-07-08T06:39:43Z Pushed: 2026-04-02T14:00:43Z Default branch: main Fork: no Archived: no README: Background and Motivation To evaluate Automatic Speech Recognition, we traditionally use metrics like Word Error Rate (WER) and Character Error Rate (CER). These metrics work by strictly comparing the ASR's transcribed text to a perfect, human-verified reference text, word for word. However, human language, especially in a multilingual context like India, is fluid and filled with nuances. A rigid, word-for-word comparison often penalizes ASR models for making stylistic or formatting choices that are perfectly acceptable and do not change the meaning of the text. This leads to an inflated error rate and an inaccurate assessment of the ASR's true performance. Why Standard WER is Insufficient for Indic Languages Standard WER can be misleading because it fails to understand context and semantic equivalence. It flags any textual difference as an error, even when no actual mistake in understanding has occurred. Here are a few cases where the WER would be high, but the transcription is functionally correct: -..."}],"related_signals":[{"id":"3fe36150-c035-4288-8712-0eb98e7b97c7","url":"https://onlylabs.fyi/signals/3fe36150-c035-4288-8712-0eb98e7b97c7","source_url":"https://github.com/sarvamai/sarvam-pulse","title":"sarvamai/sarvam-pulse","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2026-04-28T17:07:47+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"},{"id":"91a9d011-aa48-4da6-a34e-8335ad697261","url":"https://onlylabs.fyi/signals/91a9d011-aa48-4da6-a34e-8335ad697261","source_url":"https://github.com/sarvamai/sarvam-mcp","title":"sarvamai/sarvam-mcp","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2026-04-27T13:44:58+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"},{"id":"aea1f29c-7523-4e59-b0c8-62dae7f538f5","url":"https://onlylabs.fyi/signals/aea1f29c-7523-4e59-b0c8-62dae7f538f5","source_url":"https://github.com/sarvamai/n8n-sarvam-node","title":"sarvamai/n8n-sarvam-node","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2026-02-27T12:52:34+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"},{"id":"a1bedd4f-c7ee-4e77-9fc6-d60750cb4c34","url":"https://onlylabs.fyi/signals/a1bedd4f-c7ee-4e77-9fc6-d60750cb4c34","source_url":"https://github.com/sarvamai/olmOCR-bench-sarvam-api","title":"sarvamai/olmOCR-bench-sarvam-api","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2026-02-08T13:08:27+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"},{"id":"ca47d671-60e7-422d-ab0d-225ea71d05bd","url":"https://onlylabs.fyi/signals/ca47d671-60e7-422d-ab0d-225ea71d05bd","source_url":"https://github.com/sarvamai/skills","title":"sarvamai/skills","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2026-02-04T12:49:56+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"},{"id":"e5bb1a7a-78f1-4af9-9074-3c3e7a55caf2","url":"https://onlylabs.fyi/signals/e5bb1a7a-78f1-4af9-9074-3c3e7a55caf2","source_url":"https://github.com/sarvamai/llm_intent_entity","title":"sarvamai/llm_intent_entity","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"sarvam","name":"Sarvam AI","category":"neolab"},"occurred_at":"2025-11-20T13:20:42+00:00","first_seen_at":"2026-06-05T20:58:50.739664+00:00","date_source":"source"}]}