{"schema_version":"onlylabs.public_signal.v1","title":"Cohere Repo: cohere-ai/DiskVectorIndex","description":"Cohere repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38","json_url":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38/signal.json","generated_at":"2026-06-11T03:58:55.637458+00:00","org":{"slug":"cohere","name":"Cohere","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/cohere","dossier_json_url":"https://onlylabs.fyi/labs/cohere/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38","signal_json":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38/signal.json","source":"https://github.com/cohere-ai/DiskVectorIndex","lab_dossier":"https://onlylabs.fyi/labs/cohere","lab_dossier_json":"https://onlylabs.fyi/labs/cohere/dossier.json","analysis":"https://onlylabs.fyi/analysis/cohere","analysis_json":"https://onlylabs.fyi/analysis/cohere/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/cohere/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":null},"answer_pack":{"answer":"Cohere published cohere-ai/DiskVectorIndex (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo cohere-ai/DiskVectorIndex · language Python. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","signal_desk":"repos","source_context":{"source_url":"https://github.com/cohere-ai/DiskVectorIndex","source_host":"github.com","occurred_at":"2024-07-02T19:08:30+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Cohere","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"cohere-ai/DiskVectorIndex","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Stars","value":"210","source":"traction"},{"label":"Watch term","value":"Data pipeline","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/cohere-ai/DiskVectorIndex"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:58:55.637458+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38/signal.json","dossier_json":"https://onlylabs.fyi/labs/cohere/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/cohere/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/cohere/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38/signal.json","required":true},{"label":"source","url":"https://github.com/cohere-ai/DiskVectorIndex","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/cohere/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/cohere/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Cohere's repo signal \"cohere-ai/DiskVectorIndex\" for frontier lab strategy."},"semantic_triples":[{"subject":"Cohere","predicate":"published repo","object":"cohere-ai/DiskVectorIndex","text":"Cohere published repo cohere-ai/DiskVectorIndex."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"is classified as","object":"repo signal","text":"cohere-ai/DiskVectorIndex is classified as repo signal."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"belongs to","object":"repos desk","text":"cohere-ai/DiskVectorIndex belongs to repos desk."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has context","object":"Python","text":"cohere-ai/DiskVectorIndex has context Python."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has evidence coverage","object":"1 captured evidence page","text":"cohere-ai/DiskVectorIndex has evidence coverage 1 captured evidence page."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has captured page count","object":"1","text":"cohere-ai/DiskVectorIndex has captured page count 1."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has readable page count","object":"1","text":"cohere-ai/DiskVectorIndex has readable page count 1."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has related signal count","object":"6","text":"cohere-ai/DiskVectorIndex has related signal count 6."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"cohere-ai/DiskVectorIndex has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has source host","object":"github.com","text":"cohere-ai/DiskVectorIndex has source host github.com."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has lab","object":"Cohere","text":"cohere-ai/DiskVectorIndex has lab Cohere."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has signal desk","object":"repos","text":"cohere-ai/DiskVectorIndex has signal desk repos."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has source host","object":"github.com","text":"cohere-ai/DiskVectorIndex has source host github.com."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has repository","object":"cohere-ai/DiskVectorIndex","text":"cohere-ai/DiskVectorIndex has repository cohere-ai/DiskVectorIndex."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has language","object":"Python","text":"cohere-ai/DiskVectorIndex has language Python."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has stars","object":"210","text":"cohere-ai/DiskVectorIndex has stars 210."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has watch term","object":"Data pipeline","text":"cohere-ai/DiskVectorIndex has watch term Data pipeline."}]},"intelligence":{"signal_desk":"repos","answer":"Cohere published cohere-ai/DiskVectorIndex (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo cohere-ai/DiskVectorIndex · language Python. onlylabs links this event to 1 captured evidence page and 6 related repo signals.","semantic_triples":[{"subject":"Cohere","predicate":"published repo","object":"cohere-ai/DiskVectorIndex","text":"Cohere published repo cohere-ai/DiskVectorIndex."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"is classified as","object":"repo signal","text":"cohere-ai/DiskVectorIndex is classified as repo signal."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"belongs to","object":"repos desk","text":"cohere-ai/DiskVectorIndex belongs to repos desk."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has context","object":"Python","text":"cohere-ai/DiskVectorIndex has context Python."},{"subject":"cohere-ai/DiskVectorIndex","predicate":"has evidence coverage","object":"1 captured evidence page","text":"cohere-ai/DiskVectorIndex has evidence coverage 1 captured evidence page."}]},"signal":{"id":"c0a14421-330d-45c5-8309-3ac364685f38","url":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38","json_url":"https://onlylabs.fyi/signals/c0a14421-330d-45c5-8309-3ac364685f38/signal.json","source_url":"https://github.com/cohere-ai/DiskVectorIndex","title":"cohere-ai/DiskVectorIndex","summary":"Cohere published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2024-07-02T19:08:30+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/cohere-ai/DiskVectorIndex"]},"facets":{"repo":"cohere-ai/DiskVectorIndex","language":"Python"},"traction":{"github_stars":210,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://github.com/cohere-ai/DiskVectorIndex","final_url":"https://github.com/cohere-ai/DiskVectorIndex","title":"cohere-ai/DiskVectorIndex repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:58:55.637458+00:00","bytes":12112,"raw_path":"7be2906be10635985a18d0fb2da3a29843978bf23560a045fe92373ee074ac92.json","content_hash":"61ac6ef7c8189accd56b30802331b6c84c1fbc594c496aed352ac1e0daca20d3","excerpt_chars":1200,"truncated":true,"excerpt":"cohere-ai/DiskVectorIndex Language: Python License: Apache-2.0 Stars: 210 Forks: 12 Open issues: 3 Created: 2024-07-02T19:08:30Z Pushed: 2025-06-26T21:40:29Z Default branch: main Fork: no Archived: no README: DiskVectorIndex - Ultra-Low Memory Vector Search on Large Dataset Indexing large datasets (100M+ embeddings) requires a lot of memory in most vector databases: For 100M documents/embeddings, most vector databases require about **500GB of memory**, driving the cost for your servers accordingly high. This repository offers methods to be able to search on very large datasets (100M+) with just **300MB of memory**, making semantic search on such large datasets suitable for the Memory-Poor developers. We provide various pre-build indices, that can be used to semantic search and powering your RAG applications. Pre-Build Indices Below you find different pre-build indices. The embeddings are downloaded at the first call, the size is specified under Index Size. Most of the embeddings are memory mapped from disk, e.g. for the `Cohere/trec-rag-2024-index` corpus you need 15 GB of disk, but just 380 MB of memory to load the index. | Name | Description | #Docs | Index Size (GB) | Memory..."},"evidence_pages":[{"url":"https://github.com/cohere-ai/DiskVectorIndex","final_url":"https://github.com/cohere-ai/DiskVectorIndex","title":"cohere-ai/DiskVectorIndex repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:58:55.637458+00:00","bytes":12112,"raw_path":"7be2906be10635985a18d0fb2da3a29843978bf23560a045fe92373ee074ac92.json","content_hash":"61ac6ef7c8189accd56b30802331b6c84c1fbc594c496aed352ac1e0daca20d3","excerpt_chars":1200,"truncated":true,"excerpt":"cohere-ai/DiskVectorIndex Language: Python License: Apache-2.0 Stars: 210 Forks: 12 Open issues: 3 Created: 2024-07-02T19:08:30Z Pushed: 2025-06-26T21:40:29Z Default branch: main Fork: no Archived: no README: DiskVectorIndex - Ultra-Low Memory Vector Search on Large Dataset Indexing large datasets (100M+ embeddings) requires a lot of memory in most vector databases: For 100M documents/embeddings, most vector databases require about **500GB of memory**, driving the cost for your servers accordingly high. This repository offers methods to be able to search on very large datasets (100M+) with just **300MB of memory**, making semantic search on such large datasets suitable for the Memory-Poor developers. We provide various pre-build indices, that can be used to semantic search and powering your RAG applications. Pre-Build Indices Below you find different pre-build indices. The embeddings are downloaded at the first call, the size is specified under Index Size. Most of the embeddings are memory mapped from disk, e.g. for the `Cohere/trec-rag-2024-index` corpus you need 15 GB of disk, but just 380 MB of memory to load the index. | Name | Description | #Docs | Index Size (GB) | Memory..."}],"related_signals":[{"id":"b04cc72b-18a2-4d54-a2ff-ac76954c11eb","url":"https://onlylabs.fyi/signals/b04cc72b-18a2-4d54-a2ff-ac76954c11eb","source_url":"https://github.com/cohere-ai/cohere-azure-workshops","title":"cohere-ai/cohere-azure-workshops","context":"Jupyter Notebook","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2026-05-01T21:40:24+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"},{"id":"dd51f42b-b547-4722-88fa-9e9b7ba7a5ae","url":"https://onlylabs.fyi/signals/dd51f42b-b547-4722-88fa-9e9b7ba7a5ae","source_url":"https://github.com/cohere-ai/cvm-measure","title":"cohere-ai/cvm-measure","context":"Makefile","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2026-04-10T19:07:01+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"},{"id":"8f7c20cc-6531-4978-bb14-4e3b1d6c7b25","url":"https://onlylabs.fyi/signals/8f7c20cc-6531-4978-bb14-4e3b1d6c7b25","source_url":"https://github.com/cohere-ai/melody","title":"cohere-ai/melody","context":"Rust","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2025-10-10T17:32:30+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"},{"id":"93fef8fe-ae41-4db2-aa12-e85c4b88fda0","url":"https://onlylabs.fyi/signals/93fef8fe-ae41-4db2-aa12-e85c4b88fda0","source_url":"https://github.com/cohere-ai/htn-2025-techtalk","title":"cohere-ai/htn-2025-techtalk","context":"Jupyter Notebook","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2025-09-04T01:21:23+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"},{"id":"a8a38c03-91f9-452f-915d-2191c3a03296","url":"https://onlylabs.fyi/signals/a8a38c03-91f9-452f-915d-2191c3a03296","source_url":"https://github.com/cohere-ai/north-mcp-python-sdk","title":"cohere-ai/north-mcp-python-sdk","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2025-05-08T13:04:41+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"},{"id":"f4ee1bbf-3fd2-4c59-9827-17979cbffa3c","url":"https://onlylabs.fyi/signals/f4ee1bbf-3fd2-4c59-9827-17979cbffa3c","source_url":"https://github.com/cohere-ai/cohere-workshop-march-17-2025","title":"cohere-ai/cohere-workshop-march-17-2025","context":"Jupyter Notebook","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"cohere","name":"Cohere","category":"frontier-lab"},"occurred_at":"2025-02-25T14:18:28+00:00","first_seen_at":"2026-06-05T05:43:00.174979+00:00","date_source":"source"}]}