{"schema_version":"onlylabs.public_signal.v1","title":"Microsoft Repo: microsoft/Staccato-Stuttered-ASR","description":"Microsoft repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93","json_url":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93/signal.json","generated_at":"2026-06-11T03:03:02.497009+00:00","org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/microsoft","dossier_json_url":"https://onlylabs.fyi/labs/microsoft/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93","signal_json":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93/signal.json","source":"https://github.com/microsoft/Staccato-Stuttered-ASR","lab_dossier":"https://onlylabs.fyi/labs/microsoft","lab_dossier_json":"https://onlylabs.fyi/labs/microsoft/dossier.json","analysis":"https://onlylabs.fyi/analysis/microsoft","analysis_json":"https://onlylabs.fyi/analysis/microsoft/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/microsoft/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":null},"answer_pack":{"answer":"Microsoft published microsoft/Staccato-Stuttered-ASR (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo microsoft/Staccato-Stuttered-ASR · language Python · New repo from Microsoft on ASR, no traction info. 
onlylabs links this event to 1 captured evidence page and 6 related repo signals.","signal_desk":"repos","source_context":{"source_url":"https://github.com/microsoft/Staccato-Stuttered-ASR","source_host":"github.com","occurred_at":"2026-01-07T21:54:17+00:00","first_seen_at":"2026-06-06T01:49:41.740219+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Microsoft","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"microsoft/Staccato-Stuttered-ASR","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Notability","value":"New repo from Microsoft on ASR, no traction info","source":"signal"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/microsoft/Staccato-Stuttered-ASR"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:03:02.497009+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93/signal.json","dossier_json":"https://onlylabs.fyi/labs/microsoft/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/microsoft/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/microsoft/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before 
it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93/signal.json","required":true},{"label":"source","url":"https://github.com/microsoft/Staccato-Stuttered-ASR","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/microsoft/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/microsoft/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Microsoft's repo signal \"microsoft/Staccato-Stuttered-ASR\" for frontier lab 
strategy."},"semantic_triples":[{"subject":"Microsoft","predicate":"published repo","object":"microsoft/Staccato-Stuttered-ASR","text":"Microsoft published repo microsoft/Staccato-Stuttered-ASR."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"is classified as","object":"repo signal","text":"microsoft/Staccato-Stuttered-ASR is classified as repo signal."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"belongs to","object":"repos desk","text":"microsoft/Staccato-Stuttered-ASR belongs to repos desk."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has context","object":"Python","text":"microsoft/Staccato-Stuttered-ASR has context Python."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has evidence coverage","object":"1 captured evidence page","text":"microsoft/Staccato-Stuttered-ASR has evidence coverage 1 captured evidence page."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has captured page count","object":"1","text":"microsoft/Staccato-Stuttered-ASR has captured page count 1."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has readable page count","object":"1","text":"microsoft/Staccato-Stuttered-ASR has readable page count 1."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has related signal count","object":"6","text":"microsoft/Staccato-Stuttered-ASR has related signal count 6."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"microsoft/Staccato-Stuttered-ASR has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has source 
host","object":"github.com","text":"microsoft/Staccato-Stuttered-ASR has source host github.com."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has lab","object":"Microsoft","text":"microsoft/Staccato-Stuttered-ASR has lab Microsoft."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has signal desk","object":"repos","text":"microsoft/Staccato-Stuttered-ASR has signal desk repos."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has source host","object":"github.com","text":"microsoft/Staccato-Stuttered-ASR has source host github.com."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has repository","object":"microsoft/Staccato-Stuttered-ASR","text":"microsoft/Staccato-Stuttered-ASR has repository microsoft/Staccato-Stuttered-ASR."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has language","object":"Python","text":"microsoft/Staccato-Stuttered-ASR has language Python."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has notability","object":"New repo from Microsoft on ASR, no traction info","text":"microsoft/Staccato-Stuttered-ASR has notability New repo from Microsoft on ASR, no traction info."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has watch term","object":"Eval methodology","text":"microsoft/Staccato-Stuttered-ASR has watch term Eval methodology."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has watch term","object":"Infrastructure","text":"microsoft/Staccato-Stuttered-ASR has watch term Infrastructure."}]},"intelligence":{"signal_desk":"repos","answer":"Microsoft published microsoft/Staccato-Stuttered-ASR (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo microsoft/Staccato-Stuttered-ASR · language Python · New repo from Microsoft on ASR, no traction info. 
onlylabs links this event to 1 captured evidence page and 6 related repo signals.","semantic_triples":[{"subject":"Microsoft","predicate":"published repo","object":"microsoft/Staccato-Stuttered-ASR","text":"Microsoft published repo microsoft/Staccato-Stuttered-ASR."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"is classified as","object":"repo signal","text":"microsoft/Staccato-Stuttered-ASR is classified as repo signal."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"belongs to","object":"repos desk","text":"microsoft/Staccato-Stuttered-ASR belongs to repos desk."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has context","object":"Python","text":"microsoft/Staccato-Stuttered-ASR has context Python."},{"subject":"microsoft/Staccato-Stuttered-ASR","predicate":"has evidence coverage","object":"1 captured evidence page","text":"microsoft/Staccato-Stuttered-ASR has evidence coverage 1 captured evidence page."}]},"signal":{"id":"6153a7ef-2070-4c98-b5d7-6eb5bdab5f93","url":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93","json_url":"https://onlylabs.fyi/signals/6153a7ef-2070-4c98-b5d7-6eb5bdab5f93/signal.json","source_url":"https://github.com/microsoft/Staccato-Stuttered-ASR","title":"microsoft/Staccato-Stuttered-ASR","summary":"Microsoft published a new repository. 
onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-01-07T21:54:17+00:00","first_seen_at":"2026-06-06T01:49:41.740219+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/microsoft/Staccato-Stuttered-ASR"]},"facets":{"repo":"microsoft/Staccato-Stuttered-ASR","language":"Python"},"traction":{"github_stars":0,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://github.com/microsoft/Staccato-Stuttered-ASR","final_url":"https://github.com/microsoft/Staccato-Stuttered-ASR","title":"microsoft/Staccato-Stuttered-ASR repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:03:02.497009+00:00","bytes":11760,"raw_path":"78e82f2417e63d139f7e2c9a7d3d155d41ac523340bd395045c00c992d0925e5.json","content_hash":"8632e872bae52090d356e05cb23f34a245f7ffa8b4c43bd4217112de1fc8bb1a","excerpt_chars":1200,"truncated":true,"excerpt":"microsoft/Staccato-Stuttered-ASR Language: Python License: MIT Stars: 0 Forks: 0 Open issues: 15 Created: 2026-01-07T21:54:17Z Pushed: 2026-06-05T23:41:43Z Default branch: main Fork: no Archived: no README: Staccato: Stuttered Speech Recognition Staccato is a speech recognition pipeline optimized for transcribing stuttered speech. It combines OpenAI's Whisper model with GPT-4o to produce accurate transcriptions that capture the speaker's intended message, filtering out involuntary disfluencies. Overview People who stutter speak with involuntary sound repetitions, word repetitions, prolongations, and blocks. 
Standard ASR models like Whisper are not trained on stuttered speech data and often produce poor transcriptions. Staccato addresses this by: 1. **Whisper transcription**: Initial transcription using Whisper Large V3 2. **GPT-4o refinement**: Uses GPT-4o with audio understanding to refine the transcription, leveraging both the audio and initial transcription Installation Prerequisites - Python 3.12+ - NVIDIA GPU with CUDA support (CUDA 11.8+) - CUDA toolkit installed (`nvcc` must be in PATH) - Linux (tested on Ubuntu) - Git Setup 1. Clone the repository: ```bash git clone..."},"evidence_pages":[{"url":"https://github.com/microsoft/Staccato-Stuttered-ASR","final_url":"https://github.com/microsoft/Staccato-Stuttered-ASR","title":"microsoft/Staccato-Stuttered-ASR repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:03:02.497009+00:00","bytes":11760,"raw_path":"78e82f2417e63d139f7e2c9a7d3d155d41ac523340bd395045c00c992d0925e5.json","content_hash":"8632e872bae52090d356e05cb23f34a245f7ffa8b4c43bd4217112de1fc8bb1a","excerpt_chars":1200,"truncated":true,"excerpt":"microsoft/Staccato-Stuttered-ASR Language: Python License: MIT Stars: 0 Forks: 0 Open issues: 15 Created: 2026-01-07T21:54:17Z Pushed: 2026-06-05T23:41:43Z Default branch: main Fork: no Archived: no README: Staccato: Stuttered Speech Recognition Staccato is a speech recognition pipeline optimized for transcribing stuttered speech. It combines OpenAI's Whisper model with GPT-4o to produce accurate transcriptions that capture the speaker's intended message, filtering out involuntary disfluencies. Overview People who stutter speak with involuntary sound repetitions, word repetitions, prolongations, and blocks. Standard ASR models like Whisper are not trained on stuttered speech data and often produce poor transcriptions. Staccato addresses this by: 1. **Whisper transcription**: Initial transcription using Whisper Large V3 2. 
**GPT-4o refinement**: Uses GPT-4o with audio understanding to refine the transcription, leveraging both the audio and initial transcription Installation Prerequisites - Python 3.12+ - NVIDIA GPU with CUDA support (CUDA 11.8+) - CUDA toolkit installed (`nvcc` must be in PATH) - Linux (tested on Ubuntu) - Git Setup 1. Clone the repository: ```bash git clone..."}],"related_signals":[{"id":"8afe79f4-378b-4748-9e2a-3cf5e3253fdb","url":"https://onlylabs.fyi/signals/8afe79f4-378b-4748-9e2a-3cf5e3253fdb","source_url":"https://github.com/microsoft/Dev-Trio","title":"microsoft/Dev-Trio","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-08T03:41:01+00:00","first_seen_at":"2026-06-08T07:01:04.198092+00:00","date_source":"source"},{"id":"9e75fa50-dba7-4b77-9faf-166c323e3dff","url":"https://onlylabs.fyi/signals/9e75fa50-dba7-4b77-9faf-166c323e3dff","source_url":"https://github.com/microsoft/amplifier-app-paperclip","title":"microsoft/amplifier-app-paperclip","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T21:13:41+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"76cacf33-54b2-4074-bec0-23944d8fb67c","url":"https://onlylabs.fyi/signals/76cacf33-54b2-4074-bec0-23944d8fb67c","source_url":"https://github.com/microsoft/create-github-app-token-via-key-vault","title":"microsoft/create-github-app-token-via-key-vault","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T18:22:49+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"b2f7bcbd-9db3-4785-8a2a-2e0e0cb22ed2","url":"https://onlylabs.fyi/signals/b2f7bcbd-9db3-4785-8a2a-2e0e0cb22ed2","source_url":"https://github.com/microsoft/Enterprise-A
I-Analytics-Pipeline","title":"microsoft/Enterprise-AI-Analytics-Pipeline","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-04T16:48:58+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"51a9ec5d-5f14-45d9-b57a-db362b5d1ace","url":"https://onlylabs.fyi/signals/51a9ec5d-5f14-45d9-b57a-db362b5d1ace","source_url":"https://github.com/microsoft/fabric-org-app-template","title":"microsoft/fabric-org-app-template","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-03T18:26:42+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"},{"id":"f26025da-153f-4d27-851c-7b4892602810","url":"https://onlylabs.fyi/signals/f26025da-153f-4d27-851c-7b4892602810","source_url":"https://github.com/microsoft/amplifier-bundle-amplifier-online","title":"microsoft/amplifier-bundle-amplifier-online","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"microsoft","name":"Microsoft","category":"frontier-lab"},"occurred_at":"2026-06-03T17:26:20+00:00","first_seen_at":"2026-06-05T20:58:41.438741+00:00","date_source":"source"}]}