{"schema_version":"onlylabs.public_signal.v1","title":"Qwen (Alibaba Cloud) Writing: QwQ-32B: Embracing the Power of Reinforcement Learning","description":"Qwen (Alibaba Cloud) writing signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d","json_url":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d/signal.json","generated_at":"2026-06-07T21:16:10.756207+00:00","org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/qwen","dossier_json_url":"https://onlylabs.fyi/labs/qwen/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d","signal_json":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d/signal.json","source":"https://qwenlm.github.io/blog/qwq-32b/","lab_dossier":"https://onlylabs.fyi/labs/qwen","lab_dossier_json":"https://onlylabs.fyi/labs/qwen/dossier.json","analysis":"https://onlylabs.fyi/analysis/qwen","analysis_json":"https://onlylabs.fyi/analysis/qwen/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/qwen/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":"https://onlylabs.fyi/topics/talking","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data","json_url":"https://onlylabs.fyi/data-radar/data/signals.json"},{"key":"infrastructure","label":"Infrastructure","url":"https://onlylabs.fyi/data-radar/infrastructure","json_url":"https://onlylabs.fyi/data-radar/infrastructure/signals.json"}]}},"answer_pack":{"answer":"Qwen (Alibaba Cloud) published QwQ-32B: Embracing the Power of Reinforcement Learning. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Notable 32B model release from Qwen on RL. · QwQ-32B: Embracing the Power of Reinforcement Learning | Qwen We have a new blog! View this page at qwen.ai . This page will automatically redirect in 5 seconds. If you.... onlylabs links this event to 1 captured evidence page and 6 related writing signals. It also maps to Data demand, Infrastructure in the data-business radar.","signal_desk":"talking","source_context":{"source_url":"https://qwenlm.github.io/blog/qwq-32b/","source_host":"qwenlm.github.io","occurred_at":"2025-03-06T00:00:00.000Z","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"page.visible_date","context":null},"context_markers":[{"label":"Lab","value":"Qwen (Alibaba Cloud)","source":"signal"},{"label":"Signal desk","value":"talking","source":"signal"},{"label":"Source host","value":"qwenlm.github.io","source":"source"},{"label":"Notability","value":"Notable 32B model release from Qwen on RL.","source":"signal"},{"label":"Radar lane","value":"Data demand","source":"radar"},{"label":"Radar lane","value":"Infrastructure","source":"radar"},{"label":"Matched term","value":"data","source":"radar"},{"label":"Matched term","value":"training","source":"radar"},{"label":"Matched term","value":"scaling","source":"radar"},{"label":"Watch term","value":"RL environments","source":"evidence"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Model card","source":"model"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://qwenlm.github.io/blog/qwq-32b/"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-07T21:16:10.756207+00:00"},"data_business":{"matches":true,"lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data","json_url":"https://onlylabs.fyi/data-radar/data/signals.json"},{"key":"infrastructure","label":"Infrastructure","url":"https://onlylabs.fyi/data-radar/infrastructure","json_url":"https://onlylabs.fyi/data-radar/infrastructure/signals.json"}],"matched_terms":["data","training","scaling"],"score":27,"reason":"Qwen (Alibaba Cloud) has a writing signal matching data demand, infrastructure."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d/signal.json","dossier_json":"https://onlylabs.fyi/labs/qwen/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/qwen/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/qwen/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","evidence_focus":["post title","source URL","captured page text","HN traction","linked model or paper references","publication date"],"extraction_questions":["Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which writing reframes a recent release, model, hiring wave, or policy stance?","Which posts mention data, evals, infrastructure, safety, or deployment workflows?"],"signal_questions":["What public theme, launch framing, or research direction does this writing signal expose?","Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which data-business lane explains this signal: Data demand, Infrastructure?","Do the 6 related writing signals show a repeated pattern?"],"output_fields":["org","theme","public_framing","traction","data_business_lane","evidence_url"],"data_business_relevance":"Public writing supplies the narrative layer over raw signals and helps identify which frontier-lab priorities are becoming externally legible.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d/signal.json","required":true},{"label":"source","url":"https://qwenlm.github.io/blog/qwq-32b/","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/qwen/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/qwen/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/talking/signals.json","required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Qwen (Alibaba Cloud)'s writing signal \"QwQ-32B: Embracing the Power of Reinforcement Learning\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"Qwen (Alibaba Cloud)","predicate":"published","object":"QwQ-32B: Embracing the Power of Reinforcement Learning","text":"Qwen (Alibaba Cloud) published QwQ-32B: Embracing the Power of Reinforcement Learning."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"is classified as","object":"writing signal","text":"QwQ-32B: Embracing the Power of Reinforcement Learning is classified as writing signal."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"belongs to","object":"talking desk","text":"QwQ-32B: Embracing the Power of Reinforcement Learning belongs to talking desk."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has evidence coverage","object":"1 captured evidence page","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has evidence coverage 1 captured evidence page."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"matches data-business lanes","object":"Data demand, Infrastructure","text":"QwQ-32B: Embracing the Power of Reinforcement Learning matches data-business lanes Data demand, Infrastructure."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has captured page count","object":"1","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has captured page count 1."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has readable page count","object":"1","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has readable page count 1."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has related signal count","object":"6","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has related signal count 6."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has analysis playbook objective","object":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has analysis playbook objective Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has source host","object":"qwenlm.github.io","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has source host qwenlm.github.io."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has lab","object":"Qwen (Alibaba Cloud)","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has lab Qwen (Alibaba Cloud)."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has signal desk","object":"talking","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has signal desk talking."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has source host","object":"qwenlm.github.io","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has source host qwenlm.github.io."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has notability","object":"Notable 32B model release from Qwen on RL.","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has notability Notable 32B model release from Qwen on RL.."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has radar lane","object":"Data demand","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has radar lane Data demand."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has radar lane","object":"Infrastructure","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has radar lane Infrastructure."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has matched term","object":"data","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has matched term data."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has matched term","object":"training","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has matched term training."}]},"intelligence":{"signal_desk":"talking","answer":"Qwen (Alibaba Cloud) published QwQ-32B: Embracing the Power of Reinforcement Learning. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Notable 32B model release from Qwen on RL. · QwQ-32B: Embracing the Power of Reinforcement Learning | Qwen We have a new blog! View this page at qwen.ai . This page will automatically redirect in 5 seconds. If you.... onlylabs links this event to 1 captured evidence page and 6 related writing signals. It also maps to Data demand, Infrastructure in the data-business radar.","semantic_triples":[{"subject":"Qwen (Alibaba Cloud)","predicate":"published","object":"QwQ-32B: Embracing the Power of Reinforcement Learning","text":"Qwen (Alibaba Cloud) published QwQ-32B: Embracing the Power of Reinforcement Learning."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"is classified as","object":"writing signal","text":"QwQ-32B: Embracing the Power of Reinforcement Learning is classified as writing signal."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"belongs to","object":"talking desk","text":"QwQ-32B: Embracing the Power of Reinforcement Learning belongs to talking desk."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"has evidence coverage","object":"1 captured evidence page","text":"QwQ-32B: Embracing the Power of Reinforcement Learning has evidence coverage 1 captured evidence page."},{"subject":"QwQ-32B: Embracing the Power of Reinforcement Learning","predicate":"matches data-business lanes","object":"Data demand, Infrastructure","text":"QwQ-32B: Embracing the Power of Reinforcement Learning matches data-business lanes Data demand, Infrastructure."}]},"signal":{"id":"9c153b01-a5ba-44cf-be25-8f8516b3fa5d","url":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d","json_url":"https://onlylabs.fyi/signals/9c153b01-a5ba-44cf-be25-8f8516b3fa5d/signal.json","source_url":"https://qwenlm.github.io/blog/qwq-32b/","title":"QwQ-32B: Embracing the Power of Reinforcement Learning","summary":"Qwen (Alibaba Cloud) published a writing signal. onlylabs watches public writing for research themes, product direction, and model-launch context.","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-03-06T00:00:00.000Z","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"page.visible_date","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://qwenlm.github.io/blog/qwq-32b/"]},"facets":{},"traction":{"github_stars":null,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data"},{"key":"infrastructure","label":"Infrastructure","url":"https://onlylabs.fyi/data-radar/infrastructure"}],"score":27,"matched_terms":["data","training","scaling"],"reason":"Qwen (Alibaba Cloud) has a writing signal matching data demand, infrastructure."}},"primary_evidence_page":{"url":"https://qwenlm.github.io/blog/qwq-32b/","final_url":"https://qwenlm.github.io/blog/qwq-32b/","title":"QwQ-32B: Embracing the Power of Reinforcement Learning","http_status":200,"content_type":"text/html; charset=utf-8","capture_method":"plain","fetched_at":"2026-06-07T21:16:10.756207+00:00","bytes":38445,"raw_path":"e4f2769e35e0d4258db229c9e4578f4c33dee785954d3a547d5b8c1d85fe39d0.html","content_hash":"3737d8bf0f14f300b2950436ef0ee44946d99c5b4e2d5465ad8564f856258a03","excerpt_chars":1200,"truncated":true,"excerpt":"QwQ-32B: Embracing the Power of Reinforcement Learning | Qwen We have a new blog! View this page at qwen.ai . This page will automatically redirect in 5 seconds. If you are not redirected automatically, please click the button below. Go Now QwQ-32B: Embracing the Power of Reinforcement Learning March 6, 2025 · 4 min · 742 words · Qwen Team | Translations: 简体中文 QWEN CHAT Hugging Face ModelScope DEMO DISCORD Scaling Reinforcement Learning (RL) has the potential to enhance model performance beyond conventional pretraining and post-training methods. Recent studies have demonstrated that RL can significantly improve the reasoning capabilities of models. For instance, DeepSeek R1 has achieved state-of-the-art performance by integrating cold-start data and multi-stage training, enabling deep thinking and complex reasoning. Our research explores the scalability of Reinforcement Learning (RL) and its impact on enhancing the intelligence of large language models. We are excited to introduce QwQ-32B, a model with 32 billion parameters that achieves performance comparable to DeepSeek-R1, which boasts 671 billion parameters (with 37 billion activated). This remarkable outcome underscores the..."},"evidence_pages":[{"url":"https://qwenlm.github.io/blog/qwq-32b/","final_url":"https://qwenlm.github.io/blog/qwq-32b/","title":"QwQ-32B: Embracing the Power of Reinforcement Learning","http_status":200,"content_type":"text/html; charset=utf-8","capture_method":"plain","fetched_at":"2026-06-07T21:16:10.756207+00:00","bytes":38445,"raw_path":"e4f2769e35e0d4258db229c9e4578f4c33dee785954d3a547d5b8c1d85fe39d0.html","content_hash":"3737d8bf0f14f300b2950436ef0ee44946d99c5b4e2d5465ad8564f856258a03","excerpt_chars":1200,"truncated":true,"excerpt":"QwQ-32B: Embracing the Power of Reinforcement Learning | Qwen We have a new blog! View this page at qwen.ai . This page will automatically redirect in 5 seconds. If you are not redirected automatically, please click the button below. Go Now QwQ-32B: Embracing the Power of Reinforcement Learning March 6, 2025 · 4 min · 742 words · Qwen Team | Translations: 简体中文 QWEN CHAT Hugging Face ModelScope DEMO DISCORD Scaling Reinforcement Learning (RL) has the potential to enhance model performance beyond conventional pretraining and post-training methods. Recent studies have demonstrated that RL can significantly improve the reasoning capabilities of models. For instance, DeepSeek R1 has achieved state-of-the-art performance by integrating cold-start data and multi-stage training, enabling deep thinking and complex reasoning. Our research explores the scalability of Reinforcement Learning (RL) and its impact on enhancing the intelligence of large language models. We are excited to introduce QwQ-32B, a model with 32 billion parameters that achieves performance comparable to DeepSeek-R1, which boasts 671 billion parameters (with 37 billion activated). This remarkable outcome underscores the..."}],"related_signals":[{"id":"54029233-5b0e-4748-aae1-6013ae3553d0","url":"https://onlylabs.fyi/signals/54029233-5b0e-4748-aae1-6013ae3553d0","source_url":"https://qwenlm.github.io/blog/qwen3guard/","title":"Qwen3Guard: Real-time Safety for Your Token Stream","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-09-22T20:00:00+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"},{"id":"4e64c872-3d4f-4d01-8908-35b65736eb6e","url":"https://onlylabs.fyi/signals/4e64c872-3d4f-4d01-8908-35b65736eb6e","source_url":"https://qwenlm.github.io/blog/qwen-image-edit/","title":"Qwen-Image-Edit: Image Editing with Higher Quality and Efficiency","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-08-18T17:30:00+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"},{"id":"27bd1b4a-28a4-423c-abb0-e5d24251de65","url":"https://onlylabs.fyi/signals/27bd1b4a-28a4-423c-abb0-e5d24251de65","source_url":"https://qwenlm.github.io/blog/qwen-image/","title":"Qwen-Image: Crafting with Native Text Rendering","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-08-04T14:08:30+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"},{"id":"c662ae5e-1dd9-42a6-8297-87bc670d59ef","url":"https://onlylabs.fyi/signals/c662ae5e-1dd9-42a6-8297-87bc670d59ef","source_url":"https://qwenlm.github.io/blog/gspo/","title":"GSPO: Towards Scalable Reinforcement Learning for Language Models","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-07-27T07:00:00+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"},{"id":"22c0d58c-5ce1-4d1f-97df-de5ebd764517","url":"https://onlylabs.fyi/signals/22c0d58c-5ce1-4d1f-97df-de5ebd764517","source_url":"https://qwenlm.github.io/blog/qwen-mt/","title":"Qwen-MT: Where Speed Meets Smart Translation","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-07-24T14:00:00+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"},{"id":"b6e0bdb2-ffd3-4aed-b44b-732a5e0424a5","url":"https://onlylabs.fyi/signals/b6e0bdb2-ffd3-4aed-b44b-732a5e0424a5","source_url":"https://qwenlm.github.io/blog/qwen3-coder/","title":"Qwen3-Coder: Agentic Coding in the World","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"qwen","name":"Qwen (Alibaba Cloud)","category":"frontier-lab"},"occurred_at":"2025-07-22T13:00:00+00:00","first_seen_at":"2026-06-05T05:42:59.088452+00:00","date_source":"rss.item_date"}]}