{"schema_version":"onlylabs.public_signal.v1","title":"Tencent Hunyuan Repo: Tencent-Hunyuan/C3-Benchmark","description":"Tencent Hunyuan repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72","json_url":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72/signal.json","generated_at":"2026-06-11T03:57:32.506242+00:00","org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/tencent-hunyuan","dossier_json_url":"https://onlylabs.fyi/labs/tencent-hunyuan/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72","signal_json":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72/signal.json","source":"https://github.com/Tencent-Hunyuan/C3-Benchmark","lab_dossier":"https://onlylabs.fyi/labs/tencent-hunyuan","lab_dossier_json":"https://onlylabs.fyi/labs/tencent-hunyuan/dossier.json","analysis":"https://onlylabs.fyi/analysis/tencent-hunyuan","analysis_json":"https://onlylabs.fyi/analysis/tencent-hunyuan/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/tencent-hunyuan/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}]}},"answer_pack":{"answer":"Tencent Hunyuan published Tencent-Hunyuan/C3-Benchmark (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo Tencent-Hunyuan/C3-Benchmark · language Python · New benchmark repo, low traction. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality in the data-business radar.","signal_desk":"repos","source_context":{"source_url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","source_host":"github.com","occurred_at":"2025-06-26T13:37:43+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Tencent Hunyuan","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"Tencent-Hunyuan/C3-Benchmark","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Stars","value":"38","source":"traction"},{"label":"Notability","value":"New benchmark repo, low traction","source":"signal"},{"label":"Radar lane","value":"Evals and quality","source":"radar"},{"label":"Matched term","value":"benchmark","source":"radar"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/Tencent-Hunyuan/C3-Benchmark"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:57:32.506242+00:00"},"data_business":{"matches":true,"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}],"matched_terms":["benchmark"],"score":14,"reason":"Tencent Hunyuan has a repo signal matching evals and quality."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72/signal.json","dossier_json":"https://onlylabs.fyi/labs/tencent-hunyuan/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/tencent-hunyuan/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/tencent-hunyuan/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Which data-business lane explains this signal: Evals and quality?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72/signal.json","required":true},{"label":"source","url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/tencent-hunyuan/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/tencent-hunyuan/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Tencent Hunyuan's repo signal \"Tencent-Hunyuan/C3-Benchmark\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"Tencent Hunyuan","predicate":"published repo","object":"Tencent-Hunyuan/C3-Benchmark","text":"Tencent Hunyuan published repo Tencent-Hunyuan/C3-Benchmark."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"is classified as","object":"repo signal","text":"Tencent-Hunyuan/C3-Benchmark is classified as repo signal."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"belongs to","object":"repos desk","text":"Tencent-Hunyuan/C3-Benchmark belongs to repos desk."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has context","object":"Python","text":"Tencent-Hunyuan/C3-Benchmark has context Python."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Tencent-Hunyuan/C3-Benchmark has evidence coverage 1 captured evidence page."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"matches data-business lanes","object":"Evals and quality","text":"Tencent-Hunyuan/C3-Benchmark matches data-business lanes Evals and quality."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has captured page count","object":"1","text":"Tencent-Hunyuan/C3-Benchmark has captured page count 1."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has readable page count","object":"1","text":"Tencent-Hunyuan/C3-Benchmark has readable page count 1."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has related signal count","object":"6","text":"Tencent-Hunyuan/C3-Benchmark has related signal count 6."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"Tencent-Hunyuan/C3-Benchmark has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has source host","object":"github.com","text":"Tencent-Hunyuan/C3-Benchmark has source host github.com."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has lab","object":"Tencent Hunyuan","text":"Tencent-Hunyuan/C3-Benchmark has lab Tencent Hunyuan."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has signal desk","object":"repos","text":"Tencent-Hunyuan/C3-Benchmark has signal desk repos."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has source host","object":"github.com","text":"Tencent-Hunyuan/C3-Benchmark has source host github.com."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has repository","object":"Tencent-Hunyuan/C3-Benchmark","text":"Tencent-Hunyuan/C3-Benchmark has repository Tencent-Hunyuan/C3-Benchmark."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has language","object":"Python","text":"Tencent-Hunyuan/C3-Benchmark has language Python."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has stars","object":"38","text":"Tencent-Hunyuan/C3-Benchmark has stars 38."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has notability","object":"New benchmark repo, low traction","text":"Tencent-Hunyuan/C3-Benchmark has notability New benchmark repo, low traction."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has radar lane","object":"Evals and quality","text":"Tencent-Hunyuan/C3-Benchmark has radar lane Evals and quality."}]},"intelligence":{"signal_desk":"repos","answer":"Tencent Hunyuan published Tencent-Hunyuan/C3-Benchmark (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo Tencent-Hunyuan/C3-Benchmark · language Python · New benchmark repo, low traction. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality in the data-business radar.","semantic_triples":[{"subject":"Tencent Hunyuan","predicate":"published repo","object":"Tencent-Hunyuan/C3-Benchmark","text":"Tencent Hunyuan published repo Tencent-Hunyuan/C3-Benchmark."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"is classified as","object":"repo signal","text":"Tencent-Hunyuan/C3-Benchmark is classified as repo signal."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"belongs to","object":"repos desk","text":"Tencent-Hunyuan/C3-Benchmark belongs to repos desk."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has context","object":"Python","text":"Tencent-Hunyuan/C3-Benchmark has context Python."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Tencent-Hunyuan/C3-Benchmark has evidence coverage 1 captured evidence page."},{"subject":"Tencent-Hunyuan/C3-Benchmark","predicate":"matches data-business lanes","object":"Evals and quality","text":"Tencent-Hunyuan/C3-Benchmark matches data-business lanes Evals and quality."}]},"signal":{"id":"d15f4044-37db-464d-81a7-f0d4736b8e72","url":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72","json_url":"https://onlylabs.fyi/signals/d15f4044-37db-464d-81a7-f0d4736b8e72/signal.json","source_url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","title":"Tencent-Hunyuan/C3-Benchmark","summary":"Tencent Hunyuan published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2025-06-26T13:37:43+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/Tencent-Hunyuan/C3-Benchmark"]},"facets":{"repo":"Tencent-Hunyuan/C3-Benchmark","language":"Python"},"traction":{"github_stars":38,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals"}],"score":14,"matched_terms":["benchmark"],"reason":"Tencent Hunyuan has a repo signal matching evals and quality."}},"primary_evidence_page":{"url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","final_url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","title":"Tencent-Hunyuan/C3-Benchmark repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:57:32.506242+00:00","bytes":30613,"raw_path":"dd1e0b35a2deaae3c4a37d2d49f0bb2a06ba2943afdd5941aed40fa30326f2d5.json","content_hash":"855af22efbcfa8040dcc79d794d7b8a7785a51b6b35847e118c185bf04505689","excerpt_chars":1200,"truncated":true,"excerpt":"Tencent-Hunyuan/C3-Benchmark Description: C^3-Bench: The Things Real Disturbing LLM based Agent in Multi-Tasking Language: Python License: NOASSERTION Stars: 38 Forks: 3 Open issues: 0 Created: 2025-06-26T13:37:43Z Pushed: 2026-03-01T15:28:39Z Default branch: main Fork: no Archived: no README: C^3-Bench: The Things Real Disturbing LLM based Agent in Multi-Tasking <p align=\"center\"> 📖 <a>English</a> • <a href=\"README_ZH.md\">中文</a> <br> 🤗 <a href=\"https://huggingface.co/datasets/tencent/C3-BenchMark\">Dataset</a> • 📚 <a href=\"https://arxiv.org/abs/2505.18746\">Preprint Paper</a> </p> ![Example](./picture/first.png) 🎆 News - This repo has moved to https://github.com/yupeijei1997/WildToolBench, Please check our latest progress there. - 2026.1.26 🎉🎉🎉 Our paper <a href=\"https://openreview.net/forum?id=yz7fL5vfpn\">Benchmarking LLM Tool-Use in the Wild</a> is accepted by ICLR 2026! 📖 Overview Agents based on large language models leverage tools to modify environments, revolutionizing how AI interacts with the physical world. Unlike traditional NLP tasks that rely solely on historical dialogue for responses, these agents must consider more complex factors, such as inter-tool..."},"evidence_pages":[{"url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","final_url":"https://github.com/Tencent-Hunyuan/C3-Benchmark","title":"Tencent-Hunyuan/C3-Benchmark repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:57:32.506242+00:00","bytes":30613,"raw_path":"dd1e0b35a2deaae3c4a37d2d49f0bb2a06ba2943afdd5941aed40fa30326f2d5.json","content_hash":"855af22efbcfa8040dcc79d794d7b8a7785a51b6b35847e118c185bf04505689","excerpt_chars":1200,"truncated":true,"excerpt":"Tencent-Hunyuan/C3-Benchmark Description: C^3-Bench: The Things Real Disturbing LLM based Agent in Multi-Tasking Language: Python License: NOASSERTION Stars: 38 Forks: 3 Open issues: 0 Created: 2025-06-26T13:37:43Z Pushed: 2026-03-01T15:28:39Z Default branch: main Fork: no Archived: no README: C^3-Bench: The Things Real Disturbing LLM based Agent in Multi-Tasking <p align=\"center\"> 📖 <a>English</a> • <a href=\"README_ZH.md\">中文</a> <br> 🤗 <a href=\"https://huggingface.co/datasets/tencent/C3-BenchMark\">Dataset</a> • 📚 <a href=\"https://arxiv.org/abs/2505.18746\">Preprint Paper</a> </p> ![Example](./picture/first.png) 🎆 News - This repo has moved to https://github.com/yupeijei1997/WildToolBench, Please check our latest progress there. - 2026.1.26 🎉🎉🎉 Our paper <a href=\"https://openreview.net/forum?id=yz7fL5vfpn\">Benchmarking LLM Tool-Use in the Wild</a> is accepted by ICLR 2026! 📖 Overview Agents based on large language models leverage tools to modify environments, revolutionizing how AI interacts with the physical world. Unlike traditional NLP tasks that rely solely on historical dialogue for responses, these agents must consider more complex factors, such as inter-tool..."}],"related_signals":[{"id":"30ef45dc-aee6-470e-8bb6-1aff274256c4","url":"https://onlylabs.fyi/signals/30ef45dc-aee6-470e-8bb6-1aff274256c4","source_url":"https://github.com/Tencent-Hunyuan/UniRL","title":"Tencent-Hunyuan/UniRL","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-06-08T12:29:36+00:00","first_seen_at":"2026-06-09T07:00:33.142136+00:00","date_source":"source"},{"id":"a4a55c54-84f7-4b5d-b58a-26ff8fa578d7","url":"https://onlylabs.fyi/signals/a4a55c54-84f7-4b5d-b58a-26ff8fa578d7","source_url":"https://github.com/Tencent-Hunyuan/PlanningBench","title":"Tencent-Hunyuan/PlanningBench","context":null,"kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-05-29T02:24:44+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source"},{"id":"7c054af3-8d52-42c8-8d3a-9cf4d0f97e99","url":"https://onlylabs.fyi/signals/7c054af3-8d52-42c8-8d3a-9cf4d0f97e99","source_url":"https://github.com/Tencent-Hunyuan/Precise","title":"Tencent-Hunyuan/Precise","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-05-22T02:07:30+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source"},{"id":"79193606-cf5c-4e28-89fb-30f176808c2f","url":"https://onlylabs.fyi/signals/79193606-cf5c-4e28-89fb-30f176808c2f","source_url":"https://github.com/Tencent-Hunyuan/Hy-MT2","title":"Tencent-Hunyuan/Hy-MT2","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-05-18T07:54:11+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source"},{"id":"f4f4c0ae-5f78-4070-8653-5516eb1f71ee","url":"https://onlylabs.fyi/signals/f4f4c0ae-5f78-4070-8653-5516eb1f71ee","source_url":"https://github.com/Tencent-Hunyuan/Hy-Embodied-RoboFusion","title":"Tencent-Hunyuan/Hy-Embodied-RoboFusion","context":"C","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-05-06T06:20:04+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source"},{"id":"0eb03731-82e8-475f-8a1b-786ca5b4fe59","url":"https://onlylabs.fyi/signals/0eb03731-82e8-475f-8a1b-786ca5b4fe59","source_url":"https://github.com/Tencent-Hunyuan/R-DMesh","title":"Tencent-Hunyuan/R-DMesh","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"tencent-hunyuan","name":"Tencent Hunyuan","category":"frontier-lab"},"occurred_at":"2026-04-29T07:36:06+00:00","first_seen_at":"2026-06-05T21:53:29.068517+00:00","date_source":"source"}]}