{"schema_version":"onlylabs.public_signal.v1","title":"InclusionAI (Ant Group) Writing: ABench: An Evolving Open-Source Benchmark","description":"InclusionAI (Ant Group) writing signal with public source context, captured evidence pages, related signals, and category-scoped analysis context.","url":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3","json_url":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3/signal.json","generated_at":"2026-06-11T03:23:10.427618+00:00","org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab","category_label":"Neolab","dossier_url":"https://onlylabs.fyi/labs/inclusionai","dossier_json_url":"https://onlylabs.fyi/labs/inclusionai/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3","signal_json":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3/signal.json","source":"https://www.inclusion-ai.org/blog/abench","lab_dossier":"https://onlylabs.fyi/labs/inclusionai","lab_dossier_json":"https://onlylabs.fyi/labs/inclusionai/dossier.json","analysis":"https://onlylabs.fyi/analysis/inclusionai","analysis_json":"https://onlylabs.fyi/analysis/inclusionai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/inclusionai/evidence.json","category":"https://onlylabs.fyi/neolabs","category_json":"https://onlylabs.fyi/neolabs.json","category_feed":"https://onlylabs.fyi/neolabs/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json?category=neolab","topic":"https://onlylabs.fyi/topics/talking","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json?category=neolab","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml?category=neolab","data_business":null},"answer_pack":{"answer":"InclusionAI (Ant Group) published ABench: An Evolving Open-Source Benchmark. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: New open-source benchmark, no traction data · ABench: An Evolving Open-Source Benchmark | INCLUSION AI Skip to main content GITHUB 🌟 Overview ​ ABench is an evolving open-source benchmark suite designed to.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","signal_desk":"talking","source_context":{"source_url":"https://www.inclusion-ai.org/blog/abench","source_host":"inclusion-ai.org","occurred_at":"2025-07-08T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date","context":null},"context_markers":[{"label":"Lab","value":"InclusionAI (Ant Group)","source":"signal"},{"label":"Signal desk","value":"talking","source":"signal"},{"label":"Source host","value":"inclusion-ai.org","source":"source"},{"label":"Author","value":"ospo@antgroup.com (inclusionAI)","source":"source"},{"label":"Notability","value":"New open-source benchmark, no traction data","source":"signal"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Safety and alignment","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://www.inclusion-ai.org/blog/abench"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:23:10.427618+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3/signal.json","dossier_json":"https://onlylabs.fyi/labs/inclusionai/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/inclusionai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/inclusionai/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json?category=neolab","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml?category=neolab","category_signals_json":"https://onlylabs.fyi/signals.json?category=neolab","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","evidence_focus":["post title","source URL","captured page text","HN traction","linked model or paper references","publication date"],"extraction_questions":["Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which writing reframes a recent release, model, hiring wave, or policy stance?","Which posts mention data, evals, infrastructure, safety, or deployment workflows?"],"signal_questions":["What public theme, launch framing, or research direction does this writing signal expose?","Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Do the 6 related writing signals show a repeated pattern?"],"output_fields":["org","theme","public_framing","traction","evidence_url"],"data_business_relevance":"Data-business lane extraction is scoped to frontier labs; for this category, keep conclusions tied to category-specific strategy, source evidence, and follow-up questions.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3/signal.json","required":true},{"label":"source","url":"https://www.inclusion-ai.org/blog/abench","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/inclusionai/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/inclusionai/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/talking/signals.json?category=neolab","required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze InclusionAI (Ant Group)'s writing signal \"ABench: An Evolving Open-Source Benchmark\" for neolab strategy."},"semantic_triples":[{"subject":"InclusionAI (Ant Group)","predicate":"published","object":"ABench: An Evolving Open-Source Benchmark","text":"InclusionAI (Ant Group) published ABench: An Evolving Open-Source Benchmark."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"is classified as","object":"writing signal","text":"ABench: An Evolving Open-Source Benchmark is classified as writing signal."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"belongs to","object":"talking desk","text":"ABench: An Evolving Open-Source Benchmark belongs to talking desk."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"ABench: An Evolving Open-Source Benchmark has evidence coverage 1 captured evidence page."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has captured page count","object":"1","text":"ABench: An Evolving Open-Source Benchmark has captured page count 1."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has readable page count","object":"1","text":"ABench: An Evolving Open-Source Benchmark has readable page count 1."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has related signal count","object":"6","text":"ABench: An Evolving Open-Source Benchmark has related signal count 6."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has analysis playbook objective","object":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","text":"ABench: An Evolving Open-Source Benchmark has analysis playbook objective Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has source host","object":"inclusion-ai.org","text":"ABench: An Evolving Open-Source Benchmark has source host inclusion-ai.org."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has lab","object":"InclusionAI (Ant Group)","text":"ABench: An Evolving Open-Source Benchmark has lab InclusionAI (Ant Group)."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has signal desk","object":"talking","text":"ABench: An Evolving Open-Source Benchmark has signal desk talking."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has source host","object":"inclusion-ai.org","text":"ABench: An Evolving Open-Source Benchmark has source host inclusion-ai.org."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has author","object":"ospo@antgroup.com (inclusionAI)","text":"ABench: An Evolving Open-Source Benchmark has author ospo@antgroup.com (inclusionAI)."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has notability","object":"New open-source benchmark, no traction data","text":"ABench: An Evolving Open-Source Benchmark has notability New open-source benchmark, no traction data."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has watch term","object":"Eval methodology","text":"ABench: An Evolving Open-Source Benchmark has watch term Eval methodology."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has watch term","object":"Data pipeline","text":"ABench: An Evolving Open-Source Benchmark has watch term Data pipeline."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has watch term","object":"Safety and alignment","text":"ABench: An Evolving Open-Source Benchmark has watch term Safety and alignment."}]},"intelligence":{"signal_desk":"talking","answer":"InclusionAI (Ant Group) published ABench: An Evolving Open-Source Benchmark. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: New open-source benchmark, no traction data · ABench: An Evolving Open-Source Benchmark | INCLUSION AI Skip to main content GITHUB 🌟 Overview ​ ABench is an evolving open-source benchmark suite designed to.... onlylabs links this event to 1 captured evidence page and 6 related writing signals.","semantic_triples":[{"subject":"InclusionAI (Ant Group)","predicate":"published","object":"ABench: An Evolving Open-Source Benchmark","text":"InclusionAI (Ant Group) published ABench: An Evolving Open-Source Benchmark."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"is classified as","object":"writing signal","text":"ABench: An Evolving Open-Source Benchmark is classified as writing signal."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"belongs to","object":"talking desk","text":"ABench: An Evolving Open-Source Benchmark belongs to talking desk."},{"subject":"ABench: An Evolving Open-Source Benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"ABench: An Evolving Open-Source Benchmark has evidence coverage 1 captured evidence page."}]},"signal":{"id":"dd5ec616-9ce6-4065-8f85-a3688a2875b3","url":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3","json_url":"https://onlylabs.fyi/signals/dd5ec616-9ce6-4065-8f85-a3688a2875b3/signal.json","source_url":"https://www.inclusion-ai.org/blog/abench","title":"ABench: An Evolving Open-Source Benchmark","summary":"InclusionAI (Ant Group) published a writing signal. onlylabs watches public writing for research themes, product direction, and model-launch context.","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2025-07-08T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://www.inclusion-ai.org/blog/abench"]},"facets":{},"traction":{"github_stars":null,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://www.inclusion-ai.org/blog/abench","final_url":"https://www.inclusion-ai.org/blog/abench/","title":"ABench: An Evolving Open-Source Benchmark","http_status":200,"content_type":"text/html; charset=utf-8","capture_method":"plain","fetched_at":"2026-06-11T03:23:10.427618+00:00","bytes":18787,"raw_path":"7d0cf91c96f40fe875ac9c8f4e4638dd0b1965a93efe6cc5ad180526f58242df.html","content_hash":"3d7c047a80b3a15e05cd9f1e2379b3f68d110448615e1e803982c1ea12cf9df9","excerpt_chars":1200,"truncated":true,"excerpt":"ABench: An Evolving Open-Source Benchmark | INCLUSION AI Skip to main content GITHUB 🌟 Overview ​ ABench is an evolving open-source benchmark suite designed to rigorously evaluate and enhance Large Language Models (LLMs) on complex cross-domain tasks . By targeting current model weaknesses, ABench provides systematic challenges in high-difficulty specialized domains , including physics, actuarial science, logical reasoning, law, and psychology. 🎯 Core Objectives ​ Address Evaluation Gaps : Design high-differentiation assessment tasks targeting underperforming question types Establish Unified Standards : Create reliable, comparable benchmarks for multi-domain LLM evaluation Expand Capability Boundaries : Drive continuous optimization of knowledge systems and reasoning mechanisms through challenging innovative problems 📊 Dataset Release Status ​ Domain Description Status Physics 500 university/competition-level physics problems (400 static + 100 dynamic parametric variants) covering 10+ fields from classical mechanics to modern physics ✅ Released Actuary Curated actuarial exam problems covering core topics: probability statistics, financial mathematics, life/non-life insurance,..."},"evidence_pages":[{"url":"https://www.inclusion-ai.org/blog/abench","final_url":"https://www.inclusion-ai.org/blog/abench/","title":"ABench: An Evolving Open-Source Benchmark","http_status":200,"content_type":"text/html; charset=utf-8","capture_method":"plain","fetched_at":"2026-06-11T03:23:10.427618+00:00","bytes":18787,"raw_path":"7d0cf91c96f40fe875ac9c8f4e4638dd0b1965a93efe6cc5ad180526f58242df.html","content_hash":"3d7c047a80b3a15e05cd9f1e2379b3f68d110448615e1e803982c1ea12cf9df9","excerpt_chars":1200,"truncated":true,"excerpt":"ABench: An Evolving Open-Source Benchmark | INCLUSION AI Skip to main content GITHUB 🌟 Overview ​ ABench is an evolving open-source benchmark suite designed to rigorously evaluate and enhance Large Language Models (LLMs) on complex cross-domain tasks . By targeting current model weaknesses, ABench provides systematic challenges in high-difficulty specialized domains , including physics, actuarial science, logical reasoning, law, and psychology. 🎯 Core Objectives ​ Address Evaluation Gaps : Design high-differentiation assessment tasks targeting underperforming question types Establish Unified Standards : Create reliable, comparable benchmarks for multi-domain LLM evaluation Expand Capability Boundaries : Drive continuous optimization of knowledge systems and reasoning mechanisms through challenging innovative problems 📊 Dataset Release Status ​ Domain Description Status Physics 500 university/competition-level physics problems (400 static + 100 dynamic parametric variants) covering 10+ fields from classical mechanics to modern physics ✅ Released Actuary Curated actuarial exam problems covering core topics: probability statistics, financial mathematics, life/non-life insurance,..."}],"related_signals":[{"id":"2cbb5136-91f1-45ad-ab49-648a7e5cdf57","url":"https://onlylabs.fyi/signals/2cbb5136-91f1-45ad-ab49-648a7e5cdf57","source_url":"https://www.inclusion-ai.org/blog/agentic-landscape-in-2026-Q1","title":"Taking the Pulse of Agentic AI from the Developer Community at the End of Q1 2026","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2026-04-01T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"},{"id":"5e1cfc8a-4c7d-492f-a99f-dd64392daa52","url":"https://onlylabs.fyi/signals/5e1cfc8a-4c7d-492f-a99f-dd64392daa52","source_url":"https://www.inclusion-ai.org/blog/ming-omni-tts","title":"Ming-Omni-TTS: Simple and Efficient Unified Generation of Speech, Music, and Sound with Precise Control","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2026-03-04T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"},{"id":"957b8d9f-1548-4ee4-a149-d34b39ed4dea","url":"https://onlylabs.fyi/signals/957b8d9f-1548-4ee4-a149-d34b39ed4dea","source_url":"https://www.inclusion-ai.org/blog/llm-landscape-vllm-sgl","title":"The Community Stories of vLLM and SGLang","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2025-12-17T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"},{"id":"12b75563-2758-4e3e-9e19-672d996b030c","url":"https://onlylabs.fyi/signals/12b75563-2758-4e3e-9e19-672d996b030c","source_url":"https://www.inclusion-ai.org/blog/ming-flash-omni-preview","title":"Ming-flash-omni-Preview: A Sparse, Unified Architecture for Multimodal Perception and Generation","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2025-10-28T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"},{"id":"1fb31514-221f-4f68-bbdf-52eae4fa2366","url":"https://onlylabs.fyi/signals/1fb31514-221f-4f68-bbdf-52eae4fa2366","source_url":"https://www.inclusion-ai.org/blog/llm-landscape-2-0","title":"Open Source LLM Development Landscape 2.0: 2025 Revisited","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2025-10-11T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"},{"id":"6443bea9-11eb-40ed-9c4f-9648b55c8137","url":"https://onlylabs.fyi/signals/6443bea9-11eb-40ed-9c4f-9648b55c8137","source_url":"https://www.inclusion-ai.org/blog/ming-uniaudio","title":"Ming-UniAudio: Speech LLM for Joint Understanding, Generation and Editing with Unified Representation","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"inclusionai","name":"InclusionAI (Ant Group)","category":"neolab"},"occurred_at":"2025-10-01T00:00:00+00:00","first_seen_at":"2026-06-05T22:32:23.327834+00:00","date_source":"rss.item_date"}]}