{"schema_version":"onlylabs.public_signal.v1","title":"OpenAI Writing: Inside OpenAI’s in-house data agent","description":"OpenAI writing signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de","json_url":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de/signal.json","generated_at":"2026-06-08T15:45:23.082+00:00","org":{"slug":"openai","name":"OpenAI","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/openai","dossier_json_url":"https://onlylabs.fyi/labs/openai/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de","signal_json":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de/signal.json","source":"https://openai.com/index/inside-our-in-house-data-agent","lab_dossier":"https://onlylabs.fyi/labs/openai","lab_dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis":"https://onlylabs.fyi/analysis/openai","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":"https://onlylabs.fyi/topics/talking","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data","json_url":"https://onlylabs.fyi/data-radar/data/signals.json"}]}},"answer_pack":{"answer":"OpenAI published Inside OpenAI’s in-house data agent. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Substantive post but not a major model release. · Inside OpenAI’s in-house data agent | OpenAI January 29, 2026 Inside OpenAI’s in-house data agent By Bonnie Xu, Aravind Suresh, and Emma Tang Loading… Share Data powers.... onlylabs links this event to 1 captured evidence page and 6 related writing signals. It also maps to Data demand in the data-business radar.","signal_desk":"talking","source_context":{"source_url":"https://openai.com/index/inside-our-in-house-data-agent","source_host":"openai.com","occurred_at":"2026-01-29T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","context":null},"context_markers":[{"label":"Lab","value":"OpenAI","source":"signal"},{"label":"Signal desk","value":"talking","source":"signal"},{"label":"Source host","value":"openai.com","source":"source"},{"label":"Notability","value":"Substantive post but not a major model release.","source":"signal"},{"label":"Radar lane","value":"Data demand","source":"radar"},{"label":"Matched term","value":"data","source":"radar"},{"label":"Matched term","value":"dataset","source":"radar"},{"label":"Matched term","value":"datasets","source":"radar"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/inside-our-in-house-data-agent"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-08T15:45:23.082+00:00"},"data_business":{"matches":true,"lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data","json_url":"https://onlylabs.fyi/data-radar/data/signals.json"}],"matched_terms":["data","dataset","datasets"],"score":19,"reason":"OpenAI has a writing signal matching data demand."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de/signal.json","dossier_json":"https://onlylabs.fyi/labs/openai/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/openai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/openai/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/talking/signals.json","topic_feed":"https://onlylabs.fyi/topics/talking/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","evidence_focus":["post title","source URL","captured page text","HN traction","linked model or paper references","publication date"],"extraction_questions":["Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which writing reframes a recent release, model, hiring wave, or policy stance?","Which posts mention data, evals, infrastructure, safety, or deployment workflows?"],"signal_questions":["What public theme, launch framing, or research direction does this writing signal expose?","Which themes are labs choosing to explain publicly?","Which posts are attracting outside discussion?","Which data-business lane explains this signal: Data demand?","Do the 6 related writing signals show a repeated pattern?"],"output_fields":["org","theme","public_framing","traction","data_business_lane","evidence_url"],"data_business_relevance":"Public writing supplies the narrative layer over raw signals and helps identify which frontier-lab priorities are becoming externally legible.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de/signal.json","required":true},{"label":"source","url":"https://openai.com/index/inside-our-in-house-data-agent","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/openai/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/openai/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/talking/signals.json","required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze OpenAI's writing signal \"Inside OpenAI’s in-house data agent\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Inside OpenAI’s in-house data agent","text":"OpenAI published Inside OpenAI’s in-house data agent."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"is classified as","object":"writing signal","text":"Inside OpenAI’s in-house data agent is classified as writing signal."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"belongs to","object":"talking desk","text":"Inside OpenAI’s in-house data agent belongs to talking desk."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Inside OpenAI’s in-house data agent has evidence coverage 1 captured evidence page."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"matches data-business lanes","object":"Data demand","text":"Inside OpenAI’s in-house data agent matches data-business lanes Data demand."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has captured page count","object":"1","text":"Inside OpenAI’s in-house data agent has captured page count 1."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has readable page count","object":"1","text":"Inside OpenAI’s in-house data agent has readable page count 1."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has related signal count","object":"6","text":"Inside OpenAI’s in-house data agent has related signal count 6."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has analysis playbook objective","object":"Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.","text":"Inside OpenAI’s in-house data agent has analysis playbook objective Turn public writing and discussion into a readable map of research themes, product framing, policy posture, launch narratives, and market attention.."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has source host","object":"openai.com","text":"Inside OpenAI’s in-house data agent has source host openai.com."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has lab","object":"OpenAI","text":"Inside OpenAI’s in-house data agent has lab OpenAI."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has signal desk","object":"talking","text":"Inside OpenAI’s in-house data agent has signal desk talking."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has source host","object":"openai.com","text":"Inside OpenAI’s in-house data agent has source host openai.com."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has notability","object":"Substantive post but not a major model release.","text":"Inside OpenAI’s in-house data agent has notability Substantive post but not a major model release.."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has radar lane","object":"Data demand","text":"Inside OpenAI’s in-house data agent has radar lane Data demand."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has matched term","object":"data","text":"Inside OpenAI’s in-house data agent has matched term data."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has matched term","object":"dataset","text":"Inside OpenAI’s in-house data agent has matched term dataset."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has matched term","object":"datasets","text":"Inside OpenAI’s in-house data agent has matched term datasets."}]},"intelligence":{"signal_desk":"talking","answer":"OpenAI published Inside OpenAI’s in-house data agent. This talking signal gives public context for research themes, product direction, policy, or launch framing. High-signal details: Substantive post but not a major model release. · Inside OpenAI’s in-house data agent | OpenAI January 29, 2026 Inside OpenAI’s in-house data agent By Bonnie Xu, Aravind Suresh, and Emma Tang Loading… Share Data powers.... onlylabs links this event to 1 captured evidence page and 6 related writing signals. It also maps to Data demand in the data-business radar.","semantic_triples":[{"subject":"OpenAI","predicate":"published","object":"Inside OpenAI’s in-house data agent","text":"OpenAI published Inside OpenAI’s in-house data agent."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"is classified as","object":"writing signal","text":"Inside OpenAI’s in-house data agent is classified as writing signal."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"belongs to","object":"talking desk","text":"Inside OpenAI’s in-house data agent belongs to talking desk."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"has evidence coverage","object":"1 captured evidence page","text":"Inside OpenAI’s in-house data agent has evidence coverage 1 captured evidence page."},{"subject":"Inside OpenAI’s in-house data agent","predicate":"matches data-business lanes","object":"Data demand","text":"Inside OpenAI’s in-house data agent matches data-business lanes Data demand."}]},"signal":{"id":"c474881f-0699-40b0-8d81-d2863f79e4de","url":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de","json_url":"https://onlylabs.fyi/signals/c474881f-0699-40b0-8d81-d2863f79e4de/signal.json","source_url":"https://openai.com/index/inside-our-in-house-data-agent","title":"Inside OpenAI’s in-house data agent","summary":"OpenAI published a writing signal. onlylabs watches public writing for research themes, product direction, and model-launch context.","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-01-29T10:00:00+00:00","first_seen_at":"2026-06-05T05:42:57.832854+00:00","date_source":"rss.item_date","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["exa"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://openai.com/index/inside-our-in-house-data-agent"]},"facets":{},"traction":{"github_stars":null,"hn_points":70,"hn_comments":23,"hn_story_id":"46814115","hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"data","label":"Data demand","url":"https://onlylabs.fyi/data-radar/data"}],"score":19,"matched_terms":["data","dataset","datasets"],"reason":"OpenAI has a writing signal matching data demand."}},"primary_evidence_page":{"url":"https://openai.com/index/inside-our-in-house-data-agent","final_url":"https://openai.com/index/inside-our-in-house-data-agent","title":"Inside OpenAI’s in-house data agent","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:45:23.082+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Inside OpenAI’s in-house data agent | OpenAI January 29, 2026 Inside OpenAI’s in-house data agent By Bonnie Xu, Aravind Suresh, and Emma Tang Loading… Share Data powers how systems learn, products evolve, and how companies make choices. But getting answers quickly, correctly, and with the right context is often harder than it should be. To make this easier as OpenAI scales, we built our own bespoke in-house AI data agent that explores and reasons over our own platform. Our agent is a custom internal-only tool (not an external offering), built specifically around OpenAI’s data, permissions, and workflows. We’re showing how we built and use it to help surface examples of the real, impactful ways AI can support day-to-day work across our teams. The OpenAI tools we used to build and run it (Codex, our GPT‑5 flagship model, the Evals API⁠, and the Embeddings API⁠) are the same tools we make available to developers everywhere. Our data agent lets employees go from question to insight in minutes, not days. This lowers the bar to pulling data and nuanced analysis across all functions, not just by our data team. Today, teams across Engineering, Data Science, Go-To-Market, Finance, and..."},"evidence_pages":[{"url":"https://openai.com/index/inside-our-in-house-data-agent","final_url":"https://openai.com/index/inside-our-in-house-data-agent","title":"Inside OpenAI’s in-house data agent","http_status":200,"content_type":null,"capture_method":"exa","fetched_at":"2026-06-08T15:45:23.082+00:00","bytes":null,"raw_path":null,"content_hash":null,"excerpt_chars":1200,"truncated":true,"excerpt":"Inside OpenAI’s in-house data agent | OpenAI January 29, 2026 Inside OpenAI’s in-house data agent By Bonnie Xu, Aravind Suresh, and Emma Tang Loading… Share Data powers how systems learn, products evolve, and how companies make choices. But getting answers quickly, correctly, and with the right context is often harder than it should be. To make this easier as OpenAI scales, we built our own bespoke in-house AI data agent that explores and reasons over our own platform. Our agent is a custom internal-only tool (not an external offering), built specifically around OpenAI’s data, permissions, and workflows. We’re showing how we built and use it to help surface examples of the real, impactful ways AI can support day-to-day work across our teams. The OpenAI tools we used to build and run it (Codex, our GPT‑5 flagship model, the Evals API⁠, and the Embeddings API⁠) are the same tools we make available to developers everywhere. Our data agent lets employees go from question to insight in minutes, not days. This lowers the bar to pulling data and nuanced analysis across all functions, not just by our data team. Today, teams across Engineering, Data Science, Go-To-Market, Finance, and..."}],"related_signals":[{"id":"b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","url":"https://onlylabs.fyi/signals/b3668d3b-26d2-40c0-9d4f-ed1a67927aa4","source_url":"https://openai.com/index/supporting-eu-trustworthy-ai-ecosystem","title":"Supporting Europe’s work in ensuring a trustworthy AI ecosystem ","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T08:00:56.140796+00:00","date_source":"rss.item_date"},{"id":"2638c0a7-b372-409c-ac72-f6d81d6464dc","url":"https://onlylabs.fyi/signals/2638c0a7-b372-409c-ac72-f6d81d6464dc","source_url":"https://openai.com/index/using-codex-to-simulate-black-holes","title":"How an astrophysicist uses Codex to help simulate black holes","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-11T00:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"509ea784-51ec-4ede-855b-5a4d1b27d3be","url":"https://onlylabs.fyi/signals/509ea784-51ec-4ede-855b-5a4d1b27d3be","source_url":"https://openai.com/index/openai-on-oracle-cloud","title":"Access OpenAI models and Codex through your Oracle cloud commitment","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T20:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4f051449-87f2-466e-941e-b5918381a8fe","url":"https://onlylabs.fyi/signals/4f051449-87f2-466e-941e-b5918381a8fe","source_url":"https://openai.com/index/prc-linked-influence-operations-ai-debates","title":"PRC-linked influence operations are targeting AI debates in the US","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T12:00:00+00:00","first_seen_at":"2026-06-11T07:01:16.936464+00:00","date_source":"rss.item_date"},{"id":"4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","url":"https://onlylabs.fyi/signals/4507c0c1-cb74-4bb3-b62b-5f6c2d37e20d","source_url":"https://openai.com/index/lseg","title":"From data to decisions: how LSEG is scaling trusted AI","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-10T00:00:00+00:00","first_seen_at":"2026-06-10T09:18:54.26094+00:00","date_source":"rss.item_date"},{"id":"fb16aa7a-c4ef-4859-b514-0839c2f1330d","url":"https://onlylabs.fyi/signals/fb16aa7a-c4ef-4859-b514-0839c2f1330d","source_url":"https://openai.com/index/nextdoor","title":"How engineers at Nextdoor use Codex to build without limits","context":null,"kind":{"key":"post_published","label":"Writing"},"org":{"slug":"openai","name":"OpenAI","category":"frontier-lab"},"occurred_at":"2026-06-09T12:00:00+00:00","first_seen_at":"2026-06-10T07:01:28.700378+00:00","date_source":"rss.item_date"}]}