{"schema_version":"onlylabs.public_signal.v1","title":"Anthropic Repo: anthropics/rogue-deploy-eval","description":"Anthropic repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11","json_url":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11/signal.json","generated_at":"2026-06-11T03:59:12.476466+00:00","org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/anthropic","dossier_json_url":"https://onlylabs.fyi/labs/anthropic/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11","signal_json":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11/signal.json","source":"https://github.com/anthropics/rogue-deploy-eval","lab_dossier":"https://onlylabs.fyi/labs/anthropic","lab_dossier_json":"https://onlylabs.fyi/labs/anthropic/dossier.json","analysis":"https://onlylabs.fyi/analysis/anthropic","analysis_json":"https://onlylabs.fyi/analysis/anthropic/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/anthropic/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}]}},"answer_pack":{"answer":"Anthropic published 
anthropics/rogue-deploy-eval (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo anthropics/rogue-deploy-eval · language Python · Low traction (15 stars) for a new repo from Anthropic, likely a routine research tool. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality in the data-business radar.","signal_desk":"repos","source_context":{"source_url":"https://github.com/anthropics/rogue-deploy-eval","source_host":"github.com","occurred_at":"2024-11-05T15:21:13+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source","context":"Python"},"context_markers":[{"label":"Lab","value":"Anthropic","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"anthropics/rogue-deploy-eval","source":"source"},{"label":"Language","value":"Python","source":"source"},{"label":"Stars","value":"15","source":"traction"},{"label":"Notability","value":"Low traction (15 stars) for a new repo from Anthropic, likely a routine research tool.","source":"signal"},{"label":"Radar lane","value":"Evals and quality","source":"radar"},{"label":"Matched term","value":"eval","source":"radar"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Safety and 
alignment","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/anthropics/rogue-deploy-eval"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:59:12.476466+00:00"},"data_business":{"matches":true,"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}],"matched_terms":["eval"],"score":14,"reason":"Anthropic has a repo signal matching evals and quality."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11/signal.json","dossier_json":"https://onlylabs.fyi/labs/anthropic/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/anthropic/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/anthropic/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this 
repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Which data-business lane explains this signal: Evals and quality?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11/signal.json","required":true},{"label":"source","url":"https://github.com/anthropics/rogue-deploy-eval","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/anthropic/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/anthropic/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Anthropic's repo signal \"anthropics/rogue-deploy-eval\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"Anthropic","predicate":"published repo","object":"anthropics/rogue-deploy-eval","text":"Anthropic published repo anthropics/rogue-deploy-eval."},{"subject":"anthropics/rogue-deploy-eval","predicate":"is classified as","object":"repo signal","text":"anthropics/rogue-deploy-eval is classified as repo signal."},{"subject":"anthropics/rogue-deploy-eval","predicate":"belongs to","object":"repos desk","text":"anthropics/rogue-deploy-eval belongs to repos 
desk."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has context","object":"Python","text":"anthropics/rogue-deploy-eval has context Python."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has evidence coverage","object":"1 captured evidence page","text":"anthropics/rogue-deploy-eval has evidence coverage 1 captured evidence page."},{"subject":"anthropics/rogue-deploy-eval","predicate":"matches data-business lanes","object":"Evals and quality","text":"anthropics/rogue-deploy-eval matches data-business lanes Evals and quality."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has captured page count","object":"1","text":"anthropics/rogue-deploy-eval has captured page count 1."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has readable page count","object":"1","text":"anthropics/rogue-deploy-eval has readable page count 1."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has related signal count","object":"6","text":"anthropics/rogue-deploy-eval has related signal count 6."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"anthropics/rogue-deploy-eval has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has source host","object":"github.com","text":"anthropics/rogue-deploy-eval has source host github.com."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has lab","object":"Anthropic","text":"anthropics/rogue-deploy-eval has lab Anthropic."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has signal desk","object":"repos","text":"anthropics/rogue-deploy-eval has signal desk 
repos."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has source host","object":"github.com","text":"anthropics/rogue-deploy-eval has source host github.com."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has repository","object":"anthropics/rogue-deploy-eval","text":"anthropics/rogue-deploy-eval has repository anthropics/rogue-deploy-eval."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has language","object":"Python","text":"anthropics/rogue-deploy-eval has language Python."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has stars","object":"15","text":"anthropics/rogue-deploy-eval has stars 15."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has notability","object":"Low traction (15 stars) for a new repo from Anthropic, likely a routine research tool.","text":"anthropics/rogue-deploy-eval has notability Low traction (15 stars) for a new repo from Anthropic, likely a routine research tool."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has radar lane","object":"Evals and quality","text":"anthropics/rogue-deploy-eval has radar lane Evals and quality."}]},"intelligence":{"signal_desk":"repos","answer":"Anthropic published anthropics/rogue-deploy-eval (Python). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo anthropics/rogue-deploy-eval · language Python · Low traction (15 stars) for a new repo from Anthropic, likely a routine research tool. onlylabs links this event to 1 captured evidence page and 6 related repo signals. 
It also maps to Evals and quality in the data-business radar.","semantic_triples":[{"subject":"Anthropic","predicate":"published repo","object":"anthropics/rogue-deploy-eval","text":"Anthropic published repo anthropics/rogue-deploy-eval."},{"subject":"anthropics/rogue-deploy-eval","predicate":"is classified as","object":"repo signal","text":"anthropics/rogue-deploy-eval is classified as repo signal."},{"subject":"anthropics/rogue-deploy-eval","predicate":"belongs to","object":"repos desk","text":"anthropics/rogue-deploy-eval belongs to repos desk."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has context","object":"Python","text":"anthropics/rogue-deploy-eval has context Python."},{"subject":"anthropics/rogue-deploy-eval","predicate":"has evidence coverage","object":"1 captured evidence page","text":"anthropics/rogue-deploy-eval has evidence coverage 1 captured evidence page."},{"subject":"anthropics/rogue-deploy-eval","predicate":"matches data-business lanes","object":"Evals and quality","text":"anthropics/rogue-deploy-eval matches data-business lanes Evals and quality."}]},"signal":{"id":"6de2a0af-fc46-4e1b-ae79-6fd234e0fe11","url":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11","json_url":"https://onlylabs.fyi/signals/6de2a0af-fc46-4e1b-ae79-6fd234e0fe11/signal.json","source_url":"https://github.com/anthropics/rogue-deploy-eval","title":"anthropics/rogue-deploy-eval","summary":"Anthropic published a new repository. 
onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2024-11-05T15:21:13+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/anthropics/rogue-deploy-eval"]},"facets":{"repo":"anthropics/rogue-deploy-eval","language":"Python"},"traction":{"github_stars":15,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals"}],"score":14,"matched_terms":["eval"],"reason":"Anthropic has a repo signal matching evals and quality."}},"primary_evidence_page":{"url":"https://github.com/anthropics/rogue-deploy-eval","final_url":"https://github.com/anthropics/rogue-deploy-eval","title":"anthropics/rogue-deploy-eval repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:59:12.476466+00:00","bytes":8837,"raw_path":"02349755377932ed7a2a523542a85766084280a3d25f728b7e70f9c807f222d6.json","content_hash":"a251acc359f5812bc0f5803f2fba1c80674b3524b610293937ddebc5346d94b5","excerpt_chars":1200,"truncated":false,"excerpt":"anthropics/rogue-deploy-eval Language: Python License: MIT Stars: 15 Forks: 7 Open issues: 0 Created: 2024-11-05T15:21:13Z Pushed: 2025-01-21T14:20:23Z Default branch: main Fork: no Archived: yes README: A toy evaluation of inference code tampering This is the code for [this blog post](https://alignment.anthropic.com/2024/rogue-eval/). 
This allows running a semi-quantitative evaluation of a model's ability to write code that modifies a simple generation function to disable the generation monitor while solving another task. How to use this code To run the experiment 1. Fill the places in the repository that are 'TO_FILL', as our experiments relied on private tools for GPU code execution and LLM inference. 2. Run the notebook `rogue_deploy/simple_pipeline.py` 3. Run the notebook `rogue_deploy/print_pipeline.py`"},"evidence_pages":[{"url":"https://github.com/anthropics/rogue-deploy-eval","final_url":"https://github.com/anthropics/rogue-deploy-eval","title":"anthropics/rogue-deploy-eval repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:59:12.476466+00:00","bytes":8837,"raw_path":"02349755377932ed7a2a523542a85766084280a3d25f728b7e70f9c807f222d6.json","content_hash":"a251acc359f5812bc0f5803f2fba1c80674b3524b610293937ddebc5346d94b5","excerpt_chars":1200,"truncated":false,"excerpt":"anthropics/rogue-deploy-eval Language: Python License: MIT Stars: 15 Forks: 7 Open issues: 0 Created: 2024-11-05T15:21:13Z Pushed: 2025-01-21T14:20:23Z Default branch: main Fork: no Archived: yes README: A toy evaluation of inference code tampering This is the code for [this blog post](https://alignment.anthropic.com/2024/rogue-eval/). This allows running a semi-quantitative evaluation of a model's ability to write code that modifies a simple generation function to disable the generation monitor while solving another task. How to use this code To run the experiment 1. Fill the places in the repository that are 'TO_FILL', as our experiments relied on private tools for GPU code execution and LLM inference. 2. Run the notebook `rogue_deploy/simple_pipeline.py` 3. 
Run the notebook `rogue_deploy/print_pipeline.py`"}],"related_signals":[{"id":"d655a3de-1616-4e38-b9a0-27254762c1f0","url":"https://onlylabs.fyi/signals/d655a3de-1616-4e38-b9a0-27254762c1f0","source_url":"https://github.com/anthropics/defending-code-reference-harness","title":"anthropics/defending-code-reference-harness","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-22T16:00:56+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source"},{"id":"f91bba87-e295-4641-8aa0-9fa254e149b1","url":"https://onlylabs.fyi/signals/f91bba87-e295-4641-8aa0-9fa254e149b1","source_url":"https://github.com/anthropics/ClaudeForFoundationModels","title":"anthropics/ClaudeForFoundationModels","context":"Swift","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-20T15:41:18+00:00","first_seen_at":"2026-06-09T07:00:07.44979+00:00","date_source":"source"},{"id":"7f417861-19b7-493f-b6d7-bf9ef54a9a1f","url":"https://onlylabs.fyi/signals/7f417861-19b7-493f-b6d7-bf9ef54a9a1f","source_url":"https://github.com/anthropics/cargo-nix-plugin","title":"anthropics/cargo-nix-plugin","context":"Rust","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-19T17:07:44+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source"},{"id":"0c515bfd-ccd4-4a21-868f-944fd4945f19","url":"https://onlylabs.fyi/signals/0c515bfd-ccd4-4a21-868f-944fd4945f19","source_url":"https://github.com/anthropics/scone-bench","title":"anthropics/scone-bench","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-12T22:17:19+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source"},{"id":"7f529da9-d1d8
-4424-aaf5-face018ae4f8","url":"https://onlylabs.fyi/signals/7f529da9-d1d8-4424-aaf5-face018ae4f8","source_url":"https://github.com/anthropics/html-effectiveness","title":"anthropics/html-effectiveness","context":"HTML","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-12T06:25:16+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source"},{"id":"3ea41c6f-444c-4f24-a8f7-ad037263bde0","url":"https://onlylabs.fyi/signals/3ea41c6f-444c-4f24-a8f7-ad037263bde0","source_url":"https://github.com/anthropics/cwc-workshops","title":"anthropics/cwc-workshops","context":"TypeScript","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"anthropic","name":"Anthropic","category":"frontier-lab"},"occurred_at":"2026-05-06T03:53:01+00:00","first_seen_at":"2026-06-05T05:42:58.841369+00:00","date_source":"source"}]}