{"schema_version":"onlylabs.public_signal.v1","title":"Fireworks AI Fork: fw-ai/llama-cuda-graph-example","description":"Fireworks AI fork signal with public source context, captured evidence pages, related signals, and category-scoped analysis context.","url":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc","json_url":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc/signal.json","generated_at":"2026-06-11T04:19:34.484772+00:00","org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud","category_label":"Neocloud","dossier_url":"https://onlylabs.fyi/labs/fireworks-ai","dossier_json_url":"https://onlylabs.fyi/labs/fireworks-ai/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc","signal_json":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc/signal.json","source":"https://github.com/fw-ai/llama-cuda-graph-example","lab_dossier":"https://onlylabs.fyi/labs/fireworks-ai","lab_dossier_json":"https://onlylabs.fyi/labs/fireworks-ai/dossier.json","analysis":"https://onlylabs.fyi/analysis/fireworks-ai","analysis_json":"https://onlylabs.fyi/analysis/fireworks-ai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/fireworks-ai/evidence.json","category":"https://onlylabs.fyi/neoclouds","category_json":"https://onlylabs.fyi/neoclouds.json","category_feed":"https://onlylabs.fyi/neoclouds/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json?category=neocloud","topic":"https://onlylabs.fyi/topics/forks","topic_signals_json":"https://onlylabs.fyi/topics/forks/signals.json?category=neocloud","topic_feed":"https://onlylabs.fyi/topics/forks/feed.xml?category=neocloud","data_business":null},"answer_pack":{"answer":"Fireworks AI forked fw-ai/llama-cuda-graph-example (forked from meta-llama/llama). This fork signal points to upstream code the lab may be inspecting, patching, or building on. 
High-signal details: repo fw-ai/llama-cuda-graph-example · parent meta-llama/llama. onlylabs links this event to 1 captured evidence page and 6 related fork signals.","signal_desk":"forks","source_context":{"source_url":"https://github.com/fw-ai/llama-cuda-graph-example","source_host":"github.com","occurred_at":"2023-08-16T21:36:02+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source","context":"forked from meta-llama/llama"},"context_markers":[{"label":"Lab","value":"Fireworks AI","source":"signal"},{"label":"Signal desk","value":"forks","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"fw-ai/llama-cuda-graph-example","source":"source"},{"label":"Parent","value":"meta-llama/llama","source":"source"},{"label":"Stars","value":"11","source":"traction"},{"label":"Watch term","value":"Model card","source":"model"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Safety and 
alignment","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/fw-ai/llama-cuda-graph-example"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T04:19:34.484772+00:00"},"data_business":{"matches":false,"lanes":[],"matched_terms":[],"score":null,"reason":null},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc/signal.json","dossier_json":"https://onlylabs.fyi/labs/fireworks-ai/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/fireworks-ai/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/fireworks-ai/evidence.json","topic_signals_json":"https://onlylabs.fyi/topics/forks/signals.json?category=neocloud","topic_feed":"https://onlylabs.fyi/topics/forks/feed.xml?category=neocloud","category_signals_json":"https://onlylabs.fyi/signals.json?category=neocloud","data_radar_json":null,"opportunities_json":null},"analysis_playbook":{"objective":"Turn fork activity into a map of upstream tools, libraries, model utilities, agent frameworks, and research dependencies being inspected or adapted.","evidence_focus":["forked parent repo","repo owner","language","description","stars","org and recency"],"extraction_questions":["Which upstream projects are repeated across labs?","Which forks point to evals, agents, infrastructure, model tooling, or data pipelines?","Which low-profile forks could precede a release or hiring wave?","Which labs are converging on the same technical adjacency?"],"signal_questions":["What upstream dependency or technical adjacency does this fork reveal?","Which upstream projects are repeated across labs?","Which forks point to evals, agents, infrastructure, model tooling, or data pipelines?","Do the 6 related fork signals show a repeated 
pattern?"],"output_fields":["org","upstream_repo","language","technical_theme","evidence_url"],"data_business_relevance":"Data-business lane extraction is scoped to frontier labs; for this category, keep conclusions tied to category-specific strategy, source evidence, and follow-up questions.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc/signal.json","required":true},{"label":"source","url":"https://github.com/fw-ai/llama-cuda-graph-example","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/fireworks-ai/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/fireworks-ai/evidence.json","required":true},{"label":"topic_signals_json","url":"https://onlylabs.fyi/topics/forks/signals.json?category=neocloud","required":false},{"label":"data_radar_json","url":null,"required":false}],"expected_output":["one-paragraph source-grounded interpretation","category-specific implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Fireworks AI's fork signal \"fw-ai/llama-cuda-graph-example\" for neocloud strategy."},"semantic_triples":[{"subject":"Fireworks AI","predicate":"forked","object":"fw-ai/llama-cuda-graph-example","text":"Fireworks AI forked fw-ai/llama-cuda-graph-example."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"is classified as","object":"fork signal","text":"fw-ai/llama-cuda-graph-example is classified as fork signal."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"belongs to","object":"forks desk","text":"fw-ai/llama-cuda-graph-example belongs to forks desk."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has context","object":"forked from meta-llama/llama","text":"fw-ai/llama-cuda-graph-example has context forked from 
meta-llama/llama."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has evidence coverage","object":"1 captured evidence page","text":"fw-ai/llama-cuda-graph-example has evidence coverage 1 captured evidence page."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has captured page count","object":"1","text":"fw-ai/llama-cuda-graph-example has captured page count 1."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has readable page count","object":"1","text":"fw-ai/llama-cuda-graph-example has readable page count 1."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has related signal count","object":"6","text":"fw-ai/llama-cuda-graph-example has related signal count 6."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has analysis playbook objective","object":"Turn fork activity into a map of upstream tools, libraries, model utilities, agent frameworks, and research dependencies being inspected or adapted.","text":"fw-ai/llama-cuda-graph-example has analysis playbook objective Turn fork activity into a map of upstream tools, libraries, model utilities, agent frameworks, and research dependencies being inspected or adapted."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has source host","object":"github.com","text":"fw-ai/llama-cuda-graph-example has source host github.com."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has lab","object":"Fireworks AI","text":"fw-ai/llama-cuda-graph-example has lab Fireworks AI."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has signal desk","object":"forks","text":"fw-ai/llama-cuda-graph-example has signal desk forks."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has source host","object":"github.com","text":"fw-ai/llama-cuda-graph-example has source host github.com."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has repository","object":"fw-ai/llama-cuda-graph-example","text":"fw-ai/llama-cuda-graph-example has repository 
fw-ai/llama-cuda-graph-example."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has parent","object":"meta-llama/llama","text":"fw-ai/llama-cuda-graph-example has parent meta-llama/llama."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has stars","object":"11","text":"fw-ai/llama-cuda-graph-example has stars 11."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has watch term","object":"Model card","text":"fw-ai/llama-cuda-graph-example has watch term Model card."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has watch term","object":"Infrastructure","text":"fw-ai/llama-cuda-graph-example has watch term Infrastructure."}]},"intelligence":{"signal_desk":"forks","answer":"Fireworks AI forked fw-ai/llama-cuda-graph-example (forked from meta-llama/llama). This fork signal points to upstream code the lab may be inspecting, patching, or building on. High-signal details: repo fw-ai/llama-cuda-graph-example · parent meta-llama/llama. onlylabs links this event to 1 captured evidence page and 6 related fork signals.","semantic_triples":[{"subject":"Fireworks AI","predicate":"forked","object":"fw-ai/llama-cuda-graph-example","text":"Fireworks AI forked fw-ai/llama-cuda-graph-example."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"is classified as","object":"fork signal","text":"fw-ai/llama-cuda-graph-example is classified as fork signal."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"belongs to","object":"forks desk","text":"fw-ai/llama-cuda-graph-example belongs to forks desk."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has context","object":"forked from meta-llama/llama","text":"fw-ai/llama-cuda-graph-example has context forked from meta-llama/llama."},{"subject":"fw-ai/llama-cuda-graph-example","predicate":"has evidence coverage","object":"1 captured evidence page","text":"fw-ai/llama-cuda-graph-example has evidence coverage 1 captured evidence 
page."}]},"signal":{"id":"3d277a30-e481-477c-b998-557fa5bf09dc","url":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc","json_url":"https://onlylabs.fyi/signals/3d277a30-e481-477c-b998-557fa5bf09dc/signal.json","source_url":"https://github.com/fw-ai/llama-cuda-graph-example","title":"fw-ai/llama-cuda-graph-example","summary":"Fireworks AI forked upstream code. onlylabs watches forks for tooling, infrastructure, research dependencies, and product-adjacent work.","context":"forked from meta-llama/llama","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2023-08-16T21:36:02+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/fw-ai/llama-cuda-graph-example"]},"facets":{"repo":"fw-ai/llama-cuda-graph-example","parent":"meta-llama/llama"},"traction":{"github_stars":11,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":null},"primary_evidence_page":{"url":"https://github.com/fw-ai/llama-cuda-graph-example","final_url":"https://github.com/fw-ai/llama-cuda-graph-example","title":"fw-ai/llama-cuda-graph-example repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T04:19:34.484772+00:00","bytes":26204,"raw_path":"17385866f793d7c08d0367f2765cdd458602ae082703ab6124669288519d2fb9.json","content_hash":"d0c244f6f034f4af3c9b295d5c8405579bc6c24233ad1b79093288120ebc4582","excerpt_chars":1200,"truncated":true,"excerpt":"fw-ai/llama-cuda-graph-example Description: Example of applying CUDA graphs to LLaMA-v2 License: NOASSERTION Stars: 11 Forks: 5 Open issues: 0 Created: 2023-08-16T21:36:02Z Pushed: 2023-08-25T23:08:38Z Default branch: 
main Fork: yes Parent repository: meta-llama/llama Archived: no README: Llama 2 We are unlocking the power of large language models. Our latest version of Llama is now accessible to individuals, creators, researchers and businesses of all sizes so that they can experiment, innovate and scale their ideas responsibly. This release includes model weights and starting code for pretrained and fine-tuned Llama language models — ranging from 7B to 70B parameters. This repository is intended as a minimal example to load [Llama 2](https://ai.meta.com/research/publications/llama-2-open-foundation-and-fine-tuned-chat-models/) models and run inference. For more detailed examples leveraging HuggingFace, see [llama-recipes](https://github.com/facebookresearch/llama-recipes/). Updates post-launch See [UPDATES.md](UPDATES.md). Download ⚠️ **7/18: We're aware of people encountering a number of download issues today. Anyone still encountering issues should remove all local files,..."},"evidence_pages":[{"url":"https://github.com/fw-ai/llama-cuda-graph-example","final_url":"https://github.com/fw-ai/llama-cuda-graph-example","title":"fw-ai/llama-cuda-graph-example repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T04:19:34.484772+00:00","bytes":26204,"raw_path":"17385866f793d7c08d0367f2765cdd458602ae082703ab6124669288519d2fb9.json","content_hash":"d0c244f6f034f4af3c9b295d5c8405579bc6c24233ad1b79093288120ebc4582","excerpt_chars":1200,"truncated":true,"excerpt":"fw-ai/llama-cuda-graph-example Description: Example of applying CUDA graphs to LLaMA-v2 License: NOASSERTION Stars: 11 Forks: 5 Open issues: 0 Created: 2023-08-16T21:36:02Z Pushed: 2023-08-25T23:08:38Z Default branch: main Fork: yes Parent repository: meta-llama/llama Archived: no README: Llama 2 We are unlocking the power of large language models. 
Our latest version of Llama is now accessible to individuals, creators, researchers and businesses of all sizes so that they can experiment, innovate and scale their ideas responsibly. This release includes model weights and starting code for pretrained and fine-tuned Llama language models — ranging from 7B to 70B parameters. This repository is intended as a minimal example to load [Llama 2](https://ai.meta.com/research/publications/llama-2-open-foundation-and-fine-tuned-chat-models/) models and run inference. For more detailed examples leveraging HuggingFace, see [llama-recipes](https://github.com/facebookresearch/llama-recipes/). Updates post-launch See [UPDATES.md](UPDATES.md). Download ⚠️ **7/18: We're aware of people encountering a number of download issues today. Anyone still encountering issues should remove all local files,..."}],"related_signals":[{"id":"322fcebd-97f6-4e75-a3d6-097d673c0dc4","url":"https://onlylabs.fyi/signals/322fcebd-97f6-4e75-a3d6-097d673c0dc4","source_url":"https://github.com/fw-ai/safetensors","title":"fw-ai/safetensors","context":"forked from safetensors/safetensors","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2026-06-02T23:45:45+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"},{"id":"d2d8dd75-c212-408b-9201-c07833f17f5b","url":"https://onlylabs.fyi/signals/d2d8dd75-c212-408b-9201-c07833f17f5b","source_url":"https://github.com/fw-ai/triton","title":"fw-ai/triton","context":"forked from triton-lang/triton","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks 
AI","category":"neocloud"},"occurred_at":"2026-03-17T23:07:43+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"},{"id":"f4f15245-e148-44e1-a2ce-d9bb30affcb2","url":"https://onlylabs.fyi/signals/f4f15245-e148-44e1-a2ce-d9bb30affcb2","source_url":"https://github.com/fw-ai/nixl","title":"fw-ai/nixl","context":"forked from ai-dynamo/nixl","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2026-01-09T21:55:48+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"},{"id":"375b5e8d-aceb-4979-946a-fe37d093240a","url":"https://onlylabs.fyi/signals/375b5e8d-aceb-4979-946a-fe37d093240a","source_url":"https://github.com/fw-ai/DeepEP","title":"fw-ai/DeepEP","context":"forked from deepseek-ai/DeepEP","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2025-06-06T21:48:44+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"},{"id":"39d882c8-ddfc-4360-8ae6-bf3333e32b70","url":"https://onlylabs.fyi/signals/39d882c8-ddfc-4360-8ae6-bf3333e32b70","source_url":"https://github.com/fw-ai/kaldi","title":"fw-ai/kaldi","context":"forked from kaldi-asr/kaldi","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2024-10-07T01:08:21+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"},{"id":"eab92735-6df1-4fcf-9210-8e9e5860489a","url":"https://onlylabs.fyi/signals/eab92735-6df1-4fcf-9210-8e9e5860489a","source_url":"https://github.com/fw-ai/cutlass","title":"fw-ai/cutlass","context":"forked from NVIDIA/cutlass","kind":{"key":"repo_forked","label":"Fork"},"org":{"slug":"fireworks-ai","name":"Fireworks AI","category":"neocloud"},"occurred_at":"2024-09-09T17:47:04+00:00","first_seen_at":"2026-06-05T22:32:07.992054+00:00","date_source":"source"}]}