{"schema_version":"onlylabs.public_signal.v1","title":"Amazon (Nova) Repo: amazon-science/hotel-quest-benchmark","description":"Amazon (Nova) repo signal with public source context, captured evidence pages, related signals, and data-business radar classification.","url":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5","json_url":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5/signal.json","generated_at":"2026-06-11T03:02:53.147046+00:00","org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab","category_label":"Frontier lab","dossier_url":"https://onlylabs.fyi/labs/amazon","dossier_json_url":"https://onlylabs.fyi/labs/amazon/dossier.json"},"related_urls":{"signal":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5","signal_json":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5/signal.json","source":"https://github.com/amazon-science/hotel-quest-benchmark","lab_dossier":"https://onlylabs.fyi/labs/amazon","lab_dossier_json":"https://onlylabs.fyi/labs/amazon/dossier.json","analysis":"https://onlylabs.fyi/analysis/amazon","analysis_json":"https://onlylabs.fyi/analysis/amazon/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/amazon/evidence.json","category":"https://onlylabs.fyi/frontier","category_json":"https://onlylabs.fyi/frontier.json","category_feed":"https://onlylabs.fyi/frontier/feed.xml","category_signals_json":"https://onlylabs.fyi/signals.json","topic":null,"topic_signals_json":null,"topic_feed":null,"data_business":{"radar":"https://onlylabs.fyi/data-radar","radar_json":"https://onlylabs.fyi/data-radar.json","opportunities":"https://onlylabs.fyi/opportunities","opportunities_json":"https://onlylabs.fyi/opportunities.json","lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}]}},"answer_pack":{"answer":"Amazon (Nova) published amazon-science/hotel-quest-benchmark (Jupyter Notebook). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo amazon-science/hotel-quest-benchmark · language Jupyter Notebook · New benchmark repo, low traction. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality in the data-business radar.","signal_desk":"repos","source_context":{"source_url":"https://github.com/amazon-science/hotel-quest-benchmark","source_host":"github.com","occurred_at":"2026-01-14T13:54:05+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source","context":"Jupyter Notebook"},"context_markers":[{"label":"Lab","value":"Amazon (Nova)","source":"signal"},{"label":"Signal desk","value":"repos","source":"signal"},{"label":"Source host","value":"github.com","source":"source"},{"label":"Repository","value":"amazon-science/hotel-quest-benchmark","source":"source"},{"label":"Language","value":"Jupyter Notebook","source":"source"},{"label":"Stars","value":"2","source":"traction"},{"label":"Notability","value":"New benchmark repo, low traction","source":"signal"},{"label":"Radar lane","value":"Evals and quality","source":"radar"},{"label":"Matched term","value":"benchmark","source":"radar"},{"label":"Watch term","value":"Eval methodology","source":"evidence"},{"label":"Watch term","value":"Data pipeline","source":"evidence"},{"label":"Watch term","value":"Infrastructure","source":"evidence"},{"label":"Watch term","value":"Agents and tool use","source":"evidence"}],"evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/amazon-science/hotel-quest-benchmark"],"related_signals":6,"has_source_url":true,"latest_page_fetched_at":"2026-06-11T03:02:53.147046+00:00"},"data_business":{"matches":true,"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals","json_url":"https://onlylabs.fyi/data-radar/evals/signals.json"}],"matched_terms":["benchmark"],"score":14,"reason":"Amazon (Nova) has a repo signal matching evals and quality."},"agent_handoff":{"signal_json":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5/signal.json","dossier_json":"https://onlylabs.fyi/labs/amazon/dossier.json","analysis_json":"https://onlylabs.fyi/analysis/amazon/analysis.json","analysis_evidence_json":"https://onlylabs.fyi/analysis/amazon/evidence.json","topic_signals_json":null,"topic_feed":null,"category_signals_json":"https://onlylabs.fyi/signals.json","data_radar_json":"https://onlylabs.fyi/data-radar.json","opportunities_json":"https://onlylabs.fyi/opportunities.json"},"analysis_playbook":{"objective":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","evidence_focus":["repo name","owner","description","language","stars","source URL","first seen time","data, eval, infra, safety, and product terms"],"extraction_questions":["What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Is the repo new evidence for a lab direction that is not yet in writing or releases?","Which related signals should an analyst inspect next?"],"signal_questions":["What does this new repository reveal before a formal announcement exists?","What technical area does this repository expose?","Does the repo imply eval, data, infrastructure, agent, or deployment work?","Which data-business lane explains this signal: Evals and quality?","Do the 6 related repo signals show a repeated pattern?"],"output_fields":["org","repo","technical_theme","data_business_lane","evidence_url"],"data_business_relevance":"New repositories can expose organization build priorities early, especially around internal tooling, eval infrastructure, data systems, deployment, and agent workflows.","required_sources":[{"label":"signal_json","url":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5/signal.json","required":true},{"label":"source","url":"https://github.com/amazon-science/hotel-quest-benchmark","required":true},{"label":"dossier_json","url":"https://onlylabs.fyi/labs/amazon/dossier.json","required":true},{"label":"analysis_evidence_json","url":"https://onlylabs.fyi/analysis/amazon/evidence.json","required":true},{"label":"topic_signals_json","url":null,"required":false},{"label":"data_radar_json","url":"https://onlylabs.fyi/data-radar.json","required":true}],"expected_output":["one-paragraph source-grounded interpretation","data-business implication","confidence and missing evidence","recommended next source to inspect"],"prompt_seed":"Using only the linked onlylabs JSON, captured source context, and cited evidence, analyze Amazon (Nova)'s repo signal \"amazon-science/hotel-quest-benchmark\" for frontier lab strategy and data-business implications."},"semantic_triples":[{"subject":"Amazon (Nova)","predicate":"published repo","object":"amazon-science/hotel-quest-benchmark","text":"Amazon (Nova) published repo amazon-science/hotel-quest-benchmark."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"is classified as","object":"repo signal","text":"amazon-science/hotel-quest-benchmark is classified as repo signal."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"belongs to","object":"repos desk","text":"amazon-science/hotel-quest-benchmark belongs to repos desk."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has context","object":"Jupyter Notebook","text":"amazon-science/hotel-quest-benchmark has context Jupyter Notebook."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"amazon-science/hotel-quest-benchmark has evidence coverage 1 captured evidence page."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"matches data-business lanes","object":"Evals and quality","text":"amazon-science/hotel-quest-benchmark matches data-business lanes Evals and quality."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has captured page count","object":"1","text":"amazon-science/hotel-quest-benchmark has captured page count 1."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has readable page count","object":"1","text":"amazon-science/hotel-quest-benchmark has readable page count 1."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has related signal count","object":"6","text":"amazon-science/hotel-quest-benchmark has related signal count 6."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has analysis playbook objective","object":"Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.","text":"amazon-science/hotel-quest-benchmark has analysis playbook objective Turn new repository signals into early evidence of tooling, eval, infrastructure, model-adjacent, or product work before it appears in polished launch channels.."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has source host","object":"github.com","text":"amazon-science/hotel-quest-benchmark has source host github.com."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has lab","object":"Amazon (Nova)","text":"amazon-science/hotel-quest-benchmark has lab Amazon (Nova)."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has signal desk","object":"repos","text":"amazon-science/hotel-quest-benchmark has signal desk repos."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has source host","object":"github.com","text":"amazon-science/hotel-quest-benchmark has source host github.com."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has repository","object":"amazon-science/hotel-quest-benchmark","text":"amazon-science/hotel-quest-benchmark has repository amazon-science/hotel-quest-benchmark."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has language","object":"Jupyter Notebook","text":"amazon-science/hotel-quest-benchmark has language Jupyter Notebook."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has stars","object":"2","text":"amazon-science/hotel-quest-benchmark has stars 2."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has notability","object":"New benchmark repo, low traction","text":"amazon-science/hotel-quest-benchmark has notability New benchmark repo, low traction."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has radar lane","object":"Evals and quality","text":"amazon-science/hotel-quest-benchmark has radar lane Evals and quality."}]},"intelligence":{"signal_desk":"repos","answer":"Amazon (Nova) published amazon-science/hotel-quest-benchmark (Jupyter Notebook). This repository signal exposes tooling, eval, infrastructure, or model-adjacent work before it may appear in a launch post. High-signal details: repo amazon-science/hotel-quest-benchmark · language Jupyter Notebook · New benchmark repo, low traction. onlylabs links this event to 1 captured evidence page and 6 related repo signals. It also maps to Evals and quality in the data-business radar.","semantic_triples":[{"subject":"Amazon (Nova)","predicate":"published repo","object":"amazon-science/hotel-quest-benchmark","text":"Amazon (Nova) published repo amazon-science/hotel-quest-benchmark."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"is classified as","object":"repo signal","text":"amazon-science/hotel-quest-benchmark is classified as repo signal."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"belongs to","object":"repos desk","text":"amazon-science/hotel-quest-benchmark belongs to repos desk."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has context","object":"Jupyter Notebook","text":"amazon-science/hotel-quest-benchmark has context Jupyter Notebook."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"has evidence coverage","object":"1 captured evidence page","text":"amazon-science/hotel-quest-benchmark has evidence coverage 1 captured evidence page."},{"subject":"amazon-science/hotel-quest-benchmark","predicate":"matches data-business lanes","object":"Evals and quality","text":"amazon-science/hotel-quest-benchmark matches data-business lanes Evals and quality."}]},"signal":{"id":"f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5","url":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5","json_url":"https://onlylabs.fyi/signals/f3fe01f6-fc0a-43f5-9a77-b5acedc0e9e5/signal.json","source_url":"https://github.com/amazon-science/hotel-quest-benchmark","title":"amazon-science/hotel-quest-benchmark","summary":"Amazon (Nova) published a new repository. onlylabs watches repos for tooling, eval, infra, and model-adjacent work.","context":"Jupyter Notebook","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-01-14T13:54:05+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source","evidence_coverage":{"target_pages":1,"captured_pages":1,"readable_pages":1,"capture_methods":["plain"],"missing_page_urls":[],"failed_page_urls":[],"blocked_page_urls":[],"page_urls":["https://github.com/amazon-science/hotel-quest-benchmark"]},"facets":{"repo":"amazon-science/hotel-quest-benchmark","language":"Jupyter Notebook"},"traction":{"github_stars":2,"hn_points":null,"hn_comments":null,"hn_story_id":null,"hf_downloads":null,"hf_likes":null},"data_radar":{"lanes":[{"key":"evals","label":"Evals and quality","url":"https://onlylabs.fyi/data-radar/evals"}],"score":14,"matched_terms":["benchmark"],"reason":"Amazon (Nova) has a repo signal matching evals and quality."}},"primary_evidence_page":{"url":"https://github.com/amazon-science/hotel-quest-benchmark","final_url":"https://github.com/amazon-science/hotel-quest-benchmark","title":"amazon-science/hotel-quest-benchmark repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:02:53.147046+00:00","bytes":19237,"raw_path":"2f366c291337d82f84afe9a1fad79a176615c36186fa4bc93ba9f830b49fe6fd.json","content_hash":"1db821798e6212e9b7488bb6292a2bcc24ddb969ce7bea33e51a4a0aae46476d","excerpt_chars":1200,"truncated":true,"excerpt":"amazon-science/hotel-quest-benchmark Language: Jupyter Notebook License: NOASSERTION Stars: 2 Forks: 0 Open issues: 0 Created: 2026-01-14T13:54:05Z Pushed: 2026-01-17T15:47:03Z Default branch: main Fork: no Archived: no README: HotelQuEST: Balancing Quality and Efficiency in Agentic Search [//]: # (## 📢 Latest Updates) [//]: # (- **2026 Jan-15**: Code and benchmark data released.) [//]: # (- **2025 Dec**: Paper accepted at EACL 2026.) HotelQuEST Benchmark 💡 HotelQuEST is a benchmark comprising 214 hotel search queries that range from simple factual requests to complex queries, enabling evaluation of agentic search systems across the full spectrum of query difficulty. The benchmark focuses on the trade-off between **answer quality** and **computational efficiency**. Contributions 🏆 - **A benchmark for agentic search:** A set of 214 simple to complex hotel queries, each with complexity ratings, ground-truth clarifications for underspecified preferences, and structured decompositions for detailed analysis of agent behavior. - **Joint evaluation of quality and efficiency:** A systematic measurement of answer quality together with cost, token usage, and latency, capturing tradeoffs..."},"evidence_pages":[{"url":"https://github.com/amazon-science/hotel-quest-benchmark","final_url":"https://github.com/amazon-science/hotel-quest-benchmark","title":"amazon-science/hotel-quest-benchmark repository metadata","http_status":200,"content_type":"application/json","capture_method":"plain","fetched_at":"2026-06-11T03:02:53.147046+00:00","bytes":19237,"raw_path":"2f366c291337d82f84afe9a1fad79a176615c36186fa4bc93ba9f830b49fe6fd.json","content_hash":"1db821798e6212e9b7488bb6292a2bcc24ddb969ce7bea33e51a4a0aae46476d","excerpt_chars":1200,"truncated":true,"excerpt":"amazon-science/hotel-quest-benchmark Language: Jupyter Notebook License: NOASSERTION Stars: 2 Forks: 0 Open issues: 0 Created: 2026-01-14T13:54:05Z Pushed: 2026-01-17T15:47:03Z Default branch: main Fork: no Archived: no README: HotelQuEST: Balancing Quality and Efficiency in Agentic Search [//]: # (## 📢 Latest Updates) [//]: # (- **2026 Jan-15**: Code and benchmark data released.) [//]: # (- **2025 Dec**: Paper accepted at EACL 2026.) HotelQuEST Benchmark 💡 HotelQuEST is a benchmark comprising 214 hotel search queries that range from simple factual requests to complex queries, enabling evaluation of agentic search systems across the full spectrum of query difficulty. The benchmark focuses on the trade-off between **answer quality** and **computational efficiency**. Contributions 🏆 - **A benchmark for agentic search:** A set of 214 simple to complex hotel queries, each with complexity ratings, ground-truth clarifications for underspecified preferences, and structured decompositions for detailed analysis of agent behavior. - **Joint evaluation of quality and efficiency:** A systematic measurement of answer quality together with cost, token usage, and latency, capturing tradeoffs..."}],"related_signals":[{"id":"087c32a2-6ad0-4981-9315-11fdd32a0153","url":"https://onlylabs.fyi/signals/087c32a2-6ad0-4981-9315-11fdd32a0153","source_url":"https://github.com/amazon-science/reskill","title":"amazon-science/reskill","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-06-04T02:13:35+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"},{"id":"e5701aed-6cd3-48dd-bfa6-ef839031e2e8","url":"https://onlylabs.fyi/signals/e5701aed-6cd3-48dd-bfa6-ef839031e2e8","source_url":"https://github.com/amazon-science/dualkv-flash-attn-for-rl","title":"amazon-science/dualkv-flash-attn-for-rl","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-05-27T17:38:58+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"},{"id":"8af28f0c-7331-4b08-b517-e18b3555e503","url":"https://onlylabs.fyi/signals/8af28f0c-7331-4b08-b517-e18b3555e503","source_url":"https://github.com/amazon-science/EvoMAS","title":"amazon-science/EvoMAS","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-05-19T19:23:29+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"},{"id":"e3ff8718-7daa-4ebd-a3e6-3d825c538b74","url":"https://onlylabs.fyi/signals/e3ff8718-7daa-4ebd-a3e6-3d825c538b74","source_url":"https://github.com/amazon-science/adaptive-layerwise-perturbation","title":"amazon-science/adaptive-layerwise-perturbation","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-05-14T17:44:17+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"},{"id":"9afcd328-0124-485c-8ace-9c3ad546e316","url":"https://onlylabs.fyi/signals/9afcd328-0124-485c-8ace-9c3ad546e316","source_url":"https://github.com/amazon-science/temporal-reasoning-dataset","title":"amazon-science/temporal-reasoning-dataset","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-05-13T13:07:08+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"},{"id":"e19ce80b-3d6a-4aaf-9b1a-82d1b19ab682","url":"https://onlylabs.fyi/signals/e19ce80b-3d6a-4aaf-9b1a-82d1b19ab682","source_url":"https://github.com/amazon-science/PROF-GRPO","title":"amazon-science/PROF-GRPO","context":"Python","kind":{"key":"repo_new","label":"Repo"},"org":{"slug":"amazon","name":"Amazon (Nova)","category":"frontier-lab"},"occurred_at":"2026-05-12T19:43:55+00:00","first_seen_at":"2026-06-05T20:58:37.464059+00:00","date_source":"source"}]}