<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Issue Genie Benchmark:  Different responses in UI and Benchmark in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/issue-genie-benchmark-different-responses-in-ui-and-benchmark/m-p/155874#M54325</link>
    <description>&lt;P&gt;Hello, I am trying to add a benchmark dataset for my Genie space.&lt;BR /&gt;&lt;BR /&gt;When I ask a question in the Genie space UI directly, I get the right output. However, when I add the same question to the Genie benchmark, the result is quite bad and the SQL it uses in the benchmark is incomplete.&lt;/P&gt;</description>
    <pubDate>Thu, 30 Apr 2026 12:59:19 GMT</pubDate>
    <dc:creator>maze2498</dc:creator>
    <dc:date>2026-04-30T12:59:19Z</dc:date>
    <item>
      <title>Issue Genie Benchmark:  Different responses in UI and Benchmark</title>
      <link>https://community.databricks.com/t5/data-engineering/issue-genie-benchmark-different-responses-in-ui-and-benchmark/m-p/155874#M54325</link>
      <description>&lt;P&gt;Hello, I am trying to add a benchmark dataset for my Genie space.&lt;BR /&gt;&lt;BR /&gt;When I ask a question in the Genie space UI directly, I get the right output. However, when I add the same question to the Genie benchmark, the result is quite bad and the SQL it uses in the benchmark is incomplete.&lt;/P&gt;</description>
      <pubDate>Thu, 30 Apr 2026 12:59:19 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/issue-genie-benchmark-different-responses-in-ui-and-benchmark/m-p/155874#M54325</guid>
      <dc:creator>maze2498</dc:creator>
      <dc:date>2026-04-30T12:59:19Z</dc:date>
    </item>
    <item>
      <title>Re: Issue Genie Benchmark:  Different responses in UI and Benchmark</title>
      <link>https://community.databricks.com/t5/data-engineering/issue-genie-benchmark-different-responses-in-ui-and-benchmark/m-p/155884#M54326</link>
      <description>&lt;P&gt;Hi, when you say the SQL it generates is quite bad and missing, do you mean when you run the benchmark? The benchmark purposefully doesn't have any conversation history, unlike the Genie Space. So sometimes the results can vary. I.e., if you've asked a lot of questions before the one in your Genie Space, there will be additional context th&lt;/P&gt;</description>
      <pubDate>Thu, 30 Apr 2026 15:00:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/issue-genie-benchmark-different-responses-in-ui-and-benchmark/m-p/155884#M54326</guid>
      <dc:creator>emma_s</dc:creator>
      <dc:date>2026-04-30T15:00:41Z</dc:date>
    </item>
  </channel>
</rss>

