<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How to eval the accuracy/quality of a LLM? in Machine Learning</title>
    <link>https://community.databricks.com/t5/machine-learning/how-to-eval-the-accuracy-quality-of-a-llm/m-p/36128#M1880</link>
    <description>&lt;P&gt;There aren't exact metrics to evaluate how LLM is accurate right now. Just make test questions have a large coverage could be a tip. I expect many people will work on it!&lt;/P&gt;</description>
    <pubDate>Thu, 29 Jun 2023 00:32:41 GMT</pubDate>
    <dc:creator>Hyunkee</dc:creator>
    <dc:date>2023-06-29T00:32:41Z</dc:date>
    <item>
      <title>How to eval the accuracy/quality of a LLM?</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-eval-the-accuracy-quality-of-a-llm/m-p/36051#M1876</link>
      <description>&lt;P&gt;extremely subjective (human responses on likert scale don't suffice and hard to quantify with one metric on accuracy). curious how others have approached this&lt;/P&gt;</description>
      <pubDate>Wed, 28 Jun 2023 23:35:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-eval-the-accuracy-quality-of-a-llm/m-p/36051#M1876</guid>
      <dc:creator>cloud712</dc:creator>
      <dc:date>2023-06-28T23:35:10Z</dc:date>
    </item>
    <item>
      <title>Re: How to eval the accuracy/quality of a LLM?</title>
      <link>https://community.databricks.com/t5/machine-learning/how-to-eval-the-accuracy-quality-of-a-llm/m-p/36128#M1880</link>
      <description>&lt;P&gt;There aren't exact metrics to evaluate how LLM is accurate right now. Just make test questions have a large coverage could be a tip. I expect many people will work on it!&lt;/P&gt;</description>
      <pubDate>Thu, 29 Jun 2023 00:32:41 GMT</pubDate>
      <guid>https://community.databricks.com/t5/machine-learning/how-to-eval-the-accuracy-quality-of-a-llm/m-p/36128#M1880</guid>
      <dc:creator>Hyunkee</dc:creator>
      <dc:date>2023-06-29T00:32:41Z</dc:date>
    </item>
  </channel>
</rss>

