<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Report on SQL queries that are being executed in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31114#M22636</link>
    <description>&lt;P&gt;@Alex Davies​&amp;nbsp;- Would you be willing to share your solution when you've got it? &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt; &lt;/P&gt;</description>
    <pubDate>Mon, 07 Mar 2022 00:29:44 GMT</pubDate>
    <dc:creator>Anonymous</dc:creator>
    <dc:date>2022-03-07T00:29:44Z</dc:date>
    <item>
      <title>Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31105#M22627</link>
      <description>&lt;P&gt;We have a SQL workspace with a cluster running that services a number of self service reports against a range of datasets. We want to be able to analyse and report on the queries our self service users are executing so we can get better visibility of who is using the data platform, and what/how the tables are being used. Ideally this would be using databricks SQL workspace to do this reporting rather than using another tool.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;All this information is available in the UI in the Query history, but this is not in a form we can easily analyse or create graphs against&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We know there is an API to pull the query history from the UI, however it does seem convoluted to query the API to fetch data about our cluster so we can ingest into our cluster so we can query it&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;What is the best way to get query history information into a hive table so we can query, analyse and graph it?&lt;/P&gt;</description>
      <pubDate>Mon, 24 Jan 2022 15:33:22 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31105#M22627</guid>
      <dc:creator>AlexDavies</dc:creator>
      <dc:date>2022-01-24T15:33:22Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31106#M22628</link>
      <description>&lt;P&gt;Hello, @Alex Davies​! My name is Piper, and I'm one of the moderators here in the community. Welcome to the community; it's great to meet you!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We'll give the community some time to respond then we will come back to this if we need to. Thanks for your patience. &lt;/P&gt;</description>
      <pubDate>Tue, 25 Jan 2022 15:01:30 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31106#M22628</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-01-25T15:01:30Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31107#M22629</link>
      <description>&lt;P&gt;Were you able to find a solution for this? &lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 05:25:47 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31107#M22629</guid>
      <dc:creator>Constantine</dc:creator>
      <dc:date>2022-02-09T05:25:47Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31108#M22630</link>
      <description>&lt;P&gt;@John Constantine​&amp;nbsp;- I'm sorry it is taking so long. I will escalate this to the team. &lt;/P&gt;</description>
      <pubDate>Wed, 09 Feb 2022 15:53:49 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31108#M22630</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-02-09T15:53:49Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31110#M22632</link>
      <description>&lt;P&gt;&lt;A href="https://docs.microsoft.com/en-us/azure/databricks/sql/admin/query-history" target="test_blank"&gt;https://docs.microsoft.com/en-us/azure/databricks/sql/admin/query-history&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Does this help @Alex Davies​&amp;nbsp; or the one Kaniz has shared?&lt;/P&gt;</description>
      <pubDate>Sat, 12 Feb 2022 15:57:55 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31110#M22632</guid>
      <dc:creator>Atanu</dc:creator>
      <dc:date>2022-02-12T15:57:55Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31111#M22633</link>
      <description>&lt;P&gt;@Kaniz Fatma​&amp;nbsp;, @Atanu Sarkar​&amp;nbsp;thanks for your response, and for investigating an individual query the UI is great and import could be a useful feature&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;But what we were after was a way to analyse the query history as an aggregate. For example graphing the number of queries over time, or who has been making the most queries, or the 95th percentile of query times. This sort of analysis is not possible in the UI and the data is not exposed in a way we can just utilize the already existing data analytics tools on the platform&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We have started to make progress on working around this by calling the API and downloading the Query History into a table. Then we can write SQL queries and create dashboards from the downloaded data. Considering this a platform for processing data it is a bit surprising that its own internal data is so hard to extract for processing&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;We did also notice Overwatch (https://github.com/databrickslabs/overwatch) but it does not seem to import any of the SQL workspace entities so does not solve this issue, but may well solve other related issues of getting visibility of internal data&lt;/P&gt;</description>
      <pubDate>Mon, 14 Feb 2022 08:56:53 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31111#M22633</guid>
      <dc:creator>AlexDavies</dc:creator>
      <dc:date>2022-02-14T08:56:53Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31113#M22635</link>
      <description>&lt;P&gt;These features are amazing and we do use these to optimize individual queries&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;But I was looking for a way where we can calculate statistics over &lt;B&gt;all&lt;/B&gt; the queries running on the platform. Answer questions like &lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Who is running the most queries&lt;/LI&gt;&lt;LI&gt;What is the average query execution time&lt;/LI&gt;&lt;LI&gt;What tables are being used the most/least&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;The information required to service these queries is available in the query history tab, but in its current form it's impossible to run aggregation queries on top of that data. I was looking to see if that data could easily be exposed as a table in databricks &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;But, as it doesn't appear possible, we are writing something custom to export query history from the API and import it into a table&lt;/P&gt;</description>
      <pubDate>Thu, 17 Feb 2022 09:30:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31113#M22635</guid>
      <dc:creator>AlexDavies</dc:creator>
      <dc:date>2022-02-17T09:30:07Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31114#M22636</link>
      <description>&lt;P&gt;@Alex Davies​&amp;nbsp;- Would you be willing to share your solution when you've got it? &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt; &lt;/P&gt;</description>
      <pubDate>Mon, 07 Mar 2022 00:29:44 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31114#M22636</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-03-07T00:29:44Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31117#M22639</link>
      <description>&lt;P&gt;Hey there @Alex Davies​&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Hope you are doing great. Just checking in if you were able to resolve your issue or do you need more help? We'd love to hear from you.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 02 May 2022 15:21:26 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/31117#M22639</guid>
      <dc:creator>Anonymous</dc:creator>
      <dc:date>2022-05-02T15:21:26Z</dc:date>
    </item>
    <item>
      <title>Re: Report on SQL queries that are being executed</title>
      <link>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/93169#M38639</link>
      <description>&lt;P&gt;I would like to&amp;nbsp;see if there are any queries running with run time more than 30 minutes or queries pulling more than 1 million&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 08 Oct 2024 17:12:24 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/report-on-sql-queries-that-are-being-executed/m-p/93169#M38639</guid>
      <dc:creator>slakshmanan</dc:creator>
      <dc:date>2024-10-08T17:12:24Z</dc:date>
    </item>
  </channel>
</rss>

