<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: File information is not passed to trigger job on file arrival in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91469#M38169</link>
    <description>&lt;P&gt;Any ETA ? We are having to use other Orchestration products because of this limitation.&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Mon, 23 Sep 2024 16:22:13 GMT</pubDate>
    <dc:creator>srsnarendran</dc:creator>
    <dc:date>2024-09-23T16:22:13Z</dc:date>
    <item>
      <title>File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39266#M26905</link>
      <description>&lt;P&gt;We are using the UC mechanism for triggering jobs on file arrival, as described here: &lt;A href="https://learn.microsoft.com/en-us/azure/databricks/workflows/jobs/file-arrival-triggers" target="_blank" rel="noopener"&gt;https://learn.microsoft.com/en-us/azure/databricks/workflows/jobs/file-arrival-triggers&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;Unfortunately, the trigger doesn't actually pass the file-path that is generating the trigger to the job... (The Run Parameters are empty). Is there any way to get this information?&lt;/P&gt;</description>
      <pubDate>Mon, 07 Aug 2023 14:57:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39266#M26905</guid>
      <dc:creator>Rik</dc:creator>
      <dc:date>2023-08-07T14:57:18Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39320#M26919</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/48571"&gt;@Rik&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;For now, we do not send the file details as part of the trigger. The trigger is used to run a pipeline.&lt;/P&gt;&lt;P&gt;Alternately, You can use autoloader as part of the triggered pipeline to get the details of the file that arrived.&lt;/P&gt;</description>
      <pubDate>Tue, 08 Aug 2023 05:03:44 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39320#M26919</guid>
      <dc:creator>Tharun-Kumar</dc:creator>
      <dc:date>2023-08-08T05:03:44Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39354#M26931</link>
      <description>&lt;P&gt;&lt;EM&gt;"Alternately, You can use autoloader as part of the triggered pipeline to get the details of the file that arrived."&lt;/EM&gt;&lt;/P&gt;&lt;P&gt;That doesn't quite fit our requirements unfortunately... Are there any plans on adding this functionality?&lt;/P&gt;</description>
      <pubDate>Tue, 08 Aug 2023 12:36:18 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39354#M26931</guid>
      <dc:creator>Rik</dc:creator>
      <dc:date>2023-08-08T12:36:18Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39394#M26958</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/48571"&gt;@Rik&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;We have received this request from other customers too. Our engineering team has already been notified, and there is an internal ticket for it, but we don't have an ETA for now.&lt;/P&gt;</description>
      <pubDate>Tue, 08 Aug 2023 17:48:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/39394#M26958</guid>
      <dc:creator>Tharun-Kumar</dc:creator>
      <dc:date>2023-08-08T17:48:46Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/60330#M31640</link>
      <description>&lt;P&gt;Could you please provide an update on the status of this particular request? Additionally, do we have any ETA for it?&lt;/P&gt;</description>
      <pubDate>Thu, 15 Feb 2024 18:24:57 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/60330#M31640</guid>
      <dc:creator>Panda</dc:creator>
      <dc:date>2024-02-15T18:24:57Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/71716#M34386</link>
      <description>&lt;P&gt;Also something I'm interested in using, would be really helpful to use File Trigger and get relevant information about exactly what file triggered the workflow!&lt;/P&gt;</description>
      <pubDate>Wed, 05 Jun 2024 08:18:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/71716#M34386</guid>
      <dc:creator>marcuskw</dc:creator>
      <dc:date>2024-06-05T08:18:23Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91469#M38169</link>
      <description>&lt;P&gt;Any ETA ? We are having to use other Orchestration products because of this limitation.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 23 Sep 2024 16:22:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91469#M38169</guid>
      <dc:creator>srsnarendran</dc:creator>
      <dc:date>2024-09-23T16:22:13Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91483#M38171</link>
      <description>&lt;P&gt;Same here!&lt;/P&gt;&lt;P&gt;Additionally, it would be great to enhance it to support not just the path to a directory, but also the prefix of the file name (or regex for bonus points). Right now, if you have 10 types of files arriving in the same folder, it would be much cleaner to have each workflow that handles a given type process only the relevant file that arrived.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 23 Sep 2024 19:37:46 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91483#M38171</guid>
      <dc:creator>artemich</dc:creator>
      <dc:date>2024-09-23T19:37:46Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91484#M38172</link>
      <description>&lt;P&gt;You are able to provide filter options to select only relevant files:&lt;BR /&gt;&lt;A href="https://docs.databricks.com/en/ingestion/cloud-object-storage/auto-loader/patterns.html#filtering-directories-or-files-using-glob-patterns" target="_blank"&gt;https://docs.databricks.com/en/ingestion/cloud-object-storage/auto-loader/patterns.html#filtering-directories-or-files-using-glob-patterns&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 23 Sep 2024 19:46:01 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91484#M38172</guid>
      <dc:creator>marcuskw</dc:creator>
      <dc:date>2024-09-23T19:46:01Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91620#M38222</link>
      <description>&lt;P&gt;For loading files with AutoLoader - for sure. My wish is to have similar capability for File Arrival Trigger.&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;"A file arrival trigger can be configured to monitor the root of a Unity Catalog external location or volume, or a subpath of an external location or volume."&lt;BR /&gt;&lt;/SPAN&gt;&lt;A href="https://learn.microsoft.com/en-us/azure/databricks/jobs/file-arrival-triggers" target="_blank"&gt;https://learn.microsoft.com/en-us/azure/databricks/jobs/file-arrival-triggers&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Quite often files for multiple data entities (or even pipelines) land in the same directories from a given provider and it would be great to be able to easily manage such scenarios.&lt;/P&gt;</description>
      <pubDate>Tue, 24 Sep 2024 19:38:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/91620#M38222</guid>
      <dc:creator>artemich</dc:creator>
      <dc:date>2024-09-24T19:38:36Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/95684#M39148</link>
      <description>&lt;P&gt;What do you need to achieve?&lt;/P&gt;&lt;P&gt;Autoloader is much more efficient since it can handle a bunch of files (only new ones) in a single operation. Handling file by file, especially with a lot of files, will increase latency and increase costs.&lt;/P&gt;</description>
      <pubDate>Wed, 23 Oct 2024 09:31:55 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/95684#M39148</guid>
      <dc:creator>mattiazeni</dc:creator>
      <dc:date>2024-10-23T09:31:55Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/95726#M39163</link>
      <description>&lt;P&gt;What I wanted to achieve was a dynamic schema application based on what file was picked up.&lt;BR /&gt;So I implemented one autoloader task to collect files from a specific path "source":&lt;BR /&gt;- source/employees/0001.csv&lt;BR /&gt;- source/holiday/0001.csv&lt;/P&gt;&lt;P&gt;If the path of the file was available I could then apply the relevant schema at runtime.&lt;BR /&gt;But autoloader may want to process both files and put them into the same dataframe?&lt;BR /&gt;Maybe this isn't the best use case, I guess you would recommend implementing multiple tasks/checkpoints for the respective folders?&lt;/P&gt;</description>
      <pubDate>Wed, 23 Oct 2024 13:24:48 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/95726#M39163</guid>
      <dc:creator>marcuskw</dc:creator>
      <dc:date>2024-10-23T13:24:48Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/112912#M44357</link>
      <description>&lt;P&gt;any news?&lt;/P&gt;</description>
      <pubDate>Tue, 18 Mar 2025 10:57:27 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/112912#M44357</guid>
      <dc:creator>007</dc:creator>
      <dc:date>2025-03-18T10:57:27Z</dc:date>
    </item>
    <item>
      <title>Re: File information is not passed to trigger job on file arrival</title>
      <link>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/113209#M44469</link>
      <description>&lt;P&gt;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/115282"&gt;@007&lt;/a&gt;&amp;nbsp; - Review the link&amp;nbsp;&lt;A href="https://community.databricks.com/t5/data-engineering/file-arrival-trigger/m-p/94069/highlight/true#M38808" target="_blank"&gt;https://community.databricks.com/t5/data-engineering/file-arrival-trigger/m-p/94069/highlight/true#M38808&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 20 Mar 2025 20:05:25 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/file-information-is-not-passed-to-trigger-job-on-file-arrival/m-p/113209#M44469</guid>
      <dc:creator>Panda</dc:creator>
      <dc:date>2025-03-20T20:05:25Z</dc:date>
    </item>
  </channel>
</rss>

