<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: Can we use multiple git repos for a job running multiple tasks? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17696#M11660</link>
    <description>&lt;P&gt;Hi @Prabakar Ammeappin​&amp;nbsp;, task2 depends on task1, as it sends out the results from task1.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I also tried removing the dependency and edited the git reference, but it changes the git reference for all the tasks in the job.&lt;/P&gt;&lt;P&gt;Do you know if that is a feature missing from jobs, or if it is intentional?&lt;/P&gt;</description>
    <pubDate>Thu, 16 Jun 2022 07:17:27 GMT</pubDate>
    <dc:creator>thib</dc:creator>
    <dc:date>2022-06-16T07:17:27Z</dc:date>
    <item>
      <title>Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17694#M11658</link>
      <description>&lt;P&gt;I have a job running multiple tasks :&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Task 1 runs a machine learning pipeline from git repo 1&lt;/LI&gt;&lt;LI&gt;Task 2 runs an ETL pipeline from git repo 1&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Task 2 is actually a generic pipeline and should not be checked in repo 1, and will be made available in another repo where various ETL pipelines are stored.&lt;/P&gt;&lt;P&gt;However I see now that git repos are set up per Job, and not per Task.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Does anyone have a solution for this, which I would suppose is quite a common scenario?&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1803iA1EDBDB1DAC08D56/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 14 Jun 2022 17:52:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17694#M11658</guid>
      <dc:creator>thib</dc:creator>
      <dc:date>2022-06-14T17:52:04Z</dc:date>
    </item>
    <item>
      <title>Re: Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17695#M11659</link>
      <description>&lt;P&gt;hi @Thibault Daoulas​ if task2 is generic and doesn't depend on task1, could you try removing the depends on field in task2 and run the pipeline?&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1787iCF4D3EC812DF85FC/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 16 Jun 2022 06:29:04 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17695#M11659</guid>
      <dc:creator>Prabakar</dc:creator>
      <dc:date>2022-06-16T06:29:04Z</dc:date>
    </item>
    <item>
      <title>Re: Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17696#M11660</link>
      <description>&lt;P&gt;Hi @Prabakar Ammeappin​&amp;nbsp;, task2 depends on task1, as it sends out the results from task1.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I also tried removing the dependency and edited the git reference, but it changes the git reference for all the tasks in the job.&lt;/P&gt;&lt;P&gt;Do you know if that is a feature missing from jobs, or if it is intentional?&lt;/P&gt;</description>
      <pubDate>Thu, 16 Jun 2022 07:17:27 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17696#M11660</guid>
      <dc:creator>thib</dc:creator>
      <dc:date>2022-06-16T07:17:27Z</dc:date>
    </item>
    <item>
      <title>Re: Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17697#M11661</link>
      <description>&lt;P&gt;The way to go about this would be to create Databricks repos in the workspace and then use that in the task formation. This way we can refer to multiple repos in different tasks.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper" image-alt="image"&gt;&lt;img src="https://community.databricks.com/t5/image/serverpage/image-id/1793i17732E8DE5EB078F/image-size/large?v=v2&amp;amp;px=999" role="button" title="image" alt="image" /&gt;&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 11 May 2023 08:15:35 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/17697#M11661</guid>
      <dc:creator>trijit</dc:creator>
      <dc:date>2023-05-11T08:15:35Z</dc:date>
    </item>
    <item>
      <title>Re: Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/108702#M43120</link>
      <description>&lt;P&gt;Had this same problem. Fix was to have two workflows with no triggers, each pointing to the respective git repo. Then set up a 3rd workflow with appropriate triggers/schedule which calls the first 2 workflows.&amp;nbsp;&lt;BR /&gt;A workflow can run other workflows.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 04 Feb 2025 06:27:07 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/108702#M43120</guid>
      <dc:creator>tors_r_us</dc:creator>
      <dc:date>2025-02-04T06:27:07Z</dc:date>
    </item>
    <item>
      <title>Re: Can we use multiple git repos for a job running multiple tasks?</title>
      <link>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/135132#M50282</link>
      <description>&lt;P&gt;Yes, but this can cause an issue: more time is spent waiting for the cluster to come up. How did you fix this?&lt;/P&gt;</description>
      <pubDate>Thu, 16 Oct 2025 14:14:32 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/can-we-use-multiple-git-repos-for-a-job-running-multiple-tasks/m-p/135132#M50282</guid>
      <dc:creator>jeremy98</dc:creator>
      <dc:date>2025-10-16T14:14:32Z</dc:date>
    </item>
  </channel>
</rss>

