<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Scheduling Jobs with Multiple Git Repos on a Single Job Cluster in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/scheduling-jobs-with-multiple-git-repos-on-a-single-job-cluster/m-p/110805#M43691</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I'm trying to create a scheduled job that runs notebooks from &lt;STRONG&gt;three different repos&lt;/STRONG&gt;. However, since a job can only be associated with &lt;STRONG&gt;one&lt;/STRONG&gt; repo, I've had to create three separate jobs and a master job that triggers them sequentially.&lt;/P&gt;&lt;P&gt;This setup works, except that &lt;STRONG&gt;job clusters are limited to one job each&lt;/STRONG&gt;. This is problematic because starting a new cluster for each job delays execution, and I need the job to run as quickly as possible.&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;How can I either create a job with multiple repos using a single cluster, or configure multiple jobs to share the same job cluster?&lt;/STRONG&gt;&lt;/P&gt;</description>
    <pubDate>Fri, 21 Feb 2025 00:25:13 GMT</pubDate>
    <dc:creator>SOlivero</dc:creator>
    <dc:date>2025-02-21T00:25:13Z</dc:date>
    <item>
      <title>Scheduling Jobs with Multiple Git Repos on a Single Job Cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/scheduling-jobs-with-multiple-git-repos-on-a-single-job-cluster/m-p/110805#M43691</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I'm trying to create a scheduled job that runs notebooks from &lt;STRONG&gt;three different repos&lt;/STRONG&gt;. However, since a job can only be associated with &lt;STRONG&gt;one&lt;/STRONG&gt; repo, I've had to create three separate jobs and a master job that triggers them sequentially.&lt;/P&gt;&lt;P&gt;This setup works, except that &lt;STRONG&gt;job clusters are limited to one job each&lt;/STRONG&gt;. This is problematic because starting a new cluster for each job delays execution, and I need the job to run as quickly as possible.&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;How can I either create a job with multiple repos using a single cluster, or configure multiple jobs to share the same job cluster?&lt;/STRONG&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 21 Feb 2025 00:25:13 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/scheduling-jobs-with-multiple-git-repos-on-a-single-job-cluster/m-p/110805#M43691</guid>
      <dc:creator>SOlivero</dc:creator>
      <dc:date>2025-02-21T00:25:13Z</dc:date>
    </item>
    <item>
      <title>Re: Scheduling Jobs with Multiple Git Repos on a Single Job Cluster</title>
      <link>https://community.databricks.com/t5/data-engineering/scheduling-jobs-with-multiple-git-repos-on-a-single-job-cluster/m-p/110808#M43694</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/85726"&gt;@SOlivero&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;Try&amp;nbsp;configuring a &lt;STRONG&gt;shared all-purpose cluster&lt;/STRONG&gt; and set each job to use this existing cluster rather than creating new job-specific clusters, ensuring the cluster stays warm and avoiding startup delays. Another option is to restructure your master job to run the notebooks sequentially using &lt;STRONG&gt;task dependencies&lt;/STRONG&gt; within a single job definition, allowing all tasks to share the same cluster. This setup should help improve speed and efficiency, making your jobs run faster without the need for multiple clusters.&lt;/P&gt;&lt;P&gt;Hope this helps!&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;Brahma&lt;/P&gt;</description>
      <pubDate>Fri, 21 Feb 2025 03:46:23 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/scheduling-jobs-with-multiple-git-repos-on-a-single-job-cluster/m-p/110808#M43694</guid>
      <dc:creator>Brahmareddy</dc:creator>
      <dc:date>2025-02-21T03:46:23Z</dc:date>
    </item>
  </channel>
</rss>

