<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How do we create a job cluster in Databricks Asset Bundles for use across different jobs? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/107206#M42730</link>
    <description>&lt;P&gt;job_clusters:&lt;BR /&gt;- job_cluster_key: small_cluster&lt;BR /&gt;new_cluster:&lt;BR /&gt;spark_version: "7.3.x-scala2.12"&lt;BR /&gt;node_type_id: "i3.xlarge"&lt;BR /&gt;num_workers: 2&lt;BR /&gt;autotermination_minutes: 20&lt;BR /&gt;- job_cluster_key: large_cluster&lt;BR /&gt;new_cluster:&lt;BR /&gt;spark_version: "7.3.x-scala2.12"&lt;BR /&gt;node_type_id: "i3.2xlarge"&lt;BR /&gt;num_workers: 10&lt;BR /&gt;autotermination_minutes: 20&lt;/P&gt;&lt;P&gt;tasks:&lt;BR /&gt;- task_key: task1&lt;BR /&gt;job_cluster_key: small_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task1_notebook"&lt;BR /&gt;- task_key: task2&lt;BR /&gt;job_cluster_key: large_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task2_notebook"&lt;BR /&gt;- task_key: task3&lt;BR /&gt;job_cluster_key: small_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task3_notebook"&lt;/P&gt;</description>
    <pubDate>Mon, 27 Jan 2025 11:19:21 GMT</pubDate>
    <dc:creator>saurabh18cs</dc:creator>
    <dc:date>2025-01-27T11:19:21Z</dc:date>
    <item>
      <title>How do we create a job cluster in Databricks Asset Bundles for use across different jobs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/100991#M40505</link>
      <description>&lt;P&gt;When developing jobs on DABs, we use new_cluster to create a cluster for a particular job. I think it's a lot of lines and YAML when what I really need is a "small cluster" and "big cluster" to reference for certain kinds of jobs. Tags would be on the job and get propagated to the cluster.&lt;BR /&gt;&lt;BR /&gt;According to the dab-docs, we can create a cluster under&amp;nbsp;&lt;EM&gt;resources: clusters:&lt;/EM&gt; but surely we are not meant to use all-purpose clusters as a job cluster?&lt;/P&gt;&lt;P&gt;See the example here:&amp;nbsp;&lt;A href="https://docs.databricks.com/en/dev-tools/bundles/resources.html#cluster" target="_blank"&gt;https://docs.databricks.com/en/dev-tools/bundles/resources.html#cluster&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 04 Dec 2024 23:31:08 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/100991#M40505</guid>
      <dc:creator>oakhill</dc:creator>
      <dc:date>2024-12-04T23:31:08Z</dc:date>
    </item>
    <item>
      <title>Re: How do we create a job cluster in Databricks Asset Bundles for use across different jobs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/101035#M40519</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.databricks.com/t5/user/viewprofilepage/user-id/110230"&gt;@oakhill&lt;/a&gt;&amp;nbsp;,&lt;BR /&gt;&lt;BR /&gt;You can specify your job cluster configuration in your variables:&lt;/P&gt;&lt;LI-CODE lang="python"&gt;variables:
  small_cluster_id:
    description: "The small cluster with 2 workers used by the jobs"
    type: complex
    default:
      spark_version: "15.4.x-scala2.12"
      node_type_id: "Standard_D4ds_v5"
      num_workers: 2&lt;/LI-CODE&gt;&lt;P&gt;Now you can specify using this cluster in your jobs:&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;resources:
  jobs:
    my_job:
      name: my_job

      job_clusters:
        - job_cluster_key: small_cluster
          new_cluster: ${var.small_cluster_id}    &lt;/LI-CODE&gt;</description>
      <pubDate>Thu, 05 Dec 2024 08:56:11 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/101035#M40519</guid>
      <dc:creator>filipniziol</dc:creator>
      <dc:date>2024-12-05T08:56:11Z</dc:date>
    </item>
    <item>
      <title>Re: How do we create a job cluster in Databricks Asset Bundles for use across different jobs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/107150#M42712</link>
      <description>&lt;P&gt;Nice, this method allows us to reduce the redundancy to&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;      job_clusters:
        - job_cluster_key: small_cluster
          new_cluster: ${var.small_cluster_id}  &lt;/LI-CODE&gt;&lt;P&gt;which has to be repeated within each job definition. But this redundancy is still a lot! How can we define a job_cluster exactly once and refer to it by name / id? In other words, what is the job-cluster equivalent to the &lt;A href="https://docs.databricks.com/en/dev-tools/bundles/resources.html#cluster" target="_self"&gt;top-level resource cluster&lt;/A&gt;?&lt;/P&gt;</description>
      <pubDate>Mon, 27 Jan 2025 08:41:51 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/107150#M42712</guid>
      <dc:creator>jkb7</dc:creator>
      <dc:date>2025-01-27T08:41:51Z</dc:date>
    </item>
    <item>
      <title>Re: How do we create a job cluster in Databricks Asset Bundles for use across different jobs?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/107206#M42730</link>
      <description>&lt;P&gt;job_clusters:&lt;BR /&gt;- job_cluster_key: small_cluster&lt;BR /&gt;new_cluster:&lt;BR /&gt;spark_version: "7.3.x-scala2.12"&lt;BR /&gt;node_type_id: "i3.xlarge"&lt;BR /&gt;num_workers: 2&lt;BR /&gt;autotermination_minutes: 20&lt;BR /&gt;- job_cluster_key: large_cluster&lt;BR /&gt;new_cluster:&lt;BR /&gt;spark_version: "7.3.x-scala2.12"&lt;BR /&gt;node_type_id: "i3.2xlarge"&lt;BR /&gt;num_workers: 10&lt;BR /&gt;autotermination_minutes: 20&lt;/P&gt;&lt;P&gt;tasks:&lt;BR /&gt;- task_key: task1&lt;BR /&gt;job_cluster_key: small_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task1_notebook"&lt;BR /&gt;- task_key: task2&lt;BR /&gt;job_cluster_key: large_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task2_notebook"&lt;BR /&gt;- task_key: task3&lt;BR /&gt;job_cluster_key: small_cluster&lt;BR /&gt;notebook_task:&lt;BR /&gt;notebook_path: "/Users/your_user/task3_notebook"&lt;/P&gt;</description>
      <pubDate>Mon, 27 Jan 2025 11:19:21 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-do-we-create-a-job-cluster-in-databricks-asset-bundles-for/m-p/107206#M42730</guid>
      <dc:creator>saurabh18cs</dc:creator>
      <dc:date>2025-01-27T11:19:21Z</dc:date>
    </item>
  </channel>
</rss>

