<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Configure job to use one cluster instance to multiple jobs in Get Started Discussions</title>
    <link>https://community.databricks.com/t5/get-started-discussions/configure-job-to-use-one-cluster-instance-to-multiple-jobs/m-p/38782#M5596</link>
    <description>&lt;P&gt;Hi! I have several tiny jobs that run in parallel, and I want them to run on the same cluster:&lt;/P&gt;&lt;P&gt;- Task type Python Script: I send the parameters this way to run the PySpark scripts.&lt;/P&gt;&lt;P&gt;- Job compute cluster created as shown below (JSON copied from the Databricks Job UI)&lt;/P&gt;&lt;P&gt;How can I make it so that, if I submit 5 jobs, they all run on the same cluster instance instead of instantiating 5 clusters?&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;{
    "num_workers": 2,
    "cluster_name": "",
    "spark_version": "12.2.x-scala2.12",
    "spark_conf": {},
    "aws_attributes": {
        "first_on_demand": 1,
        "availability": "SPOT_WITH_FALLBACK",
        "zone_id": "us-east-1d",
        "instance_profile_arn": "xxxx",
        "spot_bid_price_percent": 80,
        "ebs_volume_type": "GENERAL_PURPOSE_SSD",
        "ebs_volume_count": 1,
        "ebs_volume_size": 100
    },
    "node_type_id": "c5.2xlarge",
    "driver_node_type_id": "m5a.large",
    "ssh_public_keys": [],
    "spark_env_vars": {},
    "enable_elastic_disk": false,
    "cluster_source": "JOB",
    "init_scripts": [],
    "data_security_mode": "NONE"
}&lt;/LI-CODE&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
    <pubDate>Mon, 31 Jul 2023 14:26:55 GMT</pubDate>
    <dc:creator>alejandrofm</dc:creator>
    <dc:date>2023-07-31T14:26:55Z</dc:date>
    <item>
      <title>Configure job to use one cluster instance to multiple jobs</title>
      <link>https://community.databricks.com/t5/get-started-discussions/configure-job-to-use-one-cluster-instance-to-multiple-jobs/m-p/38782#M5596</link>
      <description>&lt;P&gt;Hi! I have several tiny jobs that run in parallel, and I want them to run on the same cluster:&lt;/P&gt;&lt;P&gt;- Task type Python Script: I send the parameters this way to run the PySpark scripts.&lt;/P&gt;&lt;P&gt;- Job compute cluster created as shown below (JSON copied from the Databricks Job UI)&lt;/P&gt;&lt;P&gt;How can I make it so that, if I submit 5 jobs, they all run on the same cluster instance instead of instantiating 5 clusters?&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;{
    "num_workers": 2,
    "cluster_name": "",
    "spark_version": "12.2.x-scala2.12",
    "spark_conf": {},
    "aws_attributes": {
        "first_on_demand": 1,
        "availability": "SPOT_WITH_FALLBACK",
        "zone_id": "us-east-1d",
        "instance_profile_arn": "xxxx",
        "spot_bid_price_percent": 80,
        "ebs_volume_type": "GENERAL_PURPOSE_SSD",
        "ebs_volume_count": 1,
        "ebs_volume_size": 100
    },
    "node_type_id": "c5.2xlarge",
    "driver_node_type_id": "m5a.large",
    "ssh_public_keys": [],
    "spark_env_vars": {},
    "enable_elastic_disk": false,
    "cluster_source": "JOB",
    "init_scripts": [],
    "data_security_mode": "NONE"
}&lt;/LI-CODE&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Mon, 31 Jul 2023 14:26:55 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/configure-job-to-use-one-cluster-instance-to-multiple-jobs/m-p/38782#M5596</guid>
      <dc:creator>alejandrofm</dc:creator>
      <dc:date>2023-07-31T14:26:55Z</dc:date>
    </item>
    <item>
      <title>Re: Configure job to use one cluster instance to multiple jobs</title>
      <link>https://community.databricks.com/t5/get-started-discussions/configure-job-to-use-one-cluster-instance-to-multiple-jobs/m-p/39155#M5597</link>
      <description>&lt;P&gt;Unfortunately, running multiple jobs in parallel using a single job cluster is not supported (yet). New in Databricks is the possibility to create a job that orchestrates multiple jobs. These jobs will, however, still use their own cluster (configuration).&lt;/P&gt;&lt;P&gt;If instantiating a cluster takes much longer than executing the actual job, you could consider using an `all-purpose` cluster. Depending on your use case, it might also be possible to rewrite/reconfigure your 5 jobs into a single job with 5 tasks.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 04 Aug 2023 15:16:15 GMT</pubDate>
      <guid>https://community.databricks.com/t5/get-started-discussions/configure-job-to-use-one-cluster-instance-to-multiple-jobs/m-p/39155#M5597</guid>
      <dc:creator>KoenZandvliet</dc:creator>
      <dc:date>2023-08-04T15:16:15Z</dc:date>
    </item>
  </channel>
</rss>

