<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic Re: How can I extract data from different sources and transform it into a fresh, reliable data pipeline? in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20204#M13625</link>
    <description>&lt;P&gt;Thanks for this.&lt;/P&gt;</description>
    <pubDate>Mon, 05 Dec 2022 03:47:03 GMT</pubDate>
    <dc:creator>Aj2</dc:creator>
    <dc:date>2022-12-05T03:47:03Z</dc:date>
    <item>
      <title>How can I extract data from different sources and transform it into a fresh, reliable data pipeline?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20201#M13622</link>
      <description>&lt;P&gt;&lt;I&gt;Tip: These steps are built out for AWS accounts and workspaces that are using &lt;/I&gt;&lt;A href="https://docs.databricks.com/delta/index.html" alt="https://docs.databricks.com/delta/index.html" target="_blank"&gt;&lt;I&gt;&lt;U&gt;Delta Lake&lt;/U&gt;&lt;/I&gt;&lt;/A&gt;&lt;I&gt;. If you would like to learn more &lt;/I&gt;&lt;A href="https://www.youtube.com/watch?v=PftRBoqjhZM&amp;amp;t=62s" alt="https://www.youtube.com/watch?v=PftRBoqjhZM&amp;amp;t=62s" target="_blank"&gt;&lt;I&gt;&lt;U&gt;watch this video&lt;/U&gt;&lt;/I&gt;&lt;/A&gt;&lt;I&gt; and reach out to your &lt;/I&gt;&lt;A href="https://www.databricks.com/company/contact?_ga=2.126171338.659321187.1669655549-630542707.1661985352" alt="https://www.databricks.com/company/contact?_ga=2.126171338.659321187.1669655549-630542707.1661985352" target="_blank"&gt;&lt;I&gt;&lt;U&gt;Databricks sales representative&lt;/U&gt; &lt;/I&gt;&lt;/A&gt;&lt;I&gt;for more information.&lt;/I&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 1:&lt;/B&gt; &lt;A href="https://docs.databricks.com/notebooks/notebooks-manage.html?&amp;amp;_ga=2.126171338.659321187.1669655549-630542707.1661985352#create-a-notebook-in-any-folder" alt="https://docs.databricks.com/notebooks/notebooks-manage.html?&amp;amp;_ga=2.126171338.659321187.1669655549-630542707.1661985352#create-a-notebook-in-any-folder" target="_blank"&gt;&lt;U&gt;Create&lt;/U&gt;&lt;/A&gt; your own notebook or use an existing notebook&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Watch this &lt;A href="https://youtu.be/3-ZqCKScQqM" alt="https://youtu.be/3-ZqCKScQqM" target="_blank"&gt;quick video&lt;/A&gt; &lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 2:&lt;/B&gt; Ensure your data is &lt;A href="https://docs.databricks.com/ingestion/index.html" alt="https://docs.databricks.com/ingestion/index.html" target="_blank"&gt;&lt;U&gt;ingested&lt;/U&gt;&lt;/A&gt; into the lakehouse&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 3:&lt;/B&gt; 
Efficiently &lt;A href="https://docs.databricks.com/delta/tutorial.html#read-a-table" alt="https://docs.databricks.com/delta/tutorial.html#read-a-table" target="_blank"&gt;&lt;U&gt;read&lt;/U&gt;&lt;/A&gt; and &lt;A href="https://docs.databricks.com/delta/tutorial.html?searchString=&amp;amp;from=0&amp;amp;sortby=_score&amp;amp;orderBy=desc&amp;amp;pageNo=1&amp;amp;aggregations=%5B%5D&amp;amp;uid=7dc8d13f-90bb-11e9-98a5-06d762ad9a62&amp;amp;resultsPerPage=10&amp;amp;exactPhrase=&amp;amp;withOneOrMore=&amp;amp;withoutTheWords=&amp;amp;pageSize=10&amp;amp;language=en&amp;amp;state=1&amp;amp;suCaseCreate=false#write-to-a-table" alt="https://docs.databricks.com/delta/tutorial.html?searchString=&amp;amp;from=0&amp;amp;sortby=_score&amp;amp;orderBy=desc&amp;amp;pageNo=1&amp;amp;aggregations=%5B%5D&amp;amp;uid=7dc8d13f-90bb-11e9-98a5-06d762ad9a62&amp;amp;resultsPerPage=10&amp;amp;exactPhrase=&amp;amp;withOneOrMore=&amp;amp;withoutTheWords=&amp;amp;pageSize=10&amp;amp;language=en&amp;amp;state=1&amp;amp;suCaseCreate=false#write-to-a-table" target="_blank"&gt;&lt;U&gt;write your data&lt;/U&gt;&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 4:&lt;/B&gt; Automate your notebook with a &lt;A href="https://docs.databricks.com/workflows/jobs/jobs-quickstart.html" alt="https://docs.databricks.com/workflows/jobs/jobs-quickstart.html" target="_blank"&gt;&lt;U&gt;job&lt;/U&gt;&lt;/A&gt;&lt;/P&gt;&lt;UL&gt;&lt;LI&gt;Watch this &lt;A href="https://youtu.be/MWGmsnnaGLY" alt="https://youtu.be/MWGmsnnaGLY" target="_blank"&gt;quick video&lt;/A&gt;&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 5:&lt;/B&gt; Run your job interactively or on a&lt;A href="https://docs.databricks.com/workflows/jobs/jobs.html#schedule-a-job" alt="https://docs.databricks.com/workflows/jobs/jobs.html#schedule-a-job" target="_blank"&gt; &lt;U&gt;schedule&lt;/U&gt;&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;B&gt;Step 6:&lt;/B&gt; Further optimize your data pipeline with &lt;A 
href="https://docs.databricks.com/sql/language-manual/delta-optimize.html" alt="https://docs.databricks.com/sql/language-manual/delta-optimize.html" target="_blank"&gt;&lt;U&gt;delta write optimize&lt;/U&gt;&lt;/A&gt; &amp;amp; &lt;A href="https://docs.databricks.com/workflows/jobs/jobs-api-updates.html" alt="https://docs.databricks.com/workflows/jobs/jobs-api-updates.html" target="_blank"&gt;&lt;U&gt;multi-task jobs&lt;/U&gt;&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;If you'd like to learn more, sign up for the &lt;A href="https://customer-academy.databricks.com/learn/course/62/data-engineering-with-databricks-v2" alt="https://customer-academy.databricks.com/learn/course/62/data-engineering-with-databricks-v2" target="_blank"&gt;&lt;U&gt;Databricks Data Engineering Databricks Academy course&lt;/U&gt;&lt;/A&gt; and get your &lt;A href="https://customer-academy.databricks.com/learn/course/833/certification-overview-databricks-certified-data-engineer-associate-exam?generated_by=13390&amp;amp;hash=699a89c44e0cc3fc8db1ac6bdf191d813f9f5d91" alt="https://customer-academy.databricks.com/learn/course/833/certification-overview-databricks-certified-data-engineer-associate-exam?generated_by=13390&amp;amp;hash=699a89c44e0cc3fc8db1ac6bdf191d813f9f5d91" target="_blank"&gt;&lt;U&gt;Data Engineering Certification&lt;/U&gt;&lt;/A&gt;.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Need more help? Get hands-on with building data pipelines by attending the &lt;A href="https://customer-academy.databricks.com/learn/course/1310/data-engineering-activation-day?ge[…]=249103&amp;amp;hash=d20b1d6f9dddedde49b54ddc6eff9d13586a04b4" alt="https://customer-academy.databricks.com/learn/course/1310/data-engineering-activation-day?ge[…]=249103&amp;amp;hash=d20b1d6f9dddedde49b54ddc6eff9d13586a04b4" target="_blank"&gt;&lt;B&gt;&lt;U&gt;Data Engineering Activation Day on December 6, 2022, at 9 AM PT&lt;/U&gt;&lt;/B&gt;&lt;/A&gt;. 
Whether you are just getting started ingesting data or you are ready to automate your data pipeline, our Databricks experts will walk you through each step of the way with ample time for your questions.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;In this session, you’ll see demos and learn:&lt;/P&gt;&lt;P&gt;- How to quickly create your own notebook&lt;/P&gt;&lt;P&gt;- All ways to ingest your data&lt;/P&gt;&lt;P&gt;- Best practices to read and write your data&lt;/P&gt;&lt;P&gt;- Automated ways to run your commands with Jobs&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Notebooks will be provided so you can follow along live or review the best practices at your own pace.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 28 Nov 2022 20:04:54 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20201#M13622</guid>
      <dc:creator>User16835756816</dc:creator>
      <dc:date>2022-11-28T20:04:54Z</dc:date>
    </item>
    <item>
      <title>Re: How can I extract data from different sources and transform it into a fresh, reliable data pipeline?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20202#M13623</link>
      <description>&lt;P&gt;thanks man&lt;/P&gt;</description>
      <pubDate>Fri, 02 Dec 2022 09:44:02 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20202#M13623</guid>
      <dc:creator>Aviral-Bhardwaj</dc:creator>
      <dc:date>2022-12-02T09:44:02Z</dc:date>
    </item>
    <item>
      <title>Re: How can I extract data from different sources and transform it into a fresh, reliable data pipeline?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20203#M13624</link>
      <description>&lt;P&gt;If you are using Azure Databricks, prefer ADF Pipelines for ETL.&lt;/P&gt;</description>
      <pubDate>Fri, 02 Dec 2022 12:09:36 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20203#M13624</guid>
      <dc:creator>Own</dc:creator>
      <dc:date>2022-12-02T12:09:36Z</dc:date>
    </item>
    <item>
      <title>Re: How can I extract data from different sources and transform it into a fresh, reliable data pipeline?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20204#M13625</link>
      <description>&lt;P&gt;Thanks for this.&lt;/P&gt;</description>
      <pubDate>Mon, 05 Dec 2022 03:47:03 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20204#M13625</guid>
      <dc:creator>Aj2</dc:creator>
      <dc:date>2022-12-05T03:47:03Z</dc:date>
    </item>
    <item>
      <title>Re: How can I extract data from different sources and transform it into a fresh, reliable data pipeline?</title>
      <link>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20205#M13626</link>
      <description>&lt;P&gt;Thanks @Nithya Thangaraj&lt;/P&gt;</description>
      <pubDate>Mon, 05 Dec 2022 07:02:29 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/how-can-i-extract-data-from-different-sources-and-transform-it/m-p/20205#M13626</guid>
      <dc:creator>Ajay-Pandey</dc:creator>
      <dc:date>2022-12-05T07:02:29Z</dc:date>
    </item>
  </channel>
</rss>

