<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>topic SCD type2 snowflake in Data Engineering</title>
    <link>https://community.databricks.com/t5/data-engineering/scd-type2-snowflake/m-p/32549#M23724</link>
    <description>&lt;P&gt;I have monthly files which comes in S3 bucket. I want to implement SCD type2 in snowflake.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am ok to read the new files, clean it.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;My question is about comparing what I have read from the files, with what is stored in the snowflake table already(millions of records) and capturing the change.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Main question:&lt;/P&gt;&lt;P&gt;How to join the snowflake table to the view created from the monthly file.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;1)I can read the snowflake table in data bricks like select * and can create a view and do the processing.&lt;/P&gt;&lt;P&gt;I am sure this is now how it's done in production.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Any pointers on how to solve the problem?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
    <pubDate>Mon, 05 Sep 2022 10:03:10 GMT</pubDate>
    <dc:creator>sabooalex</dc:creator>
    <dc:date>2022-09-05T10:03:10Z</dc:date>
    <item>
      <title>SCD type2 snowflake</title>
      <link>https://community.databricks.com/t5/data-engineering/scd-type2-snowflake/m-p/32549#M23724</link>
      <description>&lt;P&gt;I have monthly files which comes in S3 bucket. I want to implement SCD type2 in snowflake.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;I am ok to read the new files, clean it.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;My question is about comparing what I have read from the files, with what is stored in the snowflake table already(millions of records) and capturing the change.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Main question:&lt;/P&gt;&lt;P&gt;How to join the snowflake table to the view created from the monthly file.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;1)I can read the snowflake table in data bricks like select * and can create a view and do the processing.&lt;/P&gt;&lt;P&gt;I am sure this is now how it's done in production.&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;Any pointers on how to solve the problem?&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 05 Sep 2022 10:03:10 GMT</pubDate>
      <guid>https://community.databricks.com/t5/data-engineering/scd-type2-snowflake/m-p/32549#M23724</guid>
      <dc:creator>sabooalex</dc:creator>
      <dc:date>2022-09-05T10:03:10Z</dc:date>
    </item>
  </channel>
</rss>

