You are viewing a plain text version of this content. The canonical link for it is here.
Posted to commits@hudi.apache.org by bh...@apache.org on 2023/03/27 18:30:43 UTC

[hudi] branch asf-site updated: Update community content 03242023 (#8291)

This is an automated email from the ASF dual-hosted git repository.

bhavanisudha pushed a commit to branch asf-site
in repository https://gitbox.apache.org/repos/asf/hudi.git


The following commit(s) were added to refs/heads/asf-site by this push:
     new 5e634de29fb Update community content 03242023 (#8291)
5e634de29fb is described below

commit 5e634de29fb66bc0548fd260026a297bf4b01752
Author: nadine farah <nf...@gmail.com>
AuthorDate: Mon Mar 27 11:30:33 2023 -0700

    Update community content 03242023 (#8291)
    
    * added hudi videos and blogs
    
    added aws technical blog
    
    updated file names and pics
    
    * updated content based on sudha's feedback
---
 .../2022-12-01-Run-apache-hudi-at-scale-on-aws.mdx |  19 ++++++++
 ...tion-at-scale-with-apache-hudi-in-aws-glue.mdx} |   6 ++-
 ...tion-with-Incremental-ETL-Using-Apache-Hudi.mdx |  19 ++++++++
 ...-Spark-Part-2-AWS-Glue-Studio-Visual-Editor.mdx |  16 +++++++
 website/src/pages/videos.md                        |  49 +++++++++++++++++++--
 ...ution-at-scale-with-apache-hudi-in-aws-glue.png | Bin
 .../blog/hudi-lakehouse-architecture-uber.png      | Bin 0 -> 428455 bytes
 .../blog/native-support-hudi-for-glue-studio.png   | Bin 0 -> 418820 bytes
 .../images/blog/run-hudi-at-scale-on-aws.png       | Bin 0 -> 523728 bytes
 9 files changed, 104 insertions(+), 5 deletions(-)

diff --git a/website/blog/2022-12-01-Run-apache-hudi-at-scale-on-aws.mdx b/website/blog/2022-12-01-Run-apache-hudi-at-scale-on-aws.mdx
new file mode 100644
index 00000000000..1c81b8240c2
--- /dev/null
+++ b/website/blog/2022-12-01-Run-apache-hudi-at-scale-on-aws.mdx
@@ -0,0 +1,19 @@
+---
+title: "Run Apache Hudi at scale on AWS"
+authors: 
+- name: Imtiaz Sayed
+- name: Shana Schipers
+- name: Dylan Qu
+- name: Carlos Rodrigues
+- name: Arun A K 
+- name: Francisco Morillo
+category: technical guide
+image: /assets/images/blog/run-hudi-at-scale-on-aws.png
+tags:
+- aws 
+- guide
+- hudi
+---
+import Redirect from '@site/src/components/Redirect';
+
+<Redirect url="https://pages.awscloud.com/GLOBAL-devadopt-DL-Apache-Hudi-Technical-Guide-2023-learn.html?sc_channel=sm&sc_campaign=DB_Blog&sc_publisher=LINKEDIN&sc_geo=GLOBAL&sc_outcome=awareness&trk=DB_Blog&linkId=205888417/">Redirecting... please wait!! </Redirect>
diff --git a/website/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx b/website/blog/2023-02-07-automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx
similarity index 87%
rename from website/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx
rename to website/blog/2023-02-07-automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx
index bf2c3de0960..92b419c7b6d 100644
--- a/website/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx
+++ b/website/blog/2023-02-07-automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.mdx
@@ -1,7 +1,9 @@
 ---
 title: "Automate schema evolution at scale with Apache Hudi in AWS Glue | Amazon Web Services"
-authors:
-- name: Subhro Bose, Eva Fang and Ketan Karalkar
+authors: 
+- name: Subhro Bose
+- name: Eva Fang
+- name: Ketan Karalkar
 category: blog
 image: /assets/images/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.png
 tags:
diff --git a/website/blog/2023-03-16-Setting-Uber-Transactional-Data-Lake-in-Motion-with-Incremental-ETL-Using-Apache-Hudi.mdx b/website/blog/2023-03-16-Setting-Uber-Transactional-Data-Lake-in-Motion-with-Incremental-ETL-Using-Apache-Hudi.mdx
new file mode 100644
index 00000000000..ccd88bf7c5e
--- /dev/null
+++ b/website/blog/2023-03-16-Setting-Uber-Transactional-Data-Lake-in-Motion-with-Incremental-ETL-Using-Apache-Hudi.mdx
@@ -0,0 +1,19 @@
+
+---
+title: "Setting Uber’s Transactional Data Lake in Motion with Incremental ETL Using Apache Hudi"
+authors: 
+- name: Vinoth Govindarajan
+- name: Saketh Chintapalli
+- name: Yogesh Saswade
+- name: Aayush Bareja
+category: blog
+image: /assets/images/blog/hudi-lakehouse-architecture-uber.png
+tags:
+- incremental pipeline
+- datalake
+- hudi
+- medallion architecture
+---
+import Redirect from '@site/src/components/Redirect';
+
+<Redirect url="https://www.uber.com/blog/ubers-lakehouse-architecture/">Redirecting... please wait!! </Redirect>
diff --git a/website/blog/2023-03-20-Introducing-native-support-for-Apache Hudi-Delta-Lake-and-Apache-Iceberg-on-AWS-Glue-for-Apache-Spark-Part-2-AWS-Glue-Studio-Visual-Editor.mdx b/website/blog/2023-03-20-Introducing-native-support-for-Apache Hudi-Delta-Lake-and-Apache-Iceberg-on-AWS-Glue-for-Apache-Spark-Part-2-AWS-Glue-Studio-Visual-Editor.mdx
new file mode 100644
index 00000000000..b233e6bcf01
--- /dev/null
+++ b/website/blog/2023-03-20-Introducing-native-support-for-Apache Hudi-Delta-Lake-and-Apache-Iceberg-on-AWS-Glue-for-Apache-Spark-Part-2-AWS-Glue-Studio-Visual-Editor.mdx	
@@ -0,0 +1,16 @@
+---
+title: "Introducing native support for Apache Hudi, Delta Lake, and Apache Iceberg on AWS Glue for Apache Spark, Part 2: AWS Glue Studio Visual Editor"
+authors: 
+- name: Noritaka Sekiyama
+- name: Scott Long
+- name: Sean Ma
+category: blog
+image: /assets/images/blog/native-support-hudi-for-glue-studio.png
+tags:
+- aws glue
+- glue studio
+- hudi
+---
+import Redirect from '@site/src/components/Redirect';
+
+<Redirect url="https://aws.amazon.com/blogs/big-data/part-2-glue-studio-visual-editor-introducing-native-support-for-apache-hudi-delta-lake-and-apache-iceberg-on-aws-glue-for-apache-spark/">Redirecting... please wait!! </Redirect>
diff --git a/website/src/pages/videos.md b/website/src/pages/videos.md
index 539e9d9b514..a3ce0cce5a0 100644
--- a/website/src/pages/videos.md
+++ b/website/src/pages/videos.md
@@ -114,8 +114,51 @@ last_modified_at: 2022-12-21T15:59:57-04:00
 
 37. [How do I identify Schema Changes in Hudi Tables and Send Email Alert when New Column added/removed](https://www.youtube.com/watch?v=_i5G4ojpwlk) - By Soumil Shah, Jan 20th 2023
 
-38. [How to detect and Mask PII data in Apache Hudi Data Lake | Hands on Lab](https://www.youtube.com/watch?v=l4RG9CP5LTM) - By Soumil Shah, Jan 21st 2023
+38. [How to detect and Mask PII data in Apache Hudi Data Lake | Hands on Lab](https://www.youtube.com/watch?v=l4RG9CP5LTM) - By Soumil Shah, Jan 21st 2023
 
-39. [Learn How to restrict Intern from accessing Certain Column in Hudi Datalake with lake Formation](https://www.youtube.com/watch?v=yPmdCdPT8jo) - By Soumil Shah, Jan 28th 2023
+39. [Writing data quality and validation scripts for a Hudi data lake with AWS Glue and pydeequ| Hands on Lab](https://www.youtube.com/watch?v=1us5YD2lDZw) - By Soumil Shah, Jan 23rd 2023
+
+40. [Learn How to restrict Intern from accessing Certain Column in Hudi Datalake with lake Formation](https://www.youtube.com/watch?v=yPmdCdPT8jo) - By Soumil Shah, Jan 28th 2023
+
+41. [How do I Ingest Extremely Small Files into Hudi Data lake with Glue Incremental data processing](https://www.youtube.com/watch?v=BvoLVeidd-0) - By Soumil Shah, Feb 7th 2023
+
+42. [Create Your Hudi Transaction Datalake on S3 with EMR Serverless for Beginners in fun and easy way](https://www.youtube.com/watch?v=oBoCPaw_kjE) - By Soumil Shah, Feb 11th 2023
+
+43. [Streaming Ingestion from MongoDB into Hudi with Glue, kinesis&Event bridge&MongoStream Hands on labs](https://www.youtube.com/watch?v=yfZx1P9ovxA) - By Soumil Shah, Feb 18th 2023
+
+44. [Apache Hudi Bulk Insert Sort Modes a summary of two incredible blogs](https://www.youtube.com/watch?v=AuZoREO8_zs) - By Soumil Shah, Feb 21st 2023
+
+45. [Apache Hudi Bulk Insert Sort Modes a summary of two incredible blogs](https://www.youtube.com/watch?v=AuZoREO8_zs) - By Soumil Shah, Feb 21st 2023
+
+46. [Use Glue 4.0 to take regular save points for your Hudi tables for backup or disaster Recovery](https://www.youtube.com/watch?v=VgIMPSK7rFA) - By Soumil Shah, Feb 22nd 2023
+
+47. [RFC-51 Change Data Capture in Apache Hudi like Debezium and AWS DMS Hands on Labs](https://www.youtube.com/watch?v=n6D_es6RmHM) - By Soumil Shah, Feb 25th 2023
+
+48. [Python helper class which makes querying incremental data from Hudi Data lakes easy](https://www.youtube.com/watch?v=Ls--9CnweoY) - By Soumil Shah, Feb 26th 2023
+
+49. [Develop Incremental Pipeline with CDC from Hudi to Aurora Postgres | Demo Video](https://www.youtube.com/watch?v=Wy2I1PwIj2A) - By Soumil Shah, Mar 4th 2023
+
+50. [Power your Down Stream ElasticSearch Stack From Apache Hudi Transaction Datalake with CDC|Demo Video](https://www.youtube.com/watch?v=JQmPbHP8cMQ) - By Soumil Shah, Mar 6th 2023
+
+51. [Power your Down Stream Elastic Search Stack From Apache Hudi Transaction Datalake with CDC|DeepDive](https://www.youtube.com/watch?v=rr2V5xhgPeM) - By Soumil Shah, Mar 6th 2023
+
+52. [How to Rollback to Previous Checkpoint during Disaster in Apache Hudi using Glue 4.0 Demo](https://www.youtube.com/watch?v=Vi25q4vzogs) - By Soumil Shah, Mar 7th 2023
+
+53. [How do I read data from Cross Account S3 Buckets and Build Hudi Datalake in Datateam Account](https://www.youtube.com/watch?v=q5Q5MUkXnSE) - By Soumil Shah, Mar 11th 2023
+
+54. [Query cross-account Hudi Glue Data Catalogs using Amazon Athena](https://www.youtube.com/watch?v=6ubAw9RpNZ8) - By Soumil Shah, Mar 11th 2023
+
+55. [Learn About Bucket Index (SIMPLE) In Apache Hudi with lab](https://www.youtube.com/watch?v=lOQFUrfJFP4) - By Soumil Shah, Mar 15th 2023
+
+56. [Setting Uber’s Transactional Data Lake in Motion with Incremental ETL Using Apache Hudi](https://www.youtube.com/watch?v=PvlO_s1pOLQ) - By Soumil Shah, Mar 17th 2023
+
+57. [Push Hudi Commit Notification TO HTTP URI with Callback](https://www.youtube.com/watch?v=dX5ENGnL4cA) - By Soumil Shah, Mar 18th 2023
+
+58. [RFC - 18: Insert Overwrite in Apache Hudi with Example](https://www.youtube.com/watch?v=BKfKfn0h92M) - By Soumil Shah, Mar 19th 2023
+
+59. [RFC 42: Consistent Hashing in Apache Hudi MOR Tables](https://www.youtube.com/watch?v=zN8JOBKXxP0) - By Soumil Shah, Mar 21st 2023
+
+60. [Data Analysis for Apache Hudi Blogs on Medium with Pandas](https://www.youtube.com/watch?v=a7FD4zIOwVg) - By Soumil Shah, Mar 24th 2023
+
+61. [How to scrape all Blogs about a topic from medium like pro with Python](https://www.youtube.com/watch?v=-KUSaC_1X6M) - By Soumil Shah, Mar 24th 2023
 
-40. [How do I Ingest Extremely Small Files into Hudi Data lake with Glue Incremental data processing](https://www.youtube.com/watch?v=BvoLVeidd-0) - By Soumil Shah, Feb 7th 2023
diff --git a/website/static/assets/images/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.png b/website/static/assets/images/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.png
similarity index 100%
rename from website/static/assets/images/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.png
rename to website/static/assets/images/blog/automate-schema-evolution-at-scale-with-apache-hudi-in-aws-glue.png
diff --git a/website/static/assets/images/blog/hudi-lakehouse-architecture-uber.png b/website/static/assets/images/blog/hudi-lakehouse-architecture-uber.png
new file mode 100644
index 00000000000..0d9fc4a4cb4
Binary files /dev/null and b/website/static/assets/images/blog/hudi-lakehouse-architecture-uber.png differ
diff --git a/website/static/assets/images/blog/native-support-hudi-for-glue-studio.png b/website/static/assets/images/blog/native-support-hudi-for-glue-studio.png
new file mode 100644
index 00000000000..248883086c0
Binary files /dev/null and b/website/static/assets/images/blog/native-support-hudi-for-glue-studio.png differ
diff --git a/website/static/assets/images/blog/run-hudi-at-scale-on-aws.png b/website/static/assets/images/blog/run-hudi-at-scale-on-aws.png
new file mode 100644
index 00000000000..a7497a47c7e
Binary files /dev/null and b/website/static/assets/images/blog/run-hudi-at-scale-on-aws.png differ