当前位置:   article > 正文

Explore Synapse

Explore Synapse

# Delete any existing dp-203 folder (recursive, forced) so the clone starts clean.
rm -r dp-203 -f

# Clone the lab repository into a local folder named dp-203.
git clone https://github.com/MicrosoftLearning/dp-203-azure-data-engineer dp-203

# Move into the folder for lab 01.
cd dp-203/Allfiles/labs/01

# Run the lab's setup script. Its contents are not shown here; presumably it
# provisions the resources the later queries use — verify before running.
./setup.ps1

  -- Preview the first 100 rows of products.csv directly from the data lake.
  -- No HEADER_ROW option is passed to the CSV reader in this version.
  SELECT TOP 100
      *
  FROM OPENROWSET(
      BULK 'https://datalakexxxxxxx.dfs.core.windows.net/files/product_data/products.csv',
      FORMAT = 'CSV',
      PARSER_VERSION = '2.0'
  ) AS [product_rows];

  -- Preview the first 100 rows of products.csv, this time with
  -- HEADER_ROW = TRUE set on the CSV reader.
  SELECT TOP 100
      *
  FROM OPENROWSET(
      BULK 'https://datalakexxxxxxx.dfs.core.windows.net/files/product_data/products.csv',
      FORMAT = 'CSV',
      PARSER_VERSION = '2.0',
      HEADER_ROW = TRUE
  ) AS [product_rows];

  -- Count the rows of products.csv for each Category value.
  -- HEADER_ROW = TRUE is required here so that Category resolves as a column name.
  SELECT
      [product_rows].Category,
      COUNT(*) AS ProductCount
  FROM OPENROWSET(
      BULK 'https://datalakexxxxxxx.dfs.core.windows.net/files/product_data/products.csv',
      FORMAT = 'CSV',
      PARSER_VERSION = '2.0',
      HEADER_ROW = TRUE
  ) AS [product_rows]
  GROUP BY
      [product_rows].Category;

  1. %%pyspark
  2. df = spark.read.load('abfss://files@datalakexxxxxxx.dfs.core.windows.net/product_data/products.csv', format='csv'
  3. ## If header exists uncomment line below
  4. ##, header=True
  5. )
  6. display(df.limit(10))

  1. %%pyspark
  2. df = spark.read.load('abfss://files@datalakexxxxxxx.dfs.core.windows.net/product_data/products.csv', format='csv'
  3. ## If header exists uncomment line below
  4. , header=True
  5. )
  6. display(df.limit(10))

  # Count the rows of df for each Category value and show the result.
  df_counts = df.groupBy('Category').count()
  display(df_counts)

  -- Total units sold per product for each calendar year and month.
  SELECT
      d.CalendarYear,
      d.MonthNumberOfYear,
      d.EnglishMonthName,
      p.EnglishProductName AS Product,
      SUM(o.OrderQuantity) AS UnitsSold
  FROM dbo.FactInternetSales AS o
  INNER JOIN dbo.DimDate AS d
      ON o.OrderDateKey = d.DateKey
  INNER JOIN dbo.DimProduct AS p
      ON o.ProductKey = p.ProductKey
  GROUP BY
      d.CalendarYear,
      d.MonthNumberOfYear,
      d.EnglishMonthName,
      p.EnglishProductName
  -- Month number remains the leading sort key. Year and product name are added
  -- as tie-breakers: sorting by month number alone leaves the order of rows
  -- that share a month (other years, other products) unspecified.
  ORDER BY
      d.MonthNumberOfYear,
      d.CalendarYear,
      p.EnglishProductName;

声明:本文内容由网友自发贡献,不代表【wpsshop博客】立场,版权归原作者所有,本站不承担相应法律责任。如您发现有侵权的内容,请联系我们。转载请注明出处:https://www.wpsshop.cn/w/从前慢现在也慢/article/detail/796423
推荐阅读
相关标签
  

闽ICP备14008679号