Skip to content

Latest commit

 

History

History
107 lines (81 loc) · 5.97 KB

File metadata and controls

107 lines (81 loc) · 5.97 KB

Data

Raw

  • See the data/raw directory for all raw product sales data. Each file is in CSV format, and each entry follows the Spark schema below:
root
 |-- ProductName: string (nullable = true)
 |-- Category: string (nullable = true)
 |-- Price: double (nullable = true)
 |-- Quantity: integer (nullable = true)
 |-- Date: date (nullable = true)

Aggregation

root
 |-- TotalSalesQuantity: long (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- TotalSalesDay: long (nullable = false)
root
 |-- Category: string (nullable = true)
 |-- TotalSalesQuantity: long (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- TotalSalesDay: long (nullable = false)
root
 |-- Date: date (nullable = true)
 |-- TotalSalesQuantity: long (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
root
 |-- ProductName: string (nullable = true)
 |-- TotalSalesQuantity: long (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- TotalSalesDay: long (nullable = false)
 |-- AverageSellingPrice: double (nullable = true)

Running Total

root
 |-- Date: date (nullable = true)
 |-- TotalSalesQuantity: integer (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- RunningTotalSalesQuantity: long (nullable = true)
 |-- RunningTotalSalesAmount: double (nullable = true)
root
 |-- Date: date (nullable = true)
 |-- TotalSalesQuantity: integer (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- RunningTotalSalesQuantity: long (nullable = true)
 |-- RunningTotalSalesAmount: double (nullable = true)

Rolling Average

root
 |-- Date: date (nullable = true)
 |-- TotalSalesQuantity: integer (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- RollingAverageSalesQuantity: double (nullable = true)
 |-- RollingAverageSalesAmount: double (nullable = true)
root
 |-- Date: date (nullable = true)
 |-- TotalSalesQuantity: integer (nullable = true)
 |-- TotalSalesAmount: double (nullable = true)
 |-- RollingAverageSalesQuantity: double (nullable = true)
 |-- RollingAverageSalesAmount: double (nullable = true)