// Listing metadata carried over from the file viewer: 31 lines, 760 B, plaintext.
// Read the '|'-delimited catalog_page files into @raw_parsed.
// Every data column is extracted as a plain string; no type conversion is done here.
@raw_parsed =
    EXTRACT
        // Virtual column: populated from the {child_id:*} segment of each
        // matched file name, not from the file contents.
        child_id                int,
        cp_catalog_page_sk      string,
        cp_catalog_page_id      string,
        cp_start_date_sk        string,
        cp_end_date_sk          string,
        cp_department           string,
        cp_catalog_number       string,
        cp_catalog_page_number  string,
        cp_description          string,
        cp_type                 string,
        // Extra trailing column. Presumably absorbs the empty field produced by
        // a trailing '|' at the end of each row -- TODO confirm against the data.
        empty                   string
    FROM "wasb://catalog-page@aasuseast2/{*}_{child_id:*}_100.dat"
    USING Extractors.Text(delimiter: '|');

// Project the nine cp_* columns out of @raw_parsed (child_id and the trailing
// filler column are not carried forward) and keep the first 100 rows in
// ascending child_id order.
// NOTE(review): there is no secondary sort key, so when several rows share a
// child_id this query does not pin down which of them land in the 100.
@filtered_results =
    SELECT
        cp_catalog_page_sk,
        cp_catalog_page_id,
        cp_start_date_sk,
        cp_end_date_sk,
        cp_department,
        cp_catalog_number,
        cp_catalog_page_number,
        cp_description,
        cp_type
    FROM @raw_parsed
    ORDER BY child_id ASC
    FETCH 100 ROWS;

// Write @filtered_results to /modelling/catalog_page.csv as CSV,
// with the column names emitted as a header row.
OUTPUT @filtered_results
TO "/modelling/catalog_page.csv"
USING Outputters.Csv(outputHeader: true);