Introduzione al Data Modeling in Snowflake
Nuno Rocha
Director of Engineering






SELECT DISTINCT category
FROM allproducts;

SELECT TRIM(category)
FROM allproducts;

SELECT TRIM(f.value)
FROM allproducts,
LATERAL FLATTEN(INPUT => SPLIT(allproducts.category, ',')) f;

CREATE OR REPLACE TABLE categories (
category_id NUMBER(10,0) PRIMARY KEY,
category VARCHAR(255)
);
INSERT INTO: comando SQL per inserire nuove righe in una tabella.INSERT INTO categories (category_id, category)
___;
INSERT INTO categories (category_id, category)
SELECT
___,
___
FROM allproducts;
INSERT INTO categories (category_id, category)
SELECT
___,
TRIM(f.value)
FROM allproducts,
LATERAL FLATTEN(INPUT => SPLIT(allproducts.category, ',')) f;
INSERT INTO categories (category_id, category)
SELECT
ROW_NUMBER() OVER (ORDER BY TRIM(f.value)),
TRIM(f.value)
FROM allproducts,
LATERAL FLATTEN(INPUT => SPLIT(allproducts.category, ',')) f;
INSERT INTO categories (category_id, category)
SELECT
ROW_NUMBER() OVER (ORDER BY TRIM(f.value)),
TRIM(f.value)
FROM allproducts,
LATERAL FLATTEN(INPUT => SPLIT(allproducts.category, ',')) f
GROUP BY TRIM(f.value);

INSERT INTO: comando SQL per inserire nuove righeTRIM: rimuove gli spazi all’inizio e alla fine dei valoriLATERAL FLATTEN(INPUT => SPLIT()): funzione Snowflake che divide i valori in righeROW_NUMBER() OVER (ORDER BY): genera un numero sequenzialeGROUP BY: aggrega i dati con gli stessi valori-- Popola un’entità con i dati da un risultato di query
INSERT INTO table_name (column_name, other_columns)
SELECT
-- Genera un valore univoco usando il numero di riga
ROW_NUMBER() OVER (ORDER BY TRIM(alias.value)),
TRIM(alias.value)
FROM another_table,
-- Dividi un attributo testuale in base a un delimitatore
LATERAL FLATTEN(INPUT => SPLIT(another_table.column_name, 'delimiter_value'))alias
-- Aggrega i dati per garantire l’univocità dei valori
GROUP BY TRIM(alias.value);
Introduzione al Data Modeling in Snowflake