Introduction to Databricks Lakehouse
Gang Wang
Senior Data Scientist
$$
$$

$$
$$

$$
{"pickup": "2024-03-15T08:23",
"dropoff": "2024-03-15 8:41",
"fare": null,
"zone": "236",
"distance": "4.2mi"}
{"pickup": "03/15/2024 09:10",
"dropoff": "2024-03-15T09:32",
"fare": 18.50,
"zone": "unknown",
"distance": 6.1}
$$
SELECT * FROM silver_taxi_trips
LIMIT 3;
pickup_ts | dropoff_ts | fare | zone_id | dist_km
2024-03-15 | 2024-03-15 | 14.20 | 236 | 6.8
2024-03-15 | 2024-03-15 | 18.50 | 142 | 9.8
2024-03-15 | 2024-03-15 | 22.00 | 79 | 12.1
$$
$$
$$
SELECT * FROM gold_taxi_daily
LIMIT 3;
date | zone_name | avg_fare | trips
2024-03-15 | Upper East | 16.80 | 1,247
2024-03-15 | Midtown | 22.45 | 3,891
2024-03-15 | Financial Dist | 19.10 | 2,156

$$
$$

Introduction to Databricks Lakehouse