DuckDB Examples
The Parquet files work out of the box with DuckDB, Pandas, Polars, or any Parquet-compatible tool.
# Install DuckDBbrew install duckdb # macOS# or download from https://duckdb.org/docs/installation
# Start DuckDBduckdbFind Netflix titles in the US
Section titled “Find Netflix titles in the US”SELECT m.title, m.year, l.provider_idFROM 'US_links.parquet' lJOIN 'core/media_details.parquet' m ON l.media_id = m.idWHERE l.provider_id = 'netflix'ORDER BY m.year DESCLIMIT 20;Top rated movies available in France
Section titled “Top rated movies available in France”SELECT m.title, m.tmdb_rating, l.provider_idFROM 'FR_links.parquet' lJOIN 'core/media_details.parquet' m ON l.media_id = m.idWHERE m.content_type = 'movie'ORDER BY m.tmdb_rating DESCLIMIT 10;Count titles per provider in Germany
Section titled “Count titles per provider in Germany”SELECT l.provider_id, p.name, COUNT(*) as title_countFROM 'DE_links.parquet' lJOIN 'core/providers.parquet' p ON l.provider_id = p.short_idGROUP BY l.provider_id, p.nameORDER BY title_count DESC;Find titles available on multiple providers
Section titled “Find titles available on multiple providers”SELECT m.title, m.year, COUNT(DISTINCT l.provider_id) as provider_count, LIST(l.provider_id) as providersFROM 'US_links.parquet' lJOIN 'core/media_details.parquet' m ON l.media_id = m.idGROUP BY m.title, m.yearHAVING provider_count >= 5ORDER BY provider_count DESCLIMIT 20;Search with translations
Section titled “Search with translations”SELECT m.title as english_title, t.title as french_title, m.yearFROM 'core/media_details.parquet' mJOIN 'translations/lang_fr.parquet' t ON m.id = t.media_idWHERE m.content_type = 'movie' AND m.tmdb_rating > 8ORDER BY m.tmdb_rating DESCLIMIT 10;Export to CSV
Section titled “Export to CSV”COPY ( SELECT m.title, m.year, m.tmdb_rating, l.provider_id FROM 'US_links.parquet' l JOIN 'core/media_details.parquet' m ON l.media_id = m.id WHERE m.content_type = 'movie' ORDER BY m.tmdb_rating DESC) TO 'us_movies.csv' (HEADER, DELIMITER ',');