diff --git a/.vscode/settings.json b/.vscode/settings.json index 236981053..ca20f9585 100644 --- a/.vscode/settings.json +++ b/.vscode/settings.json @@ -17,7 +17,6 @@ "files.autoSave": "afterDelay", "screencastMode.onlyKeyboardShortcuts": true, "terminal.integrated.fontSize": 18, - "workbench.activityBar.visible": true, "workbench.colorTheme": "Visual Studio Dark", "workbench.fontAliasing": "antialiased", "workbench.statusBar.visible": true diff --git a/data/nyc_parking_violations.db b/data/nyc_parking_violations.db index 19e587528..3b62c5561 100644 Binary files a/data/nyc_parking_violations.db and b/data/nyc_parking_violations.db differ diff --git a/data/prod_nyc_parking_violations.db b/data/prod_nyc_parking_violations.db index 9a2bd4ad7..38e734479 100644 Binary files a/data/prod_nyc_parking_violations.db and b/data/prod_nyc_parking_violations.db differ diff --git a/nyc_parking_violations/profiles.yml b/nyc_parking_violations/profiles.yml index cabe18c54..eb5ac8dfc 100644 --- a/nyc_parking_violations/profiles.yml +++ b/nyc_parking_violations/profiles.yml @@ -9,4 +9,5 @@ nyc_parking_violations: # start in the root directory and not in the # nyc_parking_violations directory path: './data/prod_nyc_parking_violations.db' - target: dev \ No newline at end of file + target: dev + \ No newline at end of file diff --git a/run_sql_queries_here.ipynb b/run_sql_queries_here.ipynb index f7c54e6c9..eca37419c 100644 --- a/run_sql_queries_here.ipynb +++ b/run_sql_queries_here.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, "outputs": [], "source": [ @@ -12,17 +12,273 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 2, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
registration_stateticket_count
0NJ9258
1PA3514
2FL2414
3CT1787
4GA840
.........
57AB1
58BC1
59NB1
60PE1
61SK1
\n", + "

62 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " registration_state ticket_count\n", + "0 NJ 9258\n", + "1 PA 3514\n", + "2 FL 2414\n", + "3 CT 1787\n", + "4 GA 840\n", + ".. ... ...\n", + "57 AB 1\n", + "58 BC 1\n", + "59 NB 1\n", + "60 PE 1\n", + "61 SK 1\n", + "\n", + "[62 rows x 2 columns]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], "source": [ "sql_query = '''\n", - "show tables\n", + "SELECT * FROM gold_vehicles_metrics\n", "'''\n", "\n", "with duckdb.connect('data/nyc_parking_violations.db') as con:\n", " display(con.sql(sql_query).df())" ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [], + "source": [ + "sql_query_import_1 ='''\n", + "CREATE OR REPLACE TABLE parking_violations_codes AS\n", + "SELECT *\n", + "FROM read_csv_auto(\n", + "'data/dof_parking_violation_codes.csv',\n", + "normalize_names=True\n", + ")\n", + "'''\n", + "\n", + "sql_query_import_2 ='''\n", + "CREATE OR REPLACE TABLE parking_violations_2023 AS\n", + "SELECT *\n", + "FROM read_csv_auto(\n", + "'data/parking_violations_issued_fiscal_year_2023_sample.csv',\n", + "normalize_names=True\n", + ")\n", + "'''\n", + "with duckdb.connect('data/prod_nyc_parking_violations.db') as con:\n", + " con.sql(sql_query_import_1)\n", + " con.sql(sql_query_import_2)" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
registration_stateticket_count
0NJ9258
1PA3514
2FL2414
3CT1787
4GA840
.........
57AB1
58BC1
59NB1
60PE1
61SK1
\n", + "

62 rows × 2 columns

\n", + "
" + ], + "text/plain": [ + " registration_state ticket_count\n", + "0 NJ 9258\n", + "1 PA 3514\n", + "2 FL 2414\n", + "3 CT 1787\n", + "4 GA 840\n", + ".. ... ...\n", + "57 AB 1\n", + "58 BC 1\n", + "59 NB 1\n", + "60 PE 1\n", + "61 SK 1\n", + "\n", + "[62 rows x 2 columns]" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "sql_query = '''\n", + "SELECT * FROM gold_vehicles_metrics\n", + "'''\n", + "\n", + "with duckdb.connect('data/prod_nyc_parking_violations.db') as con:\n", + " display(con.sql(sql_query).df())" + ] } ], "metadata": {