From 2d6ed41b6f31715e40e4ca11a754a562c06b9711 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jaan=20L=C4=B1?= Date: Wed, 10 Apr 2024 16:21:58 -0400 Subject: [PATCH 1/2] fix: paths --- README.md | 26 +++++++++++++------------- data_processing/dbt_project.yml | 10 +++++----- 2 files changed, 18 insertions(+), 18 deletions(-) diff --git a/README.md b/README.md index 4488c27..4bfaff7 100644 --- a/README.md +++ b/README.md @@ -93,14 +93,14 @@ Example plot of this data: https://s13.gifyu.com/images/SCGH2.gif (code here: ht Example visualization: live demo here - https://jaanli.github.io/american-community-survey/ (visualization code [here](https://github.com/jaanli/american-community-survey/)) -![image](https://github.com/jaanli/exploring_american_community_survey_data/assets/5317244/0428e121-c4ec-4a97-826f-d3f944bc7bf2) +![image](https://github.com/jaanli/exploring_data_processing_data/assets/5317244/0428e121-c4ec-4a97-826f-d3f944bc7bf2) ## Requirements Clone the repo; create and activate a virtual environment: ``` -git clone https://github.com/jaanli/exploring_american_community_survey_data.git -cd exploring_american_community_survey_data +git clone https://github.com/jaanli/american-community-survey.git +cd american-community-survey python3 -m venv .venv source activate ``` @@ -124,7 +124,7 @@ brew install duckdb To retrieve the list of URLs from the Census Bureau's server and download and extract the archives for all of the 50 states' PUMS files, run the following: ``` -cd american_community_survey +cd data_processing dbt run --exclude "public_use_microdata_sample.generated+" --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2022/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.csv", "output_path": "~/data/american_community_survey"}' ``` @@ -144,7 +144,7 @@ dbt run --select "public_use_microdata_sample.generated+" 
--vars '{"public_use_m Inspect the output folder to see what has been created in the `output_path` specified in the previous command: ``` ❯ tree -hF -I '*.pdf' ~/data/american_community_survey -[ 224] /Users/me/data/american_community_survey/ +[ 224] /Users/me/data/data_processing/ ├── [ 128] 2022/ │ └── [3.4K] 1-Year/ │ ├── [ 128] csv_hak/ @@ -169,7 +169,7 @@ To see the size of the csv output: ``` ❯ du -sh ~/data/american_community_survey/2022 -6.4G /Users/me/data/american_community_survey/2022 +6.4G /Users/me/data/data_processing/2022 ``` And the compressed representation size: @@ -278,12 +278,12 @@ Check that you can execute a SQL query against these files: ``` duckdb -c "SELECT COUNT(*) FROM '~/data/american_community_survey/*individual_people_united_states*2021.parquet'" ``` -6. Create a data visualization using the compressed parquet files by adding to the `american_community_survey/models/public_use_microdata_sample/figures` directory, and using examples from here https://github.com/jaanli/american-community-survey/ or here https://github.com/jaanli/lonboard/blob/example-american-community-survey/examples/american-community-survey.ipynb +6. 
Create a data visualization using the compressed parquet files by adding to the `data_processing/models/public_use_microdata_sample/figures` directory, and using examples from here https://github.com/jaanli/american-community-survey/ or here https://github.com/jaanli/lonboard/blob/example-american-community-survey/examples/american-community-survey.ipynb -To save time, there is a bash script with these steps in `scripts/process_one_year_of_american_community_survey_data.sh` that can be used as follows: +To save time, there is a bash script with these steps in `scripts/process_one_year_of_data_processing_data.sh` that can be used as follows: ``` -chmod a+x scripts/process_one_year_of_american_community_survey_data.sh -./scripts/process_one_year_of_american_community_survey_data.sh 2021 +chmod a+x scripts/process_one_year_of_data_processing_data.sh +./scripts/process_one_year_of_data_processing_data.sh 2021 ``` The argument specifies the year to be downloaded, transformed, compressed, and saved. It takes about 5 minutes per year of data. @@ -564,7 +564,7 @@ dbt run --select "public_use_microdata_sample.microdata_area_shapefile_paths" ``` 5. 
Check that the paths are correct: ``` -❯ duckdb -c "SELECT * FROM '/Users/me/data/american_community_survey/microdata_area_shapefile_paths.parquet';" +❯ duckdb -c "SELECT * FROM '/Users/me/data/data_processing/microdata_area_shapefile_paths.parquet';" ``` Displays: @@ -573,11 +573,11 @@ Displays: │ shp_path │ │ varchar │ ├─────────────────────────────────────────────────────────────────────────────────────────────┤ -│ /Users/me/data/american_community_survey/PUMA5/2010/tl_2010_02_puma10/tl_2010_02_puma10.shp │ +│ /Users/me/data/data_processing/PUMA5/2010/tl_2010_02_puma10/tl_2010_02_puma10.shp │ │ · │ │ · │ │ · │ -│ /Users/me/data/american_community_survey/PUMA5/2010/tl_2010_48_puma10/tl_2010_48_puma10.shp │ +│ /Users/me/data/data_processing/PUMA5/2010/tl_2010_48_puma10/tl_2010_48_puma10.shp │ ├─────────────────────────────────────────────────────────────────────────────────────────────┤ │ 54 rows (40 shown) │ └─────────────────────────────────────────────────────────────────────────────────────────────┘ diff --git a/data_processing/dbt_project.yml b/data_processing/dbt_project.yml index 9ba06b5..16bf3db 100644 --- a/data_processing/dbt_project.yml +++ b/data_processing/dbt_project.yml @@ -1,12 +1,12 @@ # Name your project! Project names should contain only lowercase characters # and underscores. A good package name should reflect your organization's # name or the intended use of these models -name: "american_community_survey" +name: "data_processing" version: "1.0.0" config-version: 2 # This setting configures which "profile" dbt uses for this project. 
-profile: "american_community_survey" +profile: "data_processing" # Variables that can be changed from the command line using the `--vars` flag: # example: dbt run --vars 'my_variable: my_value' @@ -28,8 +28,8 @@ macro-paths: ["macros"] snapshot-paths: ["snapshots"] clean-targets: # directories to be removed by `dbt clean` - - "target" - - "dbt_packages" +- "target" +- "dbt_packages" # Configuring models # Full documentation: https://docs.getdbt.com/docs/configuring-models @@ -38,7 +38,7 @@ clean-targets: # directories to be removed by `dbt clean` # directory as views. These settings can be overridden in the individual model # files using the `{{ config(...) }}` macro. models: - american_community_survey: + data_processing: # Config indicated by + and applies to all files under models/example/ # example: +materialized: view From c7b337ea0f4c5381aa0c99a754db44fb317cf3ef Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Jaan=20L=C4=B1?= Date: Wed, 10 Apr 2024 18:21:53 -0400 Subject: [PATCH 2/2] fix: make paths relative and update readme and test --- README.md | 60 ++++++++++--- .../public_use_microdata_sample/config.yml | 52 ++++++----- .../download_and_extract_archives.py | 25 +----- ...units_alabama_enum_mapped_renamed_2022.sql | 4 +- ..._units_alaska_enum_mapped_renamed_2022.sql | 4 +- ...units_arizona_enum_mapped_renamed_2022.sql | 4 +- ...nits_arkansas_enum_mapped_renamed_2022.sql | 4 +- ...ts_california_enum_mapped_renamed_2022.sql | 4 +- ...nits_colorado_enum_mapped_renamed_2022.sql | 4 +- ...s_connecticut_enum_mapped_renamed_2022.sql | 4 +- ...nits_delaware_enum_mapped_renamed_2022.sql | 4 +- ...t_of_columbia_enum_mapped_renamed_2022.sql | 4 +- ...units_florida_enum_mapped_renamed_2022.sql | 4 +- ...units_georgia_enum_mapped_renamed_2022.sql | 4 +- ..._units_hawaii_enum_mapped_renamed_2022.sql | 4 +- ...g_units_idaho_enum_mapped_renamed_2022.sql | 4 +- ...nits_illinois_enum_mapped_renamed_2022.sql | 4 +- ...units_indiana_enum_mapped_renamed_2022.sql | 4 +- 
...ng_units_iowa_enum_mapped_renamed_2022.sql | 4 +- ..._units_kansas_enum_mapped_renamed_2022.sql | 4 +- ...nits_kentucky_enum_mapped_renamed_2022.sql | 4 +- ...its_louisiana_enum_mapped_renamed_2022.sql | 4 +- ...g_units_maine_enum_mapped_renamed_2022.sql | 4 +- ...nits_maryland_enum_mapped_renamed_2022.sql | 4 +- ...massachusetts_enum_mapped_renamed_2022.sql | 4 +- ...nits_michigan_enum_mapped_renamed_2022.sql | 4 +- ...its_minnesota_enum_mapped_renamed_2022.sql | 4 +- ...s_mississippi_enum_mapped_renamed_2022.sql | 4 +- ...nits_missouri_enum_mapped_renamed_2022.sql | 4 +- ...units_montana_enum_mapped_renamed_2022.sql | 4 +- ...nits_nebraska_enum_mapped_renamed_2022.sql | 4 +- ..._units_nevada_enum_mapped_renamed_2022.sql | 4 +- ...new_hampshire_enum_mapped_renamed_2022.sql | 4 +- ...ts_new_jersey_enum_mapped_renamed_2022.sql | 4 +- ...ts_new_mexico_enum_mapped_renamed_2022.sql | 4 +- ...nits_new_york_enum_mapped_renamed_2022.sql | 4 +- ...orth_carolina_enum_mapped_renamed_2022.sql | 4 +- ..._north_dakota_enum_mapped_renamed_2022.sql | 4 +- ...ng_units_ohio_enum_mapped_renamed_2022.sql | 4 +- ...nits_oklahoma_enum_mapped_renamed_2022.sql | 4 +- ..._units_oregon_enum_mapped_renamed_2022.sql | 4 +- ..._pennsylvania_enum_mapped_renamed_2022.sql | 4 +- ...s_puerto_rico_enum_mapped_renamed_2022.sql | 4 +- ..._rhode_island_enum_mapped_renamed_2022.sql | 4 +- ...outh_carolina_enum_mapped_renamed_2022.sql | 4 +- ..._south_dakota_enum_mapped_renamed_2022.sql | 4 +- ...its_tennessee_enum_mapped_renamed_2022.sql | 4 +- ...g_units_texas_enum_mapped_renamed_2022.sql | 4 +- ...first_tranche_enum_mapped_renamed_2022.sql | 4 +- ...econd_tranche_enum_mapped_renamed_2022.sql | 4 +- ...ng_units_utah_enum_mapped_renamed_2022.sql | 4 +- ...units_vermont_enum_mapped_renamed_2022.sql | 4 +- ...nits_virginia_enum_mapped_renamed_2022.sql | 4 +- ...ts_washington_enum_mapped_renamed_2022.sql | 4 +- ...west_virginia_enum_mapped_renamed_2022.sql | 4 +- 
...its_wisconsin_enum_mapped_renamed_2022.sql | 4 +- ...units_wyoming_enum_mapped_renamed_2022.sql | 4 +- ...eople_alabama_enum_mapped_renamed_2022.sql | 4 +- ...people_alaska_enum_mapped_renamed_2022.sql | 4 +- ...eople_arizona_enum_mapped_renamed_2022.sql | 4 +- ...ople_arkansas_enum_mapped_renamed_2022.sql | 4 +- ...le_california_enum_mapped_renamed_2022.sql | 4 +- ...ople_colorado_enum_mapped_renamed_2022.sql | 4 +- ...e_connecticut_enum_mapped_renamed_2022.sql | 4 +- ...ople_delaware_enum_mapped_renamed_2022.sql | 4 +- ...t_of_columbia_enum_mapped_renamed_2022.sql | 4 +- ...eople_florida_enum_mapped_renamed_2022.sql | 4 +- ...eople_georgia_enum_mapped_renamed_2022.sql | 4 +- ...people_hawaii_enum_mapped_renamed_2022.sql | 4 +- ..._people_idaho_enum_mapped_renamed_2022.sql | 4 +- ...ople_illinois_enum_mapped_renamed_2022.sql | 4 +- ...eople_indiana_enum_mapped_renamed_2022.sql | 4 +- ...l_people_iowa_enum_mapped_renamed_2022.sql | 4 +- ...people_kansas_enum_mapped_renamed_2022.sql | 4 +- ...ople_kentucky_enum_mapped_renamed_2022.sql | 4 +- ...ple_louisiana_enum_mapped_renamed_2022.sql | 4 +- ..._people_maine_enum_mapped_renamed_2022.sql | 4 +- ...ople_maryland_enum_mapped_renamed_2022.sql | 4 +- ...massachusetts_enum_mapped_renamed_2022.sql | 4 +- ...ople_michigan_enum_mapped_renamed_2022.sql | 4 +- ...ple_minnesota_enum_mapped_renamed_2022.sql | 4 +- ...e_mississippi_enum_mapped_renamed_2022.sql | 4 +- ...ople_missouri_enum_mapped_renamed_2022.sql | 4 +- ...eople_montana_enum_mapped_renamed_2022.sql | 4 +- ...ople_nebraska_enum_mapped_renamed_2022.sql | 4 +- ...people_nevada_enum_mapped_renamed_2022.sql | 4 +- ...new_hampshire_enum_mapped_renamed_2022.sql | 4 +- ...le_new_jersey_enum_mapped_renamed_2022.sql | 4 +- ...le_new_mexico_enum_mapped_renamed_2022.sql | 4 +- ...ople_new_york_enum_mapped_renamed_2022.sql | 4 +- ...orth_carolina_enum_mapped_renamed_2022.sql | 4 +- ..._north_dakota_enum_mapped_renamed_2022.sql | 4 +- 
...l_people_ohio_enum_mapped_renamed_2022.sql | 4 +- ...ople_oklahoma_enum_mapped_renamed_2022.sql | 4 +- ...people_oregon_enum_mapped_renamed_2022.sql | 4 +- ..._pennsylvania_enum_mapped_renamed_2022.sql | 4 +- ...e_puerto_rico_enum_mapped_renamed_2022.sql | 4 +- ..._rhode_island_enum_mapped_renamed_2022.sql | 4 +- ...outh_carolina_enum_mapped_renamed_2022.sql | 4 +- ..._south_dakota_enum_mapped_renamed_2022.sql | 4 +- ...ple_tennessee_enum_mapped_renamed_2022.sql | 4 +- ..._people_texas_enum_mapped_renamed_2022.sql | 4 +- ...first_tranche_enum_mapped_renamed_2022.sql | 4 +- ...econd_tranche_enum_mapped_renamed_2022.sql | 4 +- ...l_people_utah_enum_mapped_renamed_2022.sql | 4 +- ...eople_vermont_enum_mapped_renamed_2022.sql | 4 +- ...ople_virginia_enum_mapped_renamed_2022.sql | 4 +- ...le_washington_enum_mapped_renamed_2022.sql | 4 +- ...west_virginia_enum_mapped_renamed_2022.sql | 4 +- ...ple_wisconsin_enum_mapped_renamed_2022.sql | 4 +- ...eople_wyoming_enum_mapped_renamed_2022.sql | 4 +- ...ate_sql_schemas_for_extracted_csv_files.py | 9 +- ...th_enum_types_and_mapped_values_renamed.py | 87 ++++++++++++++----- 113 files changed, 363 insertions(+), 302 deletions(-) diff --git a/README.md b/README.md index 4bfaff7..eaff41b 100644 --- a/README.md +++ b/README.md @@ -53,14 +53,14 @@ A typical Framework project looks like this: ## Command reference -| Command | Description | -| ----------------- | -------------------------------------------------------- | -| `yarn install` | Install or reinstall dependencies | -| `yarn dev` | Start local preview server | -| `yarn build` | Build your static site, generating `./dist` | -| `yarn deploy` | Deploy your project to Observable | -| `yarn clean` | Clear the local data loader cache | -| `yarn observable` | Run commands like `observable help` | +| Command | Description | +| ----------------- | ------------------------------------------- | +| `yarn install` | Install or reinstall dependencies | +| `yarn dev` | Start local 
preview server | +| `yarn build` | Build your static site, generating `./dist` | +| `yarn deploy` | Deploy your project to Observable | +| `yarn clean` | Clear the local data loader cache | +| `yarn observable` | Run commands like `observable help` | ## GPT-4 reference @@ -123,22 +123,56 @@ brew install duckdb ## Usage for 2022 ACS Public Use Microdata Sample (PUMS) Data To retrieve the list of URLs from the Census Bureau's server and download and extract the archives for all of the 50 states' PUMS files, run the following: + ``` cd data_processing -dbt run --exclude "public_use_microdata_sample.generated+" --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2022/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.csv", "output_path": "~/data/american_community_survey"}' +dbt run --select "public_use_microdata_sample.list_urls" \ + --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2021/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2021.csv", "output_path": "~/data/american_community_survey"}' +``` + +Then save the URLs: + +``` +dbt run --select "public_use_microdata_sample.urls" \ + --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2021/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2021.csv", "output_path": "~/data/american_community_survey"}' \ + --threads 8 +``` + +Then execute the dbt model for downloading and extract the archives of the microdata (takes ~2min on a Macbook): + +``` +dbt run --select "public_use_microdata_sample.download_and_extract_archives" \ + --vars 
'{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2022/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.csv", "output_path": "~/data/american_community_survey"}' \ + --threads 8 +``` + +Then generate the CSV paths: + +``` +dbt run --select "public_use_microdata_sample.csv_paths" \ + --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2021/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.json", "output_path": "~/data/american_community_survey"}' \ + --threads 8 +``` + +Then parse the data dictionary: + +``` +dbt run --select "public_use_microdata_sample.parse_data_dictionary" \ + --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2021/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2021.csv", "output_path": "~/data/american_community_survey"}' \ + --threads 8 ``` Then generate the SQL commands needed to map every state's individual people or housing unit variables to the easier to use (and read) names: ``` -python scripts/generate_sql_data_dictionary_mapping_for_extracted_csv_files.py \ - ~/data/american_community_survey/public_use_microdata_sample_csv_paths.parquet \ - ~/data/american_community_survey/PUMS_Data_Dictionary_2022.json +python scripts/generate_sql_with_enum_types_and_mapped_values_renamed.py ~/data/american_community_survey/csv_paths.parquet ~/data/american_community_survey/PUMS_Data_Dictionary_2022.json ``` Then execute these generated SQL queries using 1 thread (you can adjust this number to be higher depending on the available processor cores on your system): ``` -dbt run --select 
"public_use_microdata_sample.generated+" --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2022/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.csv", "output_path": "~/data/american_community_survey"}' --threads 1 +dbt run --select "public_use_microdata_sample.generated+" \ + --vars '{"public_use_microdata_sample_url": "https://www2.census.gov/programs-surveys/acs/data/pums/2022/1-Year/", "public_use_microdata_sample_data_dictionary_url": "https://www2.census.gov/programs-surveys/acs/tech_docs/pums/data_dict/PUMS_Data_Dictionary_2022.csv", "output_path": "~/data/american_community_survey"}' \ + --threads 8 ``` Inspect the output folder to see what has been created in the `output_path` specified in the previous command: diff --git a/data_processing/models/public_use_microdata_sample/config.yml b/data_processing/models/public_use_microdata_sample/config.yml index 7e705fa..182b2f0 100644 --- a/data_processing/models/public_use_microdata_sample/config.yml +++ b/data_processing/models/public_use_microdata_sample/config.yml @@ -1,27 +1,31 @@ version: 2 models: - - name: list_urls - config: - public_use_microdata_sample_url: "{{ var('public_use_microdata_sample_url') }}" - output_path: "{{ var('output_path') }}" - - name: download_and_extract_archives - config: - public_use_microdata_sample_url: "{{ var('public_use_microdata_sample_url') }}" - output_path: "{{ var('output_path') }}" - - name: parse_data_dictionary - config: - public_use_microdata_sample_data_dictionary_url: "{{ var('public_use_microdata_sample_data_dictionary_url') }}" - output_path: "{{ var('output_path') }}" - - name: list_shapefile_urls - config: - microdata_area_shapefile_url: "{{ var('microdata_area_shapefile_url') }}" - output_path: "{{ var('output_path') }}" - - name: download_and_extract_shapefiles - config: - microdata_area_shapefile_url: 
"{{ var('microdata_area_shapefile_url') }}" - output_path: "{{ var('output_path') }}" - - name: combine_shapefiles - config: - microdata_area_shapefile_url: "{{ var('microdata_area_shapefile_url') }}" - output_path: "{{ var('output_path') }}" +- name: list_urls + config: + public_use_microdata_sample_url: "{{ var('public_use_microdata_sample_url') }}" + output_path: "{{ var('output_path') }}" +- name: download_and_extract_archives + config: + public_use_microdata_sample_url: "{{ var('public_use_microdata_sample_url') }}" + output_path: "{{ var('output_path') }}" +- name: csv_paths + config: + public_use_microdata_sample_url: "{{ var('public_use_microdata_sample_url') }}" + output_path: "{{ var('output_path') }}" +- name: parse_data_dictionary + config: + public_use_microdata_sample_data_dictionary_url: "{{ var('public_use_microdata_sample_data_dictionary_url') }}" + output_path: "{{ var('output_path') }}" +- name: list_shapefile_urls + config: + microdata_area_shapefile_url: "{{ var('microdata_area_shapefile_url') }}" + output_path: "{{ var('output_path') }}" +- name: download_and_extract_shapefiles + config: + microdata_area_shapefile_url: "{{ var('microdata_area_shapefile_url') }}" + output_path: "{{ var('output_path') }}" +- name: combine_shapefiles + config: + microdata_area_shapefile_url: "{{ var('microdata_area_shapefile_url') }}" + output_path: "{{ var('output_path') }}" diff --git a/data_processing/models/public_use_microdata_sample/download_and_extract_archives.py b/data_processing/models/public_use_microdata_sample/download_and_extract_archives.py index 5582e34..cc05a08 100644 --- a/data_processing/models/public_use_microdata_sample/download_and_extract_archives.py +++ b/data_processing/models/public_use_microdata_sample/download_and_extract_archives.py @@ -25,7 +25,7 @@ def model(dbt, session): base_url = dbt.config.get('public_use_microdata_sample_url') # Assuming this is correctly set # Fetch URLs from your table or view - query = "SELECT * FROM 
list_urls" + query = "SELECT * FROM list_urls " result = session.execute(query).fetchall() columns = [desc[0] for desc in session.description] url_df = pd.DataFrame(result, columns=columns) @@ -50,25 +50,4 @@ def model(dbt, session): paths_df = pd.DataFrame(extracted_files, columns=['csv_path']) # Return the DataFrame with paths to the extracted CSV files - return paths_df - -# Mock dbt and session for demonstration; replace with actual dbt and session in your environment -class MockDBT: - def config(self, key): - return { - 'public_use_microdata_sample_url': 'https://example.com/path/to/your/csv/files', - 'output_path': '~/path/to/your/output/directory' - }.get(key, '') - -class MockSession: - def execute(self, query): - # Mock response; replace with actual fetching logic - return [{"URL": "https://example.com/path/to/your/csv_file.zip"} for _ in range(10)] - -dbt = MockDBT() -session = MockSession() - -if __name__ == "__main__": - # Directly calling model function for demonstration; integrate properly within your dbt project - df = model(dbt, session) - print(df) + return paths_df \ No newline at end of file diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alabama_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alabama_enum_mapped_renamed_2022.sql index 358e1e8..cf2bcda 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alabama_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alabama_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM 
read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hal/psam_h01.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hal/psam_h01.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alaska_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alaska_enum_mapped_renamed_2022.sql index 6684a7a..24ff800 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alaska_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_alaska_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hak/psam_h02.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hak/psam_h02.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arizona_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arizona_enum_mapped_renamed_2022.sql index 9350977..e96d309 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arizona_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arizona_enum_mapped_renamed_2022.sql @@ -905,7 
+905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_haz/psam_h04.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_haz/psam_h04.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arkansas_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arkansas_enum_mapped_renamed_2022.sql index 66cf3bc..80674f1 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arkansas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_arkansas_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_har/psam_h05.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_har/psam_h05.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_california_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_california_enum_mapped_renamed_2022.sql index 7c96db8..10dc16a 100644 --- 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_california_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_california_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hca/psam_h06.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hca/psam_h06.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_colorado_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_colorado_enum_mapped_renamed_2022.sql index 8ff6331..1296e7d 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_colorado_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_colorado_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hco/psam_h08.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hco/psam_h08.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_connecticut_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_connecticut_enum_mapped_renamed_2022.sql index 07e80f1..345bcfe 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_connecticut_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_connecticut_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hct/psam_h09.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hct/psam_h09.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_delaware_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_delaware_enum_mapped_renamed_2022.sql index 6c4f409..7ce6425 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_delaware_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_delaware_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM 
read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hde/psam_h10.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hde/psam_h10.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_district_of_columbia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_district_of_columbia_enum_mapped_renamed_2022.sql index e59f7ba..b697ca3 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_district_of_columbia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_district_of_columbia_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hdc/psam_h11.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hdc/psam_h11.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_florida_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_florida_enum_mapped_renamed_2022.sql index 3943b54..0ee5457 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_florida_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_florida_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hfl/psam_h12.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hfl/psam_h12.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_georgia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_georgia_enum_mapped_renamed_2022.sql index 9ac1914..f89930f 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_georgia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_georgia_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hga/psam_h13.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hga/psam_h13.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_hawaii_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_hawaii_enum_mapped_renamed_2022.sql 
index 771f5df..ccf2ac8 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_hawaii_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_hawaii_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hhi/psam_h15.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hhi/psam_h15.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_idaho_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_idaho_enum_mapped_renamed_2022.sql index 73449f8..06c9740 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_idaho_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_idaho_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hid/psam_h16.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hid/psam_h16.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_illinois_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_illinois_enum_mapped_renamed_2022.sql index bbddd5a..2bc6638 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_illinois_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_illinois_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hil/psam_h17.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hil/psam_h17.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_indiana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_indiana_enum_mapped_renamed_2022.sql index 291b2ca..2495e5f 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_indiana_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_indiana_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hin/psam_h18.csv', +FROM 
read_csv('~/data/american_community_survey/2022/1-Year/csv_hin/psam_h18.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_iowa_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_iowa_enum_mapped_renamed_2022.sql index b36ac98..0acf6d2 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_iowa_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_iowa_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hia/psam_h19.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hia/psam_h19.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kansas_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kansas_enum_mapped_renamed_2022.sql index 776e979..ecdeb01 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kansas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kansas_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing 
Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hks/psam_h20.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hks/psam_h20.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kentucky_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kentucky_enum_mapped_renamed_2022.sql index be63133..f954195 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kentucky_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_kentucky_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hky/psam_h21.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hky/psam_h21.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_louisiana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_louisiana_enum_mapped_renamed_2022.sql index 07f85fe..ead3b62 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_louisiana_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_louisiana_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hla/psam_h22.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hla/psam_h22.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maine_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maine_enum_mapped_renamed_2022.sql index 13d147c..8836b97 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maine_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maine_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hme/psam_h23.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hme/psam_h23.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maryland_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maryland_enum_mapped_renamed_2022.sql index
a3a5c11..75710b4 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maryland_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_maryland_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hmd/psam_h24.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hmd/psam_h24.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_massachusetts_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_massachusetts_enum_mapped_renamed_2022.sql index a300936..e770277 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_massachusetts_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_massachusetts_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hma/psam_h25.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hma/psam_h25.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_michigan_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_michigan_enum_mapped_renamed_2022.sql index 07d4526..fbbd341 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_michigan_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_michigan_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hmi/psam_h26.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hmi/psam_h26.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_minnesota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_minnesota_enum_mapped_renamed_2022.sql index 1c49b5e..81804b6 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_minnesota_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_minnesota_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hmn/psam_h27.csv', 
+FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hmn/psam_h27.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_mississippi_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_mississippi_enum_mapped_renamed_2022.sql index dd3b5d3..4e58144 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_mississippi_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_mississippi_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hms/psam_h28.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hms/psam_h28.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_missouri_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_missouri_enum_mapped_renamed_2022.sql index d41533a..ea9f9f4 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_missouri_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_missouri_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight 
replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hmo/psam_h29.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hmo/psam_h29.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_montana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_montana_enum_mapped_renamed_2022.sql index 1a5bea5..b2660ca 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_montana_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_montana_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hmt/psam_h30.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hmt/psam_h30.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nebraska_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nebraska_enum_mapped_renamed_2022.sql index c5838b9..3a086f3 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nebraska_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nebraska_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hne/psam_h31.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hne/psam_h31.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nevada_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nevada_enum_mapped_renamed_2022.sql index 590ae44..12511b6 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nevada_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_nevada_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnv/psam_h32.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnv/psam_h32.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_hampshire_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_hampshire_enum_mapped_renamed_2022.sql index 278d674..f4ba73b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_hampshire_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_hampshire_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnh/psam_h33.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnh/psam_h33.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_jersey_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_jersey_enum_mapped_renamed_2022.sql index 700c3d0..7ea3caa 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_jersey_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_jersey_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnj/psam_h34.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnj/psam_h34.csv', parallel=False, all_varchar=True, - 
auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_mexico_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_mexico_enum_mapped_renamed_2022.sql index 773afb7..7263492 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_mexico_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_mexico_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnm/psam_h35.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnm/psam_h35.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_york_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_york_enum_mapped_renamed_2022.sql index 97979bf..88ae02a 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_york_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_new_york_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM 
read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hny/psam_h36.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hny/psam_h36.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_carolina_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_carolina_enum_mapped_renamed_2022.sql index 000c1d8..e4fcc95 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_carolina_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_carolina_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnc/psam_h37.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnc/psam_h37.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_dakota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_dakota_enum_mapped_renamed_2022.sql index 0454cd0..750396c 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_dakota_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_north_dakota_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hnd/psam_h38.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hnd/psam_h38.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_ohio_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_ohio_enum_mapped_renamed_2022.sql index fdfe81d..91cbf47 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_ohio_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_ohio_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hoh/psam_h39.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hoh/psam_h39.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oklahoma_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oklahoma_enum_mapped_renamed_2022.sql index 
7f82bf3..f7e624e 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oklahoma_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oklahoma_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hok/psam_h40.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hok/psam_h40.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oregon_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oregon_enum_mapped_renamed_2022.sql index 49c0a22..702098b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oregon_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_oregon_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hor/psam_h41.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hor/psam_h41.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_pennsylvania_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_pennsylvania_enum_mapped_renamed_2022.sql index e63d439..305dab9 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_pennsylvania_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_pennsylvania_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hpa/psam_h42.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hpa/psam_h42.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_puerto_rico_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_puerto_rico_enum_mapped_renamed_2022.sql index 172238f..c14612b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_puerto_rico_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_puerto_rico_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM 
read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hpr/psam_h72.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hpr/psam_h72.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_rhode_island_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_rhode_island_enum_mapped_renamed_2022.sql index 0149d6b..2b6b175 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_rhode_island_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_rhode_island_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hri/psam_h44.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hri/psam_h44.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_carolina_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_carolina_enum_mapped_renamed_2022.sql index 53e21a4..9d83e7a 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_carolina_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_carolina_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hsc/psam_h45.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hsc/psam_h45.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_dakota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_dakota_enum_mapped_renamed_2022.sql index fef4761..4e0ce77 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_dakota_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_south_dakota_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hsd/psam_h46.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hsd/psam_h46.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_tennessee_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_tennessee_enum_mapped_renamed_2022.sql index db8245b..101f90f 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_tennessee_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_tennessee_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_htn/psam_h47.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_htn/psam_h47.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_texas_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_texas_enum_mapped_renamed_2022.sql index 61e6865..01a7a92 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_texas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_texas_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_htx/psam_h48.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_htx/psam_h48.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of 
file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_first_tranche_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_first_tranche_enum_mapped_renamed_2022.sql index 42bba55..cf9a210 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_first_tranche_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_first_tranche_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hus/psam_husa.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hus/psam_husa.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_second_tranche_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_second_tranche_enum_mapped_renamed_2022.sql index cb4a25d..e93fc37 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_second_tranche_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_united_states_second_tranche_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", 
WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hus/psam_husb.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hus/psam_husb.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_utah_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_utah_enum_mapped_renamed_2022.sql index 9778232..7446fc3 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_utah_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_utah_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hut/psam_h49.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hut/psam_h49.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_vermont_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_vermont_enum_mapped_renamed_2022.sql index 352f9ce..12069bb 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_vermont_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_vermont_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hvt/psam_h50.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hvt/psam_h50.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_virginia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_virginia_enum_mapped_renamed_2022.sql index 2b9760b..962a1bb 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_virginia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_virginia_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hva/psam_h51.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hva/psam_h51.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_washington_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_washington_enum_mapped_renamed_2022.sql index 50ce24c..2a9c69a 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_washington_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_washington_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hwa/psam_h53.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hwa/psam_h53.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_west_virginia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_west_virginia_enum_mapped_renamed_2022.sql index 3e7a00a..989ab22 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_west_virginia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_west_virginia_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hwv/psam_h54.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hwv/psam_h54.csv', parallel=False, all_varchar=True, - 
auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wisconsin_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wisconsin_enum_mapped_renamed_2022.sql index 4f6921c..a6df3c6 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wisconsin_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wisconsin_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hwi/psam_h55.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hwi/psam_h55.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wyoming_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wyoming_enum_mapped_renamed_2022.sql index 2071605..727dc8d 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wyoming_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/housing_units_wyoming_enum_mapped_renamed_2022.sql @@ -905,7 +905,7 @@ CASE FYRBLTP WGTP78::VARCHAR AS "Housing Weight replicate 78", WGTP79::VARCHAR AS "Housing Weight replicate 79", WGTP80::VARCHAR AS "Housing Weight replicate 80", -FROM 
read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_hwy/psam_h56.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_hwy/psam_h56.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alabama_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alabama_enum_mapped_renamed_2022.sql index c175e5e..314f563 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alabama_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alabama_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pal/psam_p01.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pal/psam_p01.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alaska_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alaska_enum_mapped_renamed_2022.sql index 3684ace..17ad44a 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alaska_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_alaska_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pak/psam_p02.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pak/psam_p02.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arizona_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arizona_enum_mapped_renamed_2022.sql index 639f650..3c473f9 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arizona_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arizona_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_paz/psam_p04.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_paz/psam_p04.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arkansas_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arkansas_enum_mapped_renamed_2022.sql index a658320..4b6bfc2 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arkansas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_arkansas_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_par/psam_p05.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_par/psam_p05.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_california_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_california_enum_mapped_renamed_2022.sql index 1d513ae..39e793d 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_california_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_california_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pca/psam_p06.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pca/psam_p06.csv', parallel=False, 
all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_colorado_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_colorado_enum_mapped_renamed_2022.sql index 4b42da3..3f2c118 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_colorado_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_colorado_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pco/psam_p08.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pco/psam_p08.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_connecticut_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_connecticut_enum_mapped_renamed_2022.sql index 2c35d0b..87040a0 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_connecticut_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_connecticut_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", 
PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pct/psam_p09.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pct/psam_p09.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_delaware_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_delaware_enum_mapped_renamed_2022.sql index 2c76792..3c667aa 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_delaware_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_delaware_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pde/psam_p10.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pde/psam_p10.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_district_of_columbia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_district_of_columbia_enum_mapped_renamed_2022.sql index baa2ea7..6182361 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_district_of_columbia_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_district_of_columbia_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pdc/psam_p11.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pdc/psam_p11.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_florida_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_florida_enum_mapped_renamed_2022.sql index 9f49b11..6eb3082 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_florida_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_florida_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pfl/psam_p12.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pfl/psam_p12.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_georgia_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_georgia_enum_mapped_renamed_2022.sql index 45b320f..41a0e51 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_georgia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_georgia_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pga/psam_p13.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pga/psam_p13.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_hawaii_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_hawaii_enum_mapped_renamed_2022.sql index c47573d..e2256b6 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_hawaii_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_hawaii_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_phi/psam_p15.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_phi/psam_p15.csv', parallel=False, all_varchar=True, - 
auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_idaho_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_idaho_enum_mapped_renamed_2022.sql index 49d2620..65ef56b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_idaho_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_idaho_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pid/psam_p16.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pid/psam_p16.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_illinois_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_illinois_enum_mapped_renamed_2022.sql index b2d2c97..dfa9b5b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_illinois_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_illinois_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight 
replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pil/psam_p17.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pil/psam_p17.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_indiana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_indiana_enum_mapped_renamed_2022.sql index cfabfde..0013904 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_indiana_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_indiana_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pin/psam_p18.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pin/psam_p18.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_iowa_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_iowa_enum_mapped_renamed_2022.sql index 1292633..69f5ef9 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_iowa_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_iowa_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pia/psam_p19.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pia/psam_p19.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kansas_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kansas_enum_mapped_renamed_2022.sql index 8490c19..8660e38 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kansas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kansas_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pks/psam_p20.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pks/psam_p20.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kentucky_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kentucky_enum_mapped_renamed_2022.sql index 6373463..8fe1ca8 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kentucky_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_kentucky_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pky/psam_p21.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pky/psam_p21.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_louisiana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_louisiana_enum_mapped_renamed_2022.sql index 2541413..ae670d2 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_louisiana_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_louisiana_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pla/psam_p22.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pla/psam_p22.csv', parallel=False, 
all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maine_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maine_enum_mapped_renamed_2022.sql index f7ff47a..2d2859c 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maine_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maine_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pme/psam_p23.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pme/psam_p23.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maryland_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maryland_enum_mapped_renamed_2022.sql index 05f25b9..c38e7d0 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maryland_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_maryland_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight
replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pmd/psam_p24.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pmd/psam_p24.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_massachusetts_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_massachusetts_enum_mapped_renamed_2022.sql index 93bfaae..e19ec9f 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_massachusetts_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_massachusetts_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pma/psam_p25.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pma/psam_p25.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_michigan_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_michigan_enum_mapped_renamed_2022.sql index 3cf7728..ac2e3ea 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_michigan_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_michigan_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pmi/psam_p26.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pmi/psam_p26.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_minnesota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_minnesota_enum_mapped_renamed_2022.sql index e1936e1..036fd6a 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_minnesota_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_minnesota_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pmn/psam_p27.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pmn/psam_p27.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_mississippi_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_mississippi_enum_mapped_renamed_2022.sql index 416f328..1e023b4 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_mississippi_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_mississippi_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pms/psam_p28.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pms/psam_p28.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_missouri_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_missouri_enum_mapped_renamed_2022.sql index 8a40e41..0893a33 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_missouri_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_missouri_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pmo/psam_p29.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pmo/psam_p29.csv', parallel=False, 
all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_montana_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_montana_enum_mapped_renamed_2022.sql index 7fc2ef9..7008668 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_montana_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_montana_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pmt/psam_p30.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pmt/psam_p30.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nebraska_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nebraska_enum_mapped_renamed_2022.sql index 0b95685..27e50be 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nebraska_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nebraska_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", 
PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pne/psam_p31.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pne/psam_p31.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nevada_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nevada_enum_mapped_renamed_2022.sql index 5e69676..2621960 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nevada_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_nevada_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnv/psam_p32.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnv/psam_p32.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_hampshire_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_hampshire_enum_mapped_renamed_2022.sql index daba476..9ef5985 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_hampshire_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_hampshire_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnh/psam_p33.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnh/psam_p33.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_jersey_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_jersey_enum_mapped_renamed_2022.sql index 8420cca..e057025 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_jersey_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_jersey_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnj/psam_p34.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnj/psam_p34.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_mexico_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_mexico_enum_mapped_renamed_2022.sql index c628b15..b2b4d6b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_mexico_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_mexico_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnm/psam_p35.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnm/psam_p35.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_york_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_york_enum_mapped_renamed_2022.sql index d916ff1..343a1ee 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_york_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_new_york_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pny/psam_p36.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pny/psam_p36.csv', parallel=False, 
all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_carolina_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_carolina_enum_mapped_renamed_2022.sql index 7bffe4f..3e6add1 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_carolina_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_carolina_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnc/psam_p37.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnc/psam_p37.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_dakota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_dakota_enum_mapped_renamed_2022.sql index ab84131..93c0768 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_dakota_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_north_dakota_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS 
"Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pnd/psam_p38.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pnd/psam_p38.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_ohio_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_ohio_enum_mapped_renamed_2022.sql index efb4307..c641b4e 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_ohio_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_ohio_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_poh/psam_p39.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_poh/psam_p39.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oklahoma_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oklahoma_enum_mapped_renamed_2022.sql index 5416c7a..2c63483 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oklahoma_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oklahoma_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pok/psam_p40.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pok/psam_p40.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oregon_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oregon_enum_mapped_renamed_2022.sql index fd95e8e..8a93d59 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oregon_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_oregon_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_por/psam_p41.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_por/psam_p41.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_pennsylvania_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_pennsylvania_enum_mapped_renamed_2022.sql index 54015f4..fd4b853 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_pennsylvania_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_pennsylvania_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_ppa/psam_p42.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_ppa/psam_p42.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_puerto_rico_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_puerto_rico_enum_mapped_renamed_2022.sql index 332a425..3648bdf 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_puerto_rico_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_puerto_rico_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_ppr/psam_p72.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_ppr/psam_p72.csv', 
parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_rhode_island_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_rhode_island_enum_mapped_renamed_2022.sql index 052667c..bd8fea2 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_rhode_island_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_rhode_island_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pri/psam_p44.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pri/psam_p44.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_carolina_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_carolina_enum_mapped_renamed_2022.sql index 79fa43c..9b2d8e4 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_carolina_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_carolina_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", 
PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_psc/psam_p45.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_psc/psam_p45.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_dakota_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_dakota_enum_mapped_renamed_2022.sql index 3d92255..17ed954 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_dakota_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_south_dakota_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_psd/psam_p46.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_psd/psam_p46.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_tennessee_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_tennessee_enum_mapped_renamed_2022.sql index d8e07b7..d8a1037 100644 --- 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_tennessee_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_tennessee_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_ptn/psam_p47.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_ptn/psam_p47.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_texas_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_texas_enum_mapped_renamed_2022.sql index 4421db7..b1dd2d7 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_texas_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_texas_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_ptx/psam_p48.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_ptx/psam_p48.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git 
a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_first_tranche_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_first_tranche_enum_mapped_renamed_2022.sql index 570a968..5e68e8b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_first_tranche_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_first_tranche_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pus/psam_pusa.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pus/psam_pusa.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_second_tranche_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_second_tranche_enum_mapped_renamed_2022.sql index 198d5ab..6270231 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_second_tranche_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_united_states_second_tranche_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", 
PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pus/psam_pusb.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pus/psam_pusb.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_utah_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_utah_enum_mapped_renamed_2022.sql index 382a2fa..743cfdd 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_utah_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_utah_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_put/psam_p49.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_put/psam_p49.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_vermont_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_vermont_enum_mapped_renamed_2022.sql index 58f1b02..e885098 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_vermont_enum_mapped_renamed_2022.sql +++ 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_vermont_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pvt/psam_p50.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pvt/psam_p50.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_virginia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_virginia_enum_mapped_renamed_2022.sql index 38c1b28..768f8cf 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_virginia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_virginia_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pva/psam_p51.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pva/psam_p51.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_washington_enum_mapped_renamed_2022.sql 
b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_washington_enum_mapped_renamed_2022.sql index 285ea26..ef23605 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_washington_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_washington_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pwa/psam_p53.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pwa/psam_p53.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_west_virginia_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_west_virginia_enum_mapped_renamed_2022.sql index afe3516..691ad64 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_west_virginia_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_west_virginia_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pwv/psam_p54.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pwv/psam_p54.csv', 
parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wisconsin_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wisconsin_enum_mapped_renamed_2022.sql index 8de6f59..69bc67b 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wisconsin_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wisconsin_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pwi/psam_p55.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pwi/psam_p55.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wyoming_enum_mapped_renamed_2022.sql b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wyoming_enum_mapped_renamed_2022.sql index bddb261..be37b93 100644 --- a/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wyoming_enum_mapped_renamed_2022.sql +++ b/data_processing/models/public_use_microdata_sample/generated/2022/enum_types_mapped_renamed/individual_people_wyoming_enum_mapped_renamed_2022.sql @@ -4217,7 +4217,7 @@ CASE FYOEP PWGTP78::VARCHAR AS "Person's Weight replicate 78", PWGTP79::VARCHAR AS "Person's Weight replicate 
79", PWGTP80::VARCHAR AS "Person's Weight replicate 80", -FROM read_csv('/Users/me/data/american_community_survey/2022/1-Year/csv_pwy/psam_p56.csv', +FROM read_csv('~/data/american_community_survey/2022/1-Year/csv_pwy/psam_p56.csv', parallel=False, all_varchar=True, - auto_detect=True) \ No newline at end of file + auto_detect=True) diff --git a/data_processing/scripts/generate_sql_schemas_for_extracted_csv_files.py b/data_processing/scripts/generate_sql_schemas_for_extracted_csv_files.py index 6052158..5297834 100644 --- a/data_processing/scripts/generate_sql_schemas_for_extracted_csv_files.py +++ b/data_processing/scripts/generate_sql_schemas_for_extracted_csv_files.py @@ -48,18 +48,19 @@ def generate_materialized_name(folder_name, csv_name, state_lookup, national_loo enum_values = [f"'{x}'" for x in data_dict[header]["Values"].values()] enum_name = f"{header}_enum" enum_creation_statements.append(f"CREATE TYPE {enum_name} AS ENUM ({','.join(enum_values)});") - mapped_column = f"CAST({header} AS {enum_name}) AS \"{data_dict[header]['Description']}\"" + key = 'Description' + mapped_column = f'CAST({header} AS {enum_name}) AS "{data_dict[header][key]}"' sql_select_parts.append(f" {mapped_column}") elif header in data_dict: description = data_dict[header]["Description"].replace("'", "''") - sql_select_parts.append(f" {header} AS \"{description}\"") + sql_select_parts.append(f' {header} AS "{description}"') else: sql_select_parts.append(f" {header}") sql_select_statement = ",\n".join(sql_select_parts) - + newline = "\n" sql_content = f"""-- SQL transformation for {csv_name} generated by {os.path.basename(__file__)} -{'\n'.join(enum_creation_statements)} +{newline.join(enum_creation_statements)} {{{{ config(materialized='external', location=var('output_path') + '/{materialized_name}.parquet') }}}} SELECT diff --git a/data_processing/scripts/generate_sql_with_enum_types_and_mapped_values_renamed.py 
b/data_processing/scripts/generate_sql_with_enum_types_and_mapped_values_renamed.py index 224a4ee..3176a60 100644 --- a/data_processing/scripts/generate_sql_with_enum_types_and_mapped_values_renamed.py +++ b/data_processing/scripts/generate_sql_with_enum_types_and_mapped_values_renamed.py @@ -3,6 +3,7 @@ import os import json + def generate_materialized_name(folder_name, csv_name, state_lookup, national_lookup): type_char = folder_name.split("_")[1][0].lower() folder_code = folder_name.split("_")[1][1:].upper() @@ -15,7 +16,7 @@ def generate_materialized_name(folder_name, csv_name, state_lookup, national_loo name = state_lookup.get(folder_code, "Unknown state code") else: raise ValueError(f"Invalid code: {folder_code}") - + return f"{human_readable_name}_{name.replace(' ', '_')}".lower() @@ -39,29 +40,60 @@ def clean_enum_value(value): with open(data_dictionary_path, "r") as json_file: data_dict = json.load(json_file) -state_lookup = {code: name for name, code in [x.split("/") for x in data_dict["ST"]["Values"].values()]} -national_lookup = {"USA": "United States first tranche", "USB": "United States second tranche"} +state_lookup = { + code: name + for name, code in [x.split("/") for x in data_dict["ST"]["Values"].values()] +} +national_lookup = { + "USA": "United States first tranche", + "USB": "United States second tranche", +} df_csv_paths = pd.read_parquet(parquet_database_path) -models_dir = f"models/public_use_microdata_sample/generated/{year}/enum_types_mapped_renamed" +models_dir = ( + f"models/public_use_microdata_sample/generated/{year}/enum_types_mapped_renamed" +) os.makedirs(models_dir, exist_ok=True) def should_include_key(description): - exclude_criteria = ["weight", "identifier", "number", "age", "income", "time", "hours", "weeks", "puma", "total", "fee", "cost", "amount", "rent", "value", "taxes"] + exclude_criteria = [ + "weight", + "identifier", + "number", + "age", + "income", + "time", + "hours", + "weeks", + "puma", + "total", + "fee", + 
"cost", + "amount", + "rent", + "value", + "taxes", + ] # Check if any of the exclude criteria are in the value or if "age" is in the description. - if any(criterion in description.lower() and "flag" not in description.lower() for criterion in exclude_criteria): + if any( + criterion in description.lower() and "flag" not in description.lower() + for criterion in exclude_criteria + ): return False return True + for csv_path in df_csv_paths["csv_path"]: folder_name = os.path.basename(os.path.dirname(csv_path)) csv_name = os.path.basename(csv_path).split(".")[0] - materialized_name = generate_materialized_name(folder_name, csv_name, state_lookup, national_lookup) + materialized_name = generate_materialized_name( + folder_name, csv_name, state_lookup, national_lookup + ) df_headers = pd.read_csv(csv_path, nrows=0) - column_types = {column: 'VARCHAR' for column in df_headers.columns} - columns = ', '.join([f"'{col}': '{typ}'" for col, typ in column_types.items()]) + column_types = {column: "VARCHAR" for column in df_headers.columns} + columns = ", ".join([f"'{col}': '{typ}'" for col, typ in column_types.items()]) sql_select_parts = ["SELECT"] enum_creation_statements = [] table_creation_statement = f"CREATE TABLE {materialized_name} (" @@ -72,43 +104,54 @@ def should_include_key(description): if "Values" in details: if header in df_headers.columns: - enum_values = [f"'{key.strip()}'" for key, value in details["Values"].items()] + enum_values = [ + f"'{key.strip()}'" for key, value in details["Values"].items() + ] col_info = data_dict.get(header, {"Description": header}) description = col_info["Description"] if should_include_key(details["Description"]) and len(enum_values) > 0: enum_name = f"{header}_enum" - value_mapping = "\n\t\t".join([ - f"WHEN '{clean_enum_value(code)}' THEN '{clean_enum_value(label)}'" + value_mapping = "\n\t\t".join( + [ + f"WHEN '{clean_enum_value(code)}' THEN '{clean_enum_value(label)}'" + for code, label in data_dict[header]["Values"].items() 
+ ] + ) + enum_labels = [ + f"'{clean_enum_value(label)}'" for code, label in data_dict[header]["Values"].items() - ]) - enum_labels = [f"'{clean_enum_value(label)}'" for code, label in data_dict[header]["Values"].items()] + ] mapped_column = f"""CASE {header}\n\t\t{value_mapping}\n\tEND::ENUM ({','.join(enum_labels)}) AS "{description}",""" column_definitions.append(mapped_column) else: - column_definitions.append(f' {header}::VARCHAR AS "{description}",') + column_definitions.append( + f' {header}::VARCHAR AS "{description}",' + ) else: # print(f"Column {header} not found in {csv_name}.csv") pass - - - sql_select_parts[-1] = sql_select_parts[-1].rstrip(',') + sql_select_parts[-1] = sql_select_parts[-1].rstrip(",") sql_select_statement = "\n".join(sql_select_parts) newline = "\n" newline_with_comma = ",\n" - + username = os.environ.get("USER") + path_without_user = "~/" + csv_path.split(username + '/')[1] # Combine ENUM creation, table creation, and COPY command in SQL content sql_content = f"""-- SQL transformation for {csv_name} generated by models/public_use_microdata_sample/scripts/{os.path.basename(__file__)} {{{{ config(materialized='external', location=var('output_path') + '/acs_pums_{materialized_name}_{year}.parquet') }}}} SELECT {newline.join(column_definitions)} -FROM read_csv('{csv_path}', +FROM read_csv('{path_without_user}', parallel=False, all_varchar=True, - auto_detect=True)""" + auto_detect=True) +""" - sql_file_path = os.path.join(models_dir, f"{materialized_name}_enum_mapped_renamed_{year}.sql") + sql_file_path = os.path.join( + models_dir, f"{materialized_name}_enum_mapped_renamed_{year}.sql" + ) with open(sql_file_path, "w") as sql_file: sql_file.write(sql_content)