diff --git a/data_processing/models/ahrq.gov/syh_dr/person/syhdr_commercial_person.sql b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_commercial_person.sql new file mode 100644 index 0000000..4212134 --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_commercial_person.sql @@ -0,0 +1,5 @@ +select + *, + 'commercial' as insurance /* constant tag: these rows come from the commercial_person source */ +from {{ source('syh_dr', 'commercial_person') }} + diff --git a/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicaid_person.sql b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicaid_person.sql new file mode 100644 index 0000000..9f85194 --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicaid_person.sql @@ -0,0 +1,4 @@ +select + *, + 'medicaid' as insurance /* constant tag: these rows come from the medicaid_person source */ +from {{ source('syh_dr', 'medicaid_person') }} \ No newline at end of file diff --git a/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicare_person.sql b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicare_person.sql new file mode 100644 index 0000000..cb8fb7d --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_medicare_person.sql @@ -0,0 +1,4 @@ +select + *, + 'medicare' as insurance /* constant tag: these rows come from the medicare_person source */ +from {{ source('syh_dr', 'medicare_person') }} \ No newline at end of file diff --git a/data_processing/models/ahrq.gov/syh_dr/person/syhdr_person.sql b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_person.sql new file mode 100644 index 0000000..0926572 --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/person/syhdr_person.sql @@ -0,0 +1,12 @@ +{{ config( + materialized = 'external', + location = '../data/ahrq.gov/syh_dr/syhdr_person.parquet' +) }} + +{{ dbt_utils.union_relations( + relations = [ + ref('syhdr_commercial_person'), + ref('syhdr_medicaid_person'), + ref('syhdr_medicare_person'), + ] +) }} {# stacks the three insurance-tagged person models into one relation; NOTE(review): presumably union_relations is used instead of a plain UNION ALL because the three person sources declare different column sets - confirm #} \ No newline at end of file diff --git a/data_processing/models/ahrq.gov/syh_dr/syhdr_inpatient.sql b/data_processing/models/ahrq.gov/syh_dr/syhdr_inpatient.sql new file mode 100644 index 
0000000..fb6afce --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/syhdr_inpatient.sql @@ -0,0 +1,29 @@ +{{ config( + materialized = 'external', + location = '../data/ahrq.gov/syh_dr/syhdr_inpatient.parquet' +)}} + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, /* amount columns are loaded as text: drop '$' and ',' before the float cast */ + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'commercial' as insurance +from {{ source('syh_dr', 'commercial_inpatient') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicaid' as insurance +from {{ source('syh_dr', 'medicaid_inpatient') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicare' as insurance +from {{ source('syh_dr', 'medicare_inpatient') }} diff --git a/data_processing/models/ahrq.gov/syh_dr/syhdr_outpatient.sql b/data_processing/models/ahrq.gov/syh_dr/syhdr_outpatient.sql new file mode 100644 index 0000000..9cdddb2 --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/syhdr_outpatient.sql @@ -0,0 +1,29 @@ +{{ config( + materialized = 'external', + location = '../data/ahrq.gov/syh_dr/syhdr_outpatient.parquet' +)}} + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, /* amount columns are loaded as text: drop '$' and ',' before the float cast */ + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'commercial' as insurance +from {{ source('syh_dr', 'commercial_outpatient') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicaid' as insurance +from {{ source('syh_dr', 'medicaid_outpatient') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, 
'$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicare' as insurance +from {{ source('syh_dr', 'medicare_outpatient') }} diff --git a/data_processing/models/ahrq.gov/syh_dr/syhdr_pharmacy.sql b/data_processing/models/ahrq.gov/syh_dr/syhdr_pharmacy.sql new file mode 100644 index 0000000..a4695a5 --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/syhdr_pharmacy.sql @@ -0,0 +1,29 @@ +{{ config( + materialized = 'external', + location = '../data/ahrq.gov/syh_dr/syhdr_pharmacy.parquet' +)}} + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, /* amount columns are loaded as text: drop '$' and ',' before the float cast */ + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'commercial' as insurance +from {{ source('syh_dr', 'commercial_pharmacy') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicaid' as insurance +from {{ source('syh_dr', 'medicaid_pharmacy') }} + +union all + +select + *, + replace(replace(PLAN_PMT_AMT, '$', ''), ',', '')::float as plan_payment_amount, + replace(replace(TOT_CHRG_AMT, '$', ''), ',', '')::float as total_charge_amount, + 'medicare' as insurance +from {{ source('syh_dr', 'medicare_pharmacy') }} diff --git a/data_processing/models/ahrq.gov/syh_dr/syhdr_provider.sql b/data_processing/models/ahrq.gov/syh_dr/syhdr_provider.sql new file mode 100644 index 0000000..1455d1d --- /dev/null +++ b/data_processing/models/ahrq.gov/syh_dr/syhdr_provider.sql @@ -0,0 +1,16 @@ +{{ config( + materialized = 'external', + location = '../data/ahrq.gov/syh_dr/syhdr_provider.parquet' +)}} + +select + *, + 'medicaid' as insurance +from {{ source('syh_dr', 'medicaid_provider') }} + +union all + +select + *, + 'medicare' as insurance +from {{ source('syh_dr', 'medicare_provider') }} diff --git 
a/data_processing/models/sources.yml b/data_processing/models/sources.yml index 7bc3536..28b70e4 100644 --- a/data_processing/models/sources.yml +++ b/data_processing/models/sources.yml @@ -4,11 +4,11 @@ sources: - name: syh_dr description: Synthetic Healthcare data from AHRQ tables: - - name: inpatient - description: Inpatient files from AHRQ. + - name: commercial_inpatient + description: Commercial inpatient records from AHRQ. meta: external_location: > - read_csv('../data/syh_dr/syhdr_*_inpatient_2016.csv', + read_csv('../data/CSV/syhdr_commercial_inpatient_2016.csv', types = { PERSON_ID: 'UBIGINT', PERSON_WGHT: 'NUMERIC', @@ -109,15 +109,15 @@ sources: CPT_PRCDR_CD_33: 'VARCHAR', CPT_PRCDR_CD_34: 'VARCHAR', CPT_PRCDR_CD_35: 'VARCHAR', - PLAN_PMT_AMT: 'FLOAT' - TOT_CHRG_AMT: 'FLOAT' + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' }) formatter: oldstyle - - name: outpatient - description: Outpatient files from AHRQ. + - name: commercial_outpatient + description: Commercial outpatient records from AHRQ. 
meta: external_location: > - read_csv('../data/syh_dr/syhdr_*_outpatient_2016.csv', + read_csv('../data/CSV/syhdr_commercial_outpatient_2016.csv', types = { PERSON_ID: 'UBIGINT', PERSON_WGHT: 'NUMERIC', @@ -128,7 +128,174 @@ sources: SRVC_END_DATE: 'DATE', LOS: 'UINTEGER', ADMSN_TYPE: 'VARCHAR', - TOB_CD: 'VARCHAR'', + TOB_CD: 'VARCHAR', + CLM_TYPE_CD: 'VARCHAR', + DSCHRG_STUS: 'VARCHAR', + PRMRY_DX_IMPUTED: 'VARCHAR', + PRMRY_DX_CD: 'VARCHAR', + ICD_DX_CD_1: 'VARCHAR', + ICD_DX_CD_2: 'VARCHAR', + ICD_DX_CD_3: 'VARCHAR', + ICD_DX_CD_4: 'VARCHAR', + ICD_DX_CD_5: 'VARCHAR', + ICD_DX_CD_6: 'VARCHAR', + ICD_DX_CD_7: 'VARCHAR', + ICD_DX_CD_8: 'VARCHAR', + ICD_DX_CD_9: 'VARCHAR', + ICD_DX_CD_10: 'VARCHAR', + ICD_DX_CD_11: 'VARCHAR', + ICD_DX_CD_12: 'VARCHAR', + ICD_DX_CD_13: 'VARCHAR', + ICD_DX_CD_14: 'VARCHAR', + ICD_DX_CD_15: 'VARCHAR', + ICD_DX_CD_16: 'VARCHAR', + ICD_DX_CD_17: 'VARCHAR', + ICD_DX_CD_18: 'VARCHAR', + ICD_DX_CD_19: 'VARCHAR', + ICD_DX_CD_20: 'VARCHAR', + ICD_DX_CD_21: 'VARCHAR', + ICD_DX_CD_22: 'VARCHAR', + ICD_DX_CD_23: 'VARCHAR', + ICD_DX_CD_24: 'VARCHAR', + ICD_DX_CD_25: 'VARCHAR', + ICD_PRCDR_CD_1: 'VARCHAR', + ICD_PRCDR_CD_2: 'VARCHAR', + ICD_PRCDR_CD_3: 'VARCHAR', + ICD_PRCDR_CD_4: 'VARCHAR', + ICD_PRCDR_CD_5: 'VARCHAR', + ICD_PRCDR_CD_6: 'VARCHAR', + ICD_PRCDR_CD_7: 'VARCHAR', + ICD_PRCDR_CD_8: 'VARCHAR', + ICD_PRCDR_CD_9: 'VARCHAR', + ICD_PRCDR_CD_10: 'VARCHAR', + ICD_PRCDR_CD_11: 'VARCHAR', + ICD_PRCDR_CD_12: 'VARCHAR', + ICD_PRCDR_CD_13: 'VARCHAR', + ICD_PRCDR_CD_14: 'VARCHAR', + ICD_PRCDR_CD_15: 'VARCHAR', + ICD_PRCDR_CD_16: 'VARCHAR', + ICD_PRCDR_CD_17: 'VARCHAR', + ICD_PRCDR_CD_18: 'VARCHAR', + ICD_PRCDR_CD_19: 'VARCHAR', + ICD_PRCDR_CD_20: 'VARCHAR', + ICD_PRCDR_CD_21: 'VARCHAR', + ICD_PRCDR_CD_22: 'VARCHAR', + ICD_PRCDR_CD_23: 'VARCHAR', + ICD_PRCDR_CD_24: 'VARCHAR', + ICD_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_1: 'VARCHAR', + CPT_PRCDR_CD_2: 'VARCHAR', + CPT_PRCDR_CD_3: 'VARCHAR', + CPT_PRCDR_CD_4: 'VARCHAR', + CPT_PRCDR_CD_5: 
'VARCHAR', + CPT_PRCDR_CD_6: 'VARCHAR', + CPT_PRCDR_CD_7: 'VARCHAR', + CPT_PRCDR_CD_8: 'VARCHAR', + CPT_PRCDR_CD_9: 'VARCHAR', + CPT_PRCDR_CD_10: 'VARCHAR', + CPT_PRCDR_CD_11: 'VARCHAR', + CPT_PRCDR_CD_12: 'VARCHAR', + CPT_PRCDR_CD_13: 'VARCHAR', + CPT_PRCDR_CD_14: 'VARCHAR', + CPT_PRCDR_CD_15: 'VARCHAR', + CPT_PRCDR_CD_16: 'VARCHAR', + CPT_PRCDR_CD_17: 'VARCHAR', + CPT_PRCDR_CD_18: 'VARCHAR', + CPT_PRCDR_CD_19: 'VARCHAR', + CPT_PRCDR_CD_20: 'VARCHAR', + CPT_PRCDR_CD_21: 'VARCHAR', + CPT_PRCDR_CD_22: 'VARCHAR', + CPT_PRCDR_CD_23: 'VARCHAR', + CPT_PRCDR_CD_24: 'VARCHAR', + CPT_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_26: 'VARCHAR', + CPT_PRCDR_CD_27: 'VARCHAR', + CPT_PRCDR_CD_28: 'VARCHAR', + CPT_PRCDR_CD_29: 'VARCHAR', + CPT_PRCDR_CD_30: 'VARCHAR', + CPT_PRCDR_CD_31: 'VARCHAR', + CPT_PRCDR_CD_32: 'VARCHAR', + CPT_PRCDR_CD_33: 'VARCHAR', + CPT_PRCDR_CD_34: 'VARCHAR', + CPT_PRCDR_CD_35: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: commercial_person + description: Commercial person records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_commercial_person_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + AGE_LOW: 'NUMERIC', + AGE_HIGH: 'NUMERIC', + SEX_IDENT_CD: 'VARCHAR', + STATE_CD: 'VARCHAR', + COUNTY_FIPS_CD: 'VARCHAR', + ZIP_CD: 'VARCHAR', + PHRMCY_CVRG_1: 'NUMERIC', + PHRMCY_CVRG_2: 'NUMERIC', + PHRMCY_CVRG_3: 'NUMERIC', + PHRMCY_CVRG_4: 'NUMERIC', + PHRMCY_CVRG_5: 'NUMERIC', + PHRMCY_CVRG_6: 'NUMERIC', + PHRMCY_CVRG_7: 'NUMERIC', + PHRMCY_CVRG_8: 'NUMERIC', + PHRMCY_CVRG_9: 'NUMERIC', + PHRMCY_CVRG_10: 'NUMERIC', + PHRMCY_CVRG_11: 'NUMERIC', + PHRMCY_CVRG_12: 'NUMERIC', + CMRCL_INSRC_1: 'NUMERIC', + CMRCL_INSRC_2: 'NUMERIC', + CMRCL_INSRC_3: 'NUMERIC', + CMRCL_INSRC_4: 'NUMERIC', + CMRCL_INSRC_5: 'NUMERIC', + CMRCL_INSRC_6: 'NUMERIC', + CMRCL_INSRC_7: 'NUMERIC', + CMRCL_INSRC_8: 'NUMERIC', + CMRCL_INSRC_9: 'NUMERIC', + CMRCL_INSRC_10: 'NUMERIC', + CMRCL_INSRC_11: 'NUMERIC', + CMRCL_INSRC_12: 'NUMERIC' + }) + formatter: oldstyle + - name: commercial_pharmacy # amount columns are read as VARCHAR; the syhdr_pharmacy model parses them to float + description: Commercial pharmacy records from AHRQ. + meta: + external_location: > + read_csv('../data/CSV/syhdr_commercial_pharmacy_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + PHMCY_CLM_NUM: 'NUMERIC', + CLM_CNTL_NUM: 'NUMERIC', + LINE_NBR: 'VARCHAR', + FILL_DT: 'DATE', + SYNTHETIC_DRUG_ID: 'VARCHAR', + GENERIC_DRUG_NAME: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: medicaid_inpatient + description: Medicaid inpatient records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_medicaid_inpatient_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + FACILITY_ID: 'UBIGINT', + CLM_CNTL_NUM: 'NUMERIC', + AT_SPCLTY: 'VARCHAR', + SRVC_BEG_DATE: 'DATE', + SRVC_END_DATE: 'DATE', + LOS: 'UINTEGER', + ADMSN_TYPE: 'VARCHAR', + TOB_CD: 'VARCHAR', CLM_TYPE_CD: 'VARCHAR', DSCHRG_STUS: 'VARCHAR', PRMRY_DX_IMPUTED: 'VARCHAR', @@ -218,15 +385,124 @@ sources: CPT_PRCDR_CD_33: 'VARCHAR', CPT_PRCDR_CD_34: 'VARCHAR', CPT_PRCDR_CD_35: 'VARCHAR', - PLAN_PMT_AMT: 'FLOAT', - TOT_CHRG_AMT: 'FLOAT' + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' }) formatter: oldstyle - - name: person - description: Person-Level files from AHRQ. + - name: medicaid_outpatient + description: Medicaid outpatient records from AHRQ. meta: external_location: > - read_csv('../data/syh_dr/syhdr_*_person_2016.csv', + read_csv('../data/CSV/syhdr_medicaid_outpatient_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + FACILITY_ID: 'UBIGINT', + CLM_CNTL_NUM: 'NUMERIC', + AT_SPCLTY: 'VARCHAR', + SRVC_BEG_DATE: 'DATE', + SRVC_END_DATE: 'DATE', + LOS: 'UINTEGER', + ADMSN_TYPE: 'VARCHAR', + TOB_CD: 'VARCHAR', + CLM_TYPE_CD: 'VARCHAR', + DSCHRG_STUS: 'VARCHAR', + PRMRY_DX_IMPUTED: 'VARCHAR', + PRMRY_DX_CD: 'VARCHAR', + ICD_DX_CD_1: 'VARCHAR', + ICD_DX_CD_2: 'VARCHAR', + ICD_DX_CD_3: 'VARCHAR', + ICD_DX_CD_4: 'VARCHAR', + ICD_DX_CD_5: 'VARCHAR', + ICD_DX_CD_6: 'VARCHAR', + ICD_DX_CD_7: 'VARCHAR', + ICD_DX_CD_8: 'VARCHAR', + ICD_DX_CD_9: 'VARCHAR', + ICD_DX_CD_10: 'VARCHAR', + ICD_DX_CD_11: 'VARCHAR', + ICD_DX_CD_12: 'VARCHAR', + ICD_DX_CD_13: 'VARCHAR', + ICD_DX_CD_14: 'VARCHAR', + ICD_DX_CD_15: 'VARCHAR', + ICD_DX_CD_16: 'VARCHAR', + ICD_DX_CD_17: 'VARCHAR', + ICD_DX_CD_18: 'VARCHAR', + ICD_DX_CD_19: 'VARCHAR', + ICD_DX_CD_20: 'VARCHAR', + ICD_DX_CD_21: 'VARCHAR', + ICD_DX_CD_22: 'VARCHAR', + ICD_DX_CD_23: 'VARCHAR', + ICD_DX_CD_24: 'VARCHAR', + ICD_DX_CD_25: 'VARCHAR', + ICD_PRCDR_CD_1: 
'VARCHAR', + ICD_PRCDR_CD_2: 'VARCHAR', + ICD_PRCDR_CD_3: 'VARCHAR', + ICD_PRCDR_CD_4: 'VARCHAR', + ICD_PRCDR_CD_5: 'VARCHAR', + ICD_PRCDR_CD_6: 'VARCHAR', + ICD_PRCDR_CD_7: 'VARCHAR', + ICD_PRCDR_CD_8: 'VARCHAR', + ICD_PRCDR_CD_9: 'VARCHAR', + ICD_PRCDR_CD_10: 'VARCHAR', + ICD_PRCDR_CD_11: 'VARCHAR', + ICD_PRCDR_CD_12: 'VARCHAR', + ICD_PRCDR_CD_13: 'VARCHAR', + ICD_PRCDR_CD_14: 'VARCHAR', + ICD_PRCDR_CD_15: 'VARCHAR', + ICD_PRCDR_CD_16: 'VARCHAR', + ICD_PRCDR_CD_17: 'VARCHAR', + ICD_PRCDR_CD_18: 'VARCHAR', + ICD_PRCDR_CD_19: 'VARCHAR', + ICD_PRCDR_CD_20: 'VARCHAR', + ICD_PRCDR_CD_21: 'VARCHAR', + ICD_PRCDR_CD_22: 'VARCHAR', + ICD_PRCDR_CD_23: 'VARCHAR', + ICD_PRCDR_CD_24: 'VARCHAR', + ICD_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_1: 'VARCHAR', + CPT_PRCDR_CD_2: 'VARCHAR', + CPT_PRCDR_CD_3: 'VARCHAR', + CPT_PRCDR_CD_4: 'VARCHAR', + CPT_PRCDR_CD_5: 'VARCHAR', + CPT_PRCDR_CD_6: 'VARCHAR', + CPT_PRCDR_CD_7: 'VARCHAR', + CPT_PRCDR_CD_8: 'VARCHAR', + CPT_PRCDR_CD_9: 'VARCHAR', + CPT_PRCDR_CD_10: 'VARCHAR', + CPT_PRCDR_CD_11: 'VARCHAR', + CPT_PRCDR_CD_12: 'VARCHAR', + CPT_PRCDR_CD_13: 'VARCHAR', + CPT_PRCDR_CD_14: 'VARCHAR', + CPT_PRCDR_CD_15: 'VARCHAR', + CPT_PRCDR_CD_16: 'VARCHAR', + CPT_PRCDR_CD_17: 'VARCHAR', + CPT_PRCDR_CD_18: 'VARCHAR', + CPT_PRCDR_CD_19: 'VARCHAR', + CPT_PRCDR_CD_20: 'VARCHAR', + CPT_PRCDR_CD_21: 'VARCHAR', + CPT_PRCDR_CD_22: 'VARCHAR', + CPT_PRCDR_CD_23: 'VARCHAR', + CPT_PRCDR_CD_24: 'VARCHAR', + CPT_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_26: 'VARCHAR', + CPT_PRCDR_CD_27: 'VARCHAR', + CPT_PRCDR_CD_28: 'VARCHAR', + CPT_PRCDR_CD_29: 'VARCHAR', + CPT_PRCDR_CD_30: 'VARCHAR', + CPT_PRCDR_CD_31: 'VARCHAR', + CPT_PRCDR_CD_32: 'VARCHAR', + CPT_PRCDR_CD_33: 'VARCHAR', + CPT_PRCDR_CD_34: 'VARCHAR', + CPT_PRCDR_CD_35: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: medicaid_person + description: Medicaid person records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_medicaid_person_2016.csv', types = { PERSON_ID: 'UBIGINT', MCAID_BENE_ID: 'UBIGINT', @@ -265,7 +541,321 @@ sources: MDCD_MCO_ENRLMT_11: 'NUMERIC', MDCD_MCO_ENRLMT_12: 'NUMERIC', MDCD_CHIP_ENRLMT: 'NUMERIC', - RSTCTD_BNFTS_IND: 'NUMERIC', + RSTRCTD_BNFTS_IND: 'NUMERIC', + DUAL_ELGBL_1: 'NUMERIC', + DUAL_ELGBL_2: 'NUMERIC', + DUAL_ELGBL_3: 'NUMERIC', + DUAL_ELGBL_4: 'NUMERIC', + DUAL_ELGBL_5: 'NUMERIC', + DUAL_ELGBL_6: 'NUMERIC', + DUAL_ELGBL_7: 'NUMERIC', + DUAL_ELGBL_8: 'NUMERIC', + DUAL_ELGBL_9: 'NUMERIC', + DUAL_ELGBL_10: 'NUMERIC', + DUAL_ELGBL_11: 'NUMERIC', + DUAL_ELGBL_12: 'NUMERIC' + }) + formatter: oldstyle + - name: medicaid_pharmacy # amount columns are read as VARCHAR; the syhdr_pharmacy model parses them to float + description: Medicaid pharmacy records from AHRQ. + meta: + external_location: > + read_csv('../data/CSV/syhdr_medicaid_pharmacy_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + PHMCY_CLM_NUM: 'NUMERIC', + CLM_CNTL_NUM: 'NUMERIC', + LINE_NBR: 'VARCHAR', + FILL_DT: 'DATE', + SYNTHETIC_DRUG_ID: 'VARCHAR', + GENERIC_DRUG_NAME: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: medicaid_provider + description: Medicaid provider files from AHRQ. + meta: + external_location: > + read_csv('../data/CSV/syhdr_medicaid_provider_2016.csv', + types = { + Facility_ID: 'VARCHAR', + Prvdr_Ctgry_Cd: 'VARCHAR', + Prvdr_Ownrshp_Cd: 'VARCHAR', + Prvdr_Prtcptn_Cd: 'VARCHAR' + }) + formatter: oldstyle + - name: medicare_inpatient + description: Medicare inpatient records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_medicare_inpatient_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + FACILITY_ID: 'UBIGINT', + CLM_CNTL_NUM: 'NUMERIC', + AT_SPCLTY: 'VARCHAR', + SRVC_BEG_DATE: 'DATE', + SRVC_END_DATE: 'DATE', + LOS: 'UINTEGER', + ADMSN_TYPE: 'VARCHAR', + TOB_CD: 'VARCHAR', + CLM_TYPE_CD: 'VARCHAR', + DSCHRG_STUS: 'VARCHAR', + PRMRY_DX_IMPUTED: 'VARCHAR', + PRMRY_DX_CD: 'VARCHAR', + ICD_DX_CD_1: 'VARCHAR', + ICD_DX_CD_2: 'VARCHAR', + ICD_DX_CD_3: 'VARCHAR', + ICD_DX_CD_4: 'VARCHAR', + ICD_DX_CD_5: 'VARCHAR', + ICD_DX_CD_6: 'VARCHAR', + ICD_DX_CD_7: 'VARCHAR', + ICD_DX_CD_8: 'VARCHAR', + ICD_DX_CD_9: 'VARCHAR', + ICD_DX_CD_10: 'VARCHAR', + ICD_DX_CD_11: 'VARCHAR', + ICD_DX_CD_12: 'VARCHAR', + ICD_DX_CD_13: 'VARCHAR', + ICD_DX_CD_14: 'VARCHAR', + ICD_DX_CD_15: 'VARCHAR', + ICD_DX_CD_16: 'VARCHAR', + ICD_DX_CD_17: 'VARCHAR', + ICD_DX_CD_18: 'VARCHAR', + ICD_DX_CD_19: 'VARCHAR', + ICD_DX_CD_20: 'VARCHAR', + ICD_DX_CD_21: 'VARCHAR', + ICD_DX_CD_22: 'VARCHAR', + ICD_DX_CD_23: 'VARCHAR', + ICD_DX_CD_24: 'VARCHAR', + ICD_DX_CD_25: 'VARCHAR', + ICD_PRCDR_CD_1: 'VARCHAR', + ICD_PRCDR_CD_2: 'VARCHAR', + ICD_PRCDR_CD_3: 'VARCHAR', + ICD_PRCDR_CD_4: 'VARCHAR', + ICD_PRCDR_CD_5: 'VARCHAR', + ICD_PRCDR_CD_6: 'VARCHAR', + ICD_PRCDR_CD_7: 'VARCHAR', + ICD_PRCDR_CD_8: 'VARCHAR', + ICD_PRCDR_CD_9: 'VARCHAR', + ICD_PRCDR_CD_10: 'VARCHAR', + ICD_PRCDR_CD_11: 'VARCHAR', + ICD_PRCDR_CD_12: 'VARCHAR', + ICD_PRCDR_CD_13: 'VARCHAR', + ICD_PRCDR_CD_14: 'VARCHAR', + ICD_PRCDR_CD_15: 'VARCHAR', + ICD_PRCDR_CD_16: 'VARCHAR', + ICD_PRCDR_CD_17: 'VARCHAR', + ICD_PRCDR_CD_18: 'VARCHAR', + ICD_PRCDR_CD_19: 'VARCHAR', + ICD_PRCDR_CD_20: 'VARCHAR', + ICD_PRCDR_CD_21: 'VARCHAR', + ICD_PRCDR_CD_22: 'VARCHAR', + ICD_PRCDR_CD_23: 'VARCHAR', + ICD_PRCDR_CD_24: 'VARCHAR', + ICD_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_1: 'VARCHAR', + CPT_PRCDR_CD_2: 'VARCHAR', + CPT_PRCDR_CD_3: 'VARCHAR', + CPT_PRCDR_CD_4: 'VARCHAR', + CPT_PRCDR_CD_5: 
'VARCHAR', + CPT_PRCDR_CD_6: 'VARCHAR', + CPT_PRCDR_CD_7: 'VARCHAR', + CPT_PRCDR_CD_8: 'VARCHAR', + CPT_PRCDR_CD_9: 'VARCHAR', + CPT_PRCDR_CD_10: 'VARCHAR', + CPT_PRCDR_CD_11: 'VARCHAR', + CPT_PRCDR_CD_12: 'VARCHAR', + CPT_PRCDR_CD_13: 'VARCHAR', + CPT_PRCDR_CD_14: 'VARCHAR', + CPT_PRCDR_CD_15: 'VARCHAR', + CPT_PRCDR_CD_16: 'VARCHAR', + CPT_PRCDR_CD_17: 'VARCHAR', + CPT_PRCDR_CD_18: 'VARCHAR', + CPT_PRCDR_CD_19: 'VARCHAR', + CPT_PRCDR_CD_20: 'VARCHAR', + CPT_PRCDR_CD_21: 'VARCHAR', + CPT_PRCDR_CD_22: 'VARCHAR', + CPT_PRCDR_CD_23: 'VARCHAR', + CPT_PRCDR_CD_24: 'VARCHAR', + CPT_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_26: 'VARCHAR', + CPT_PRCDR_CD_27: 'VARCHAR', + CPT_PRCDR_CD_28: 'VARCHAR', + CPT_PRCDR_CD_29: 'VARCHAR', + CPT_PRCDR_CD_30: 'VARCHAR', + CPT_PRCDR_CD_31: 'VARCHAR', + CPT_PRCDR_CD_32: 'VARCHAR', + CPT_PRCDR_CD_33: 'VARCHAR', + CPT_PRCDR_CD_34: 'VARCHAR', + CPT_PRCDR_CD_35: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: medicare_outpatient + description: Medicare outpatient records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_medicare_outpatient_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + FACILITY_ID: 'UBIGINT', + CLM_CNTL_NUM: 'NUMERIC', + AT_SPCLTY: 'VARCHAR', + SRVC_BEG_DATE: 'DATE', + SRVC_END_DATE: 'DATE', + LOS: 'UINTEGER', + ADMSN_TYPE: 'VARCHAR', + TOB_CD: 'VARCHAR', + CLM_TYPE_CD: 'VARCHAR', + DSCHRG_STUS: 'VARCHAR', + PRMRY_DX_IMPUTED: 'VARCHAR', + PRMRY_DX_CD: 'VARCHAR', + ICD_DX_CD_1: 'VARCHAR', + ICD_DX_CD_2: 'VARCHAR', + ICD_DX_CD_3: 'VARCHAR', + ICD_DX_CD_4: 'VARCHAR', + ICD_DX_CD_5: 'VARCHAR', + ICD_DX_CD_6: 'VARCHAR', + ICD_DX_CD_7: 'VARCHAR', + ICD_DX_CD_8: 'VARCHAR', + ICD_DX_CD_9: 'VARCHAR', + ICD_DX_CD_10: 'VARCHAR', + ICD_DX_CD_11: 'VARCHAR', + ICD_DX_CD_12: 'VARCHAR', + ICD_DX_CD_13: 'VARCHAR', + ICD_DX_CD_14: 'VARCHAR', + ICD_DX_CD_15: 'VARCHAR', + ICD_DX_CD_16: 'VARCHAR', + ICD_DX_CD_17: 'VARCHAR', + ICD_DX_CD_18: 'VARCHAR', + ICD_DX_CD_19: 'VARCHAR', + ICD_DX_CD_20: 'VARCHAR', + ICD_DX_CD_21: 'VARCHAR', + ICD_DX_CD_22: 'VARCHAR', + ICD_DX_CD_23: 'VARCHAR', + ICD_DX_CD_24: 'VARCHAR', + ICD_DX_CD_25: 'VARCHAR', + ICD_PRCDR_CD_1: 'VARCHAR', + ICD_PRCDR_CD_2: 'VARCHAR', + ICD_PRCDR_CD_3: 'VARCHAR', + ICD_PRCDR_CD_4: 'VARCHAR', + ICD_PRCDR_CD_5: 'VARCHAR', + ICD_PRCDR_CD_6: 'VARCHAR', + ICD_PRCDR_CD_7: 'VARCHAR', + ICD_PRCDR_CD_8: 'VARCHAR', + ICD_PRCDR_CD_9: 'VARCHAR', + ICD_PRCDR_CD_10: 'VARCHAR', + ICD_PRCDR_CD_11: 'VARCHAR', + ICD_PRCDR_CD_12: 'VARCHAR', + ICD_PRCDR_CD_13: 'VARCHAR', + ICD_PRCDR_CD_14: 'VARCHAR', + ICD_PRCDR_CD_15: 'VARCHAR', + ICD_PRCDR_CD_16: 'VARCHAR', + ICD_PRCDR_CD_17: 'VARCHAR', + ICD_PRCDR_CD_18: 'VARCHAR', + ICD_PRCDR_CD_19: 'VARCHAR', + ICD_PRCDR_CD_20: 'VARCHAR', + ICD_PRCDR_CD_21: 'VARCHAR', + ICD_PRCDR_CD_22: 'VARCHAR', + ICD_PRCDR_CD_23: 'VARCHAR', + ICD_PRCDR_CD_24: 'VARCHAR', + ICD_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_1: 'VARCHAR', + CPT_PRCDR_CD_2: 'VARCHAR', + CPT_PRCDR_CD_3: 'VARCHAR', + CPT_PRCDR_CD_4: 'VARCHAR', + CPT_PRCDR_CD_5: 
'VARCHAR', + CPT_PRCDR_CD_6: 'VARCHAR', + CPT_PRCDR_CD_7: 'VARCHAR', + CPT_PRCDR_CD_8: 'VARCHAR', + CPT_PRCDR_CD_9: 'VARCHAR', + CPT_PRCDR_CD_10: 'VARCHAR', + CPT_PRCDR_CD_11: 'VARCHAR', + CPT_PRCDR_CD_12: 'VARCHAR', + CPT_PRCDR_CD_13: 'VARCHAR', + CPT_PRCDR_CD_14: 'VARCHAR', + CPT_PRCDR_CD_15: 'VARCHAR', + CPT_PRCDR_CD_16: 'VARCHAR', + CPT_PRCDR_CD_17: 'VARCHAR', + CPT_PRCDR_CD_18: 'VARCHAR', + CPT_PRCDR_CD_19: 'VARCHAR', + CPT_PRCDR_CD_20: 'VARCHAR', + CPT_PRCDR_CD_21: 'VARCHAR', + CPT_PRCDR_CD_22: 'VARCHAR', + CPT_PRCDR_CD_23: 'VARCHAR', + CPT_PRCDR_CD_24: 'VARCHAR', + CPT_PRCDR_CD_25: 'VARCHAR', + CPT_PRCDR_CD_26: 'VARCHAR', + CPT_PRCDR_CD_27: 'VARCHAR', + CPT_PRCDR_CD_28: 'VARCHAR', + CPT_PRCDR_CD_29: 'VARCHAR', + CPT_PRCDR_CD_30: 'VARCHAR', + CPT_PRCDR_CD_31: 'VARCHAR', + CPT_PRCDR_CD_32: 'VARCHAR', + CPT_PRCDR_CD_33: 'VARCHAR', + CPT_PRCDR_CD_34: 'VARCHAR', + CPT_PRCDR_CD_35: 'VARCHAR', + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' + }) + formatter: oldstyle + - name: medicare_person + description: Medicare person records from AHRQ. 
+ meta: + external_location: > + read_csv('../data/CSV/syhdr_medicare_person_2016.csv', + types = { + PERSON_ID: 'UBIGINT', + PERSON_WGHT: 'NUMERIC', + AGE_LOW: 'NUMERIC', + AGE_HIGH: 'NUMERIC', + SEX_IDENT_CD: 'VARCHAR', + RACE_CD: 'VARCHAR', + STATE_CD: 'VARCHAR', + COUNTY_FIPS_CD: 'VARCHAR', + ZIP_CD: 'VARCHAR', + RSN_ENRLMT_CD: 'VARCHAR', + MDCR_ENTLMT_IND_1: 'VARCHAR', + MDCR_ENTLMT_IND_2: 'VARCHAR', + MDCR_ENTLMT_IND_3: 'VARCHAR', + MDCR_ENTLMT_IND_4: 'VARCHAR', + MDCR_ENTLMT_IND_5: 'VARCHAR', + MDCR_ENTLMT_IND_6: 'VARCHAR', + MDCR_ENTLMT_IND_7: 'VARCHAR', + MDCR_ENTLMT_IND_8: 'VARCHAR', + MDCR_ENTLMT_IND_9: 'VARCHAR', + MDCR_ENTLMT_IND_10: 'VARCHAR', + MDCR_ENTLMT_IND_11: 'VARCHAR', + MDCR_ENTLMT_IND_12: 'VARCHAR', + MDCR_HMO_CVRG_1: 'NUMERIC', + MDCR_HMO_CVRG_2: 'NUMERIC', + MDCR_HMO_CVRG_3: 'NUMERIC', + MDCR_HMO_CVRG_4: 'NUMERIC', + MDCR_HMO_CVRG_5: 'NUMERIC', + MDCR_HMO_CVRG_6: 'NUMERIC', + MDCR_HMO_CVRG_7: 'NUMERIC', + MDCR_HMO_CVRG_8: 'NUMERIC', + MDCR_HMO_CVRG_9: 'NUMERIC', + MDCR_HMO_CVRG_10: 'NUMERIC', + MDCR_HMO_CVRG_11: 'NUMERIC', + MDCR_HMO_CVRG_12: 'NUMERIC', + PHRMCY_CVRG_1: 'NUMERIC', + PHRMCY_CVRG_2: 'NUMERIC', + PHRMCY_CVRG_3: 'NUMERIC', + PHRMCY_CVRG_4: 'NUMERIC', + PHRMCY_CVRG_5: 'NUMERIC', + PHRMCY_CVRG_6: 'NUMERIC', + PHRMCY_CVRG_7: 'NUMERIC', + PHRMCY_CVRG_8: 'NUMERIC', + PHRMCY_CVRG_9: 'NUMERIC', + PHRMCY_CVRG_10: 'NUMERIC', + PHRMCY_CVRG_11: 'NUMERIC', + PHRMCY_CVRG_12: 'NUMERIC', DUAL_ELGBL_1: 'NUMERIC', DUAL_ELGBL_2: 'NUMERIC', DUAL_ELGBL_3: 'NUMERIC', @@ -280,11 +870,11 @@ sources: DUAL_ELGBL_12: 'NUMERIC' }) formatter: oldstyle - - name: pharmacy - descripton: Pharmacy files from AHRQ. + - name: medicare_pharmacy # amount columns are read as VARCHAR; the syhdr_pharmacy model parses them to float + description: Medicare pharmacy records from AHRQ. 
meta: external_location: > - read_csv('../data/syh_dr/syhdr_*_pharmacy_2016.csv', + read_csv('../data/CSV/syhdr_medicare_pharmacy_2016.csv', types = { PERSON_ID: 'UBIGINT', PERSON_WGHT: 'NUMERIC', @@ -294,15 +884,15 @@ sources: FILL_DT: 'DATE', SYNTHETIC_DRUG_ID: 'VARCHAR', GENERIC_DRUG_NAME: 'VARCHAR', - PLAN_PMT_AMT: 'FLOAT', - TOT_CHRG_AMT: 'FLOAT' + PLAN_PMT_AMT: 'VARCHAR', + TOT_CHRG_AMT: 'VARCHAR' }) formatter: oldstyle - - name: provider - description: Provider files from AHRQ. + - name: medicare_provider + description: Medicare provider files from AHRQ. meta: external_location: > - read_csv('../data/syh_dr/syhdr_*_provider_2016.csv', + read_csv('../data/CSV/syhdr_medicare_provider_2016.csv', types = { Facility_ID: 'VARCHAR', Prvdr_Ctgry_Cd: 'VARCHAR',