Skip to content

Commit

Permalink
Convert concept & coding builders to new schema approach
Browse files Browse the repository at this point in the history
- Remove a lot of codeable concept expected values, when passed to a
  jinja file. The concept builders handle that themselves.
- Move validate_schema() from core_templates to sql_utils
- Have the concept & coding builders use validate_schema to check for
  field existence, and pass down the full expected field schema in
  places that need it.
- Remove deprecated valueQuantity_system, as no one should be using it
  right now.
  • Loading branch information
mikix committed Apr 22, 2024
1 parent fe56b8a commit 3042432
Show file tree
Hide file tree
Showing 23 changed files with 181 additions and 163 deletions.
9 changes: 3 additions & 6 deletions cumulus_library/studies/core/builder_condition.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,13 +4,10 @@

expected_table_cols = {
"condition": {
"category": [],
"clinicalstatus": [],
"id": [],
"recordedDate": [],
"verificationstatus": [],
"subject": ["reference", "display", "type"],
"encounter": ["reference", "display", "type"],
"subject": sql_utils.REFERENCE,
"encounter": sql_utils.REFERENCE,
}
}

Expand Down Expand Up @@ -85,7 +82,7 @@ def prepare_queries(
**kwargs,
):
self.denormalize_codes()
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries.append(
Expand Down
10 changes: 5 additions & 5 deletions cumulus_library/studies/core/builder_documentreference.py
Original file line number Diff line number Diff line change
Expand Up @@ -5,13 +5,11 @@
expected_table_cols = {
"documentreference": {
"id": [],
"type": [],
"status": [],
"date": [],
"docStatus": [],
"subject": ["reference"],
"context": {"encounter": ["reference"], "period": ["start"]},
"category": [],
"subject": sql_utils.REFERENCE,
"context": {"encounter": sql_utils.REFERENCE, "period": ["start"]},
}
}

Expand All @@ -30,6 +28,7 @@ def prepare_queries(
self.queries = sql_utils.denormalize_complex_objects(
schema,
cursor,
parser,
[
sql_utils.CodeableConceptConfig(
source_table="documentreference",
Expand Down Expand Up @@ -59,10 +58,11 @@ def prepare_queries(
source_id="id",
column_hierarchy=[("content", list), ("format", dict)],
target_table="core__documentreference_dn_format",
expected={"format": sql_utils.CODING},
),
],
)
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries.append(
Expand Down
25 changes: 8 additions & 17 deletions cumulus_library/studies/core/builder_encounter.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,24 +6,14 @@

expected_table_cols = {
"encounter": {
"id": [],
"status": [],
"period": [
"start",
"end",
],
"class": [
"code",
"system",
"display",
"userSelected",
"version",
],
"subject": [
"reference",
"display",
"type",
],
"id": [],
"class": sql_utils.CODING,
"subject": sql_utils.REFERENCE,
},
"etl__completion": {
"group_name": [],
Expand All @@ -47,7 +37,7 @@ def __post_init__(self):
class CoreEncounterBuilder(base_table_builder.BaseTableBuilder):
display_text = "Creating Encounter tables..."

def denormalize_codes(self, schema, cursor):
def denormalize_codes(self, schema, cursor, parser):
code_configs = [
EncConfig(
column_hierarchy=[("type", list)],
Expand Down Expand Up @@ -110,11 +100,11 @@ def denormalize_codes(self, schema, cursor):
("hospitalization", dict),
("dischargedisposition", dict),
],
filter_priority=False,
expected={"dischargedisposition": sql_utils.CODEABLE_CONCEPT},
),
]
self.queries += sql_utils.denormalize_complex_objects(
schema, cursor, code_configs
schema, cursor, parser, code_configs
)

def prepare_queries(
Expand All @@ -128,8 +118,9 @@ def prepare_queries(
self.denormalize_codes(
schema,
cursor,
parser,
)
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries += [
Expand Down
21 changes: 15 additions & 6 deletions cumulus_library/studies/core/builder_medication.py
Original file line number Diff line number Diff line change
@@ -1,14 +1,14 @@
""" Module for generating core medication table"""

from cumulus_library import base_table_builder, base_utils
from cumulus_library import base_table_builder, base_utils, databases
from cumulus_library.studies.core.core_templates import core_templates
from cumulus_library.template_sql import base_templates, sql_utils


class MedicationBuilder(base_table_builder.BaseTableBuilder):
display_text = "Creating Medication table..."

def _check_data_in_fields(self, cursor, schema: str):
def _check_data_in_fields(self, cursor, parser, schema: str):
"""Validates whether either observed medication source is present
We opt to not use the core_templates.utils based version of
Expand Down Expand Up @@ -37,6 +37,7 @@ def _check_data_in_fields(self, cursor, schema: str):
source_table=table,
hierarchy=[(inline_col, dict), ("coding", list)],
cursor=cursor,
parser=parser,
)
if data_types["inline"]:
query = base_templates.get_column_datatype_query(
Expand All @@ -56,8 +57,9 @@ def _check_data_in_fields(self, cursor, schema: str):
schema=schema,
source_table=table,
hierarchy=[("medicationreference", dict), ("reference", dict)],
expected=["reference"],
expected=sql_utils.REFERENCE,
cursor=cursor,
parser=parser,
):
return data_types, has_userselected

Expand All @@ -83,15 +85,22 @@ def _check_data_in_fields(self, cursor, schema: str):

return data_types, has_userselected

def prepare_queries(self, cursor: object, schema: str, *args, **kwargs) -> dict:
def prepare_queries(
self,
cursor: databases.DatabaseCursor,
schema: str,
parser: databases.DatabaseParser = None,
*args,
**kwargs,
) -> dict:
"""Constructs queries related to condition codeableConcept
:param cursor: A database cursor object
:param schema: the schema/db name, matching the cursor
:param parser: A database parser
"""
medication_datasources, has_userselected = self._check_data_in_fields(
cursor, schema
cursor, parser, schema
)
if (
medication_datasources["inline"]
Expand Down
10 changes: 4 additions & 6 deletions cumulus_library/studies/core/builder_medicationrequest.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,10 +14,8 @@
"intent": [],
"authoredOn": [],
"reportedBoolean": [],
"category": ["code", "system", "display"],
"medicationCodeableConcept": ["code", "system", "display"],
"subject": ["reference"],
"encounter": ["reference"],
"subject": sql_utils.REFERENCE,
"encounter": sql_utils.REFERENCE,
"dosageInstruction": ["text"],
}
}
Expand Down Expand Up @@ -54,9 +52,9 @@ def prepare_queries(
),
]
self.queries += sql_utils.denormalize_complex_objects(
schema, cursor, code_sources
schema, cursor, parser, code_sources
)
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries.append(
Expand Down
29 changes: 9 additions & 20 deletions cumulus_library/studies/core/builder_observation.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,30 +9,15 @@
expected_table_cols = {
"observation": {
"id": [],
"category": [],
"component": {
"code": [],
"dataAbsentReason": [],
"valueQuantity": ["code", "comparator", "system", "unit", "value"],
},
"status": [],
"code": [],
"interpretation": [],
"referenceRange": [
"low",
"high",
"normalValue",
"type",
"appliesTo",
"age",
"text",
],
"effectiveDateTime": [],
"valueQuantity": ["value", "comparator", "unit", "system", "code"],
"valueCodeableConcept": [],
"valueQuantity": ["code", "comparator", "system", "unit", "value"],
"valueString": [],
"subject": ["reference"],
"encounter": ["reference"],
"subject": sql_utils.REFERENCE,
"encounter": sql_utils.REFERENCE,
}
}

Expand Down Expand Up @@ -73,18 +58,22 @@ def prepare_queries(
ObsConfig(
is_public=True,
column_hierarchy=[("component", list), ("code", dict)],
expected={"code": sql_utils.CODEABLE_CONCEPT},
),
ObsConfig(
is_public=True,
column_hierarchy=[("component", list), ("dataabsentreason", dict)],
expected={"dataabsentreason": sql_utils.CODEABLE_CONCEPT},
),
ObsConfig(
is_public=True,
column_hierarchy=[("component", list), ("interpretation", list)],
expected={"interpretation": sql_utils.CODEABLE_CONCEPT},
),
ObsConfig(
is_public=True,
column_hierarchy=[("component", list), ("valuecodeableconcept", dict)],
expected={"valuecodeableconcept": sql_utils.CODEABLE_CONCEPT},
),
ObsConfig(
column_hierarchy=[("interpretation", list)], filter_priority=False
Expand All @@ -100,9 +89,9 @@ def prepare_queries(
]

self.queries += sql_utils.denormalize_complex_objects(
schema, cursor, code_sources
schema, cursor, parser, code_sources
)
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries += [
Expand Down
4 changes: 2 additions & 2 deletions cumulus_library/studies/core/builder_patient.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,7 +9,7 @@
"patient": {
"id": [],
"gender": [],
"address": [],
"address": {"postalCode": {}},
"birthDate": [],
}
}
Expand Down Expand Up @@ -53,7 +53,7 @@ def prepare_queries(
is_array=True,
)
self.queries.append(base_templates.get_extension_denormalize_query(config))
validated_schema = core_templates.validate_schema(
validated_schema = sql_utils.validate_schema(
cursor, schema, expected_table_cols, parser
)
self.queries.append(
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17,7 +17,6 @@ WITH temp_condition AS (
'condition',
'c',
[
'category',
('subject', 'reference', 'subject_ref'),
('encounter', 'reference', 'encounter_ref'),
],
Expand Down Expand Up @@ -54,9 +53,7 @@ WITH temp_condition AS (
],
schema
)
}},
c.verificationStatus,
c.clinicalStatus
}}
FROM condition AS c
LEFT JOIN core__condition_codable_concepts_all AS cca ON c.id = cca.id
)
Expand Down
11 changes: 1 addition & 10 deletions cumulus_library/studies/core/core_templates/core_templates.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,14 +12,5 @@ def get_core_template(
) -> str:
"""Extracts code system details as a standalone table"""
return base_templates.get_base_template(
target_table, path=pathlib.Path(__file__).parent, schema=schema, config=config
target_table, path=PATH, schema=schema, config=config
)


def validate_schema(cursor: object, schema: str, expected_table_cols, parser):
validated_schema = {}
for table, cols in expected_table_cols.items():
query = base_templates.get_column_datatype_query(schema, table, cols.keys())
table_schema = cursor.execute(query).fetchall()
validated_schema[table] = parser.validate_table_schema(cols, table_schema)
return validated_schema
Original file line number Diff line number Diff line change
Expand Up @@ -16,10 +16,9 @@ WITH temp_documentreference AS (
'documentreference',
'dr',
[
'type',
'status',
'docStatus',
'context',
'context',
('subject', 'reference', 'subject_ref'),
],
schema
Expand Down
11 changes: 6 additions & 5 deletions cumulus_library/studies/core/core_templates/encounter.sql.jinja
Original file line number Diff line number Diff line change
Expand Up @@ -26,9 +26,9 @@ temp_encounter_nullable AS (
'e',
[
'status',
'class',
('class', 'code', 'class_code'),
('class', 'system', 'class_code_system'),
('subject', 'reference', 'subject_ref'),
'period',
],
schema
)
Expand All @@ -46,7 +46,7 @@ temp_encounter_nullable AS (
'encounter',
'e',
[
('period','end', 'period_end_day', 'day'),
('period', 'end', 'period_end_day', 'day'),
('period', 'start', 'period_start_day', 'day'),
('period', 'start', 'period_start_week', 'week'),
('period', 'start', 'period_start_month', 'month'),
Expand All @@ -68,7 +68,8 @@ temp_encounter AS (
SELECT DISTINCT
e.id,
e.status,
e.class,
e.class_code,
e.class_code_system,
e.subject_ref,
e.period_start,
e.period_start_day,
Expand Down Expand Up @@ -134,7 +135,7 @@ SELECT DISTINCT
concat('Encounter/', e.id) AS encounter_ref
FROM temp_encounter AS e
LEFT JOIN core__fhir_mapping_expected_act_encounter_code_v3 AS eac
ON e.class.code = eac.found
ON e.class_code = eac.found
LEFT JOIN core__fhir_act_encounter_code_v3 AS ac ON eac.expected = ac.code
INNER JOIN core__patient AS p ON e.subject_ref = p.subject_ref
WHERE
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -34,7 +34,6 @@ WITH temp_mr AS (

'mr',
[
'display',
'reportedBoolean',
'dosageInstruction',
('subject', 'reference', 'subject_ref'),
Expand Down
Loading

0 comments on commit 3042432

Please sign in to comment.