From 618a01cc8a78e3a078498cec02a08561d0c532e3 Mon Sep 17 00:00:00 2001 From: Vicky Bikia Date: Fri, 6 Dec 2024 20:50:17 -0800 Subject: [PATCH 1/5] Print symptoms in the viewer when reviewing ECG recordings --- ecg_data_manager/modules/utils.py | 145 ++++++++++++++-------- ecg_data_manager/modules/visualization.py | 9 +- 2 files changed, 98 insertions(+), 56 deletions(-) diff --git a/ecg_data_manager/modules/utils.py b/ecg_data_manager/modules/utils.py index f4e6c71..0173e8b 100644 --- a/ecg_data_manager/modules/utils.py +++ b/ecg_data_manager/modules/utils.py @@ -83,6 +83,51 @@ def process_ecg_data(db: Client, data: pd.DataFrame) -> pd.DataFrame: return processed_data +def fetch_symptoms_single(observation_data: dict) -> dict: + """ + Extracts symptoms information from the components array of a single observation data dictionary where + HKElectrocardiogram.SymptomsStatus is 'present'. Returns 'UserId', 'ResourceId', and 'Symptoms'. + This data is suitable for merging with a main DataFrame. + + Args: + observation_data: A dictionary containing observation data. + + Returns: + dict: A dictionary with 'UserId', 'ResourceId', and 'Symptoms' if symptoms are present. + Returns an empty dictionary if no symptoms are present or if SymptomsStatus is not 'present'. + """ + components = observation_data.get("component", []) + user_id = observation_data.get(ColumnNames.USER_ID.value) + resource_id = observation_data.get(ColumnNames.RESOURCE_ID.value) + + # Check for SymptomsStatus + symptoms_status = next( + ( + comp.get("valueString") + for comp in components + if comp.get("code", {}).get("coding", [{}])[0].get("code") + == "HKElectrocardiogram.SymptomsStatus" + ), + None, + ) + + # If SymptomsStatus is "present", extract symptoms + if symptoms_status == "present": + symptoms = [ + f"{comp.get('code', {}).get('coding', [{}])[0].get('display')}:" + f"{comp.get('valueString')}" + for comp in components + if "HKCategoryTypeIdentifier" + in comp.get("code", {}).get("coding", [{}])[0].get("code", "") + ] + if symptoms: # Check if symptoms list is not empty + return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": ', '.join(symptoms)} + else: + return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": "No symptoms."} + else: + return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": "No symptoms."} + + def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches db: Client, input_df: pd.DataFrame, @@ -91,7 +136,7 @@ def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches ) -> pd.DataFrame: """ Fetch diagnosis data from the Firestore database and extend the input DataFrame with new - columns. + columns, including a 'Symptoms' column. Args: db (Client): Firestore database client. @@ -101,7 +146,7 @@ def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches ECG_DATA_SUBCOLLECTION. Returns: - pd.DataFrame: Extended DataFrame containing the fetched diagnosis data. + pd.DataFrame: Extended DataFrame containing the fetched diagnosis data and symptoms. """ collection_ref = db.collection(collection_name) resources = [] @@ -126,89 +171,79 @@ def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches ) ).stream() + # Process the FHIR documents and store observation data for doc in fhir_docs: observation_data = doc.to_dict() - observation_data["user_id"] = user_id - observation_data["ResourceId"] = doc.id + observation_data[ColumnNames.USER_ID.value] = user_id + observation_data[ColumnNames.RESOURCE_ID.value] = doc.id + + # Extract effective period start time + effective_start = observation_data.get('effectivePeriod', {}).get('start', '') + if effective_start: + observation_data['EffectiveDateTimeHHMM'] = effective_start + + # Extract symptoms information HERE + symptoms_info = fetch_symptoms_single(observation_data) + if symptoms_info: + observation_data.update(symptoms_info) + + # Extract diagnosis information from diagnosis subcollection diagnosis_docs = list( doc.reference.collection(DIAGNOSIS_DATA_SUBCOLLECTION).stream() ) - if diagnosis_docs: - physician_initials_list = [ - diagnosis_doc.to_dict().get("physicianInitials") - for diagnosis_doc in diagnosis_docs - if diagnosis_doc.to_dict().get("physicianInitials") - ] - observation_data["NumberOfReviewers"] = len(physician_initials_list) - observation_data["Reviewers"] = physician_initials_list - else: - observation_data["NumberOfReviewers"] = 0 - observation_data["Reviewers"] = [] - + physician_initials_list = [ + diagnosis_doc.to_dict().get("physicianInitials", "") + for diagnosis_doc in diagnosis_docs + ] + observation_data["NumberOfReviewers"] = len(physician_initials_list) + observation_data["Reviewers"] = physician_initials_list observation_data["ReviewStatus"] = ( "Incomplete review" if observation_data["NumberOfReviewers"] < 3 else "Complete review" ) - resources.append(observation_data) + # Add new columns from diagnosis documents for i, diagnosis_doc in enumerate(diagnosis_docs): - if diagnosis_doc: - doc_data = diagnosis_doc.to_dict() - for key, value in doc_data.items(): - col_name = f"Diagnosis{i+1}_{key}" - new_columns.add(col_name) - observation_data[col_name] = value + doc_data = diagnosis_doc.to_dict() + for key, value in doc_data.items(): + col_name = f"Diagnosis{i+1}_{key}" + new_columns.add(col_name) + observation_data[col_name] = value + + resources.append(observation_data) except Exception as e: # pylint: disable=broad-exception-caught print(f"An error occurred while processing user {user_id}: {str(e)}") + fetched_df = pd.DataFrame(resources) + + # Define columns for the final DataFrame columns = [ ColumnNames.USER_ID.value, - "ResourceId", + ColumnNames.RESOURCE_ID.value, "EffectiveDateTimeHHMM", ColumnNames.APPLE_ELECTROCARDIOGRAM_CLASSIFICATION.value, "NumberOfReviewers", "Reviewers", "ReviewStatus", + "Symptoms", ] + list(new_columns) - data = [] - - for resource in resources: - row_data = [ - resource.get(ColumnNames.USER_ID.value, None), - resource.get("id", None), - ( - resource.get("effectivePeriod", {}).get("start", None) - if resource.get("effectivePeriod") - else None - ), - ( - resource.get("component", [{}])[2].get("valueString", None) - if len(resource.get("component", [])) > 2 - else None - ), - resource.get("NumberOfReviewers", None), - resource.get("Reviewers", None), - resource.get("ReviewStatus", None), - ] - for col in new_columns: - row_data.append(resource.get(col, None)) - - data.append(row_data) - - fetched_df = pd.DataFrame(data, columns=columns) + fetched_df = fetched_df.reindex( + columns=columns, fill_value=None + ) # Ensure columns are in order and filled - # Extend the input_df with new columns based on ResourceId + # Extend the input DataFrame with new columns extended_df = input_df.copy() additional_columns = [ - "ResourceId", + ColumnNames.RESOURCE_ID.value, "NumberOfReviewers", "Reviewers", "ReviewStatus", "EffectiveDateTimeHHMM", + "Symptoms", ] + list(new_columns) for col in additional_columns: @@ -216,8 +251,10 @@ def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches extended_df[col] = None for index, row in extended_df.iterrows(): - resource_id = row["ResourceId"] - fetched_row = fetched_df[fetched_df["ResourceId"] == resource_id] + resource_id = row[ColumnNames.RESOURCE_ID.value] + fetched_row = fetched_df[ + fetched_df[ColumnNames.RESOURCE_ID.value] == resource_id + ] if not fetched_row.empty: for col in additional_columns: if col in fetched_row.columns: diff --git a/ecg_data_manager/modules/visualization.py b/ecg_data_manager/modules/visualization.py index c974a65..0747b6c 100644 --- a/ecg_data_manager/modules/visualization.py +++ b/ecg_data_manager/modules/visualization.py @@ -351,6 +351,8 @@ def plot_single_ecg(self, row): # pylint: disable=too-many-locals else "Unknown" ) + symptoms = row.get("Symptoms", "No symptoms reported.") + group_class = row[AGE_GROUP_STRING] user_id_html = widgets.HTML( value=f"{group_class} " @@ -360,6 +362,9 @@ def plot_single_ecg(self, row): # pylint: disable=too-many-locals heart_rate_html = widgets.HTML( value=f"Average HR: {heart_rate} bpm" ) + + symptoms_html = widgets.HTML(value=f"Symptoms: {symptoms}") + interpretation_html = widgets.HTML( value="Classification: " ) @@ -374,7 +379,7 @@ def plot_single_ecg(self, row): # pylint: disable=too-many-locals interpretation_html.value += "" - display(user_id_html, heart_rate_html, interpretation_html) + display(user_id_html, heart_rate_html, symptoms_html, interpretation_html) # Add review status diagnosis_collection_ref = ( @@ -506,7 +511,7 @@ def hide_widgets(b): # pylint: disable=unused-argument return widgets_box - def save_diagnosis( # pylint: disable=too-many-locals, too-many-arguments, too-many-positional-arguments + def save_diagnosis( # pylint: disable=too-many-locals, too-many-arguments self, user_id, document_id, From 53081f78479141cef864e2a82f0347ce477ae0ad Mon Sep 17 00:00:00 2001 From: Vicky Bikia Date: Sun, 8 Dec 2024 12:41:24 -0800 Subject: [PATCH 2/5] Linting --- ecg_data_manager/modules/utils.py | 30 ++++++++++++++++++++++-------- 1 file changed, 22 insertions(+), 8 deletions(-) diff --git a/ecg_data_manager/modules/utils.py b/ecg_data_manager/modules/utils.py index 0173e8b..6925698 100644 --- a/ecg_data_manager/modules/utils.py +++ b/ecg_data_manager/modules/utils.py @@ -85,9 +85,9 @@ def process_ecg_data(db: Client, data: pd.DataFrame) -> pd.DataFrame: def fetch_symptoms_single(observation_data: dict) -> dict: """ - Extracts symptoms information from the components array of a single observation data dictionary where - HKElectrocardiogram.SymptomsStatus is 'present'. Returns 'UserId', 'ResourceId', and 'Symptoms'. - This data is suitable for merging with a main DataFrame. + Extracts symptoms information from the components array of a single observation data + dictionary where HKElectrocardiogram.SymptomsStatus is 'present'. Returns 'UserId', + 'ResourceId', and 'Symptoms'. This data is suitable for merging with a main DataFrame. Args: observation_data: A dictionary containing observation data. @@ -121,11 +121,23 @@ def fetch_symptoms_single(observation_data: dict) -> dict: in comp.get("code", {}).get("coding", [{}])[0].get("code", "") ] if symptoms: # Check if symptoms list is not empty - return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": ', '.join(symptoms)} + return { + ColumnNames.USER_ID.value: user_id, + ColumnNames.RESOURCE_ID.value: resource_id, + "Symptoms": ", ".join(symptoms), + } else: - return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": "No symptoms."} + return { + ColumnNames.USER_ID.value: user_id, + ColumnNames.RESOURCE_ID.value: resource_id, + "Symptoms": "No symptoms.", + } else: - return {ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": "No symptoms."} + return { + ColumnNames.USER_ID.value: user_id, + ColumnNames.RESOURCE_ID.value: resource_id, + "Symptoms": "No symptoms.", + } def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches @@ -178,9 +190,11 @@ def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches observation_data[ColumnNames.RESOURCE_ID.value] = doc.id # Extract effective period start time - effective_start = observation_data.get('effectivePeriod', {}).get('start', '') + effective_start = observation_data.get("effectivePeriod", {}).get( + "start", "" + ) if effective_start: - observation_data['EffectiveDateTimeHHMM'] = effective_start + observation_data["EffectiveDateTimeHHMM"] = effective_start # Extract symptoms information HERE symptoms_info = fetch_symptoms_single(observation_data) From 88bd2c9ac87e5b4c8cfa9f734f60acc31c02891a Mon Sep 17 00:00:00 2001 From: Vicky Bikia Date: Sun, 8 Dec 2024 12:41:55 -0800 Subject: [PATCH 3/5] Linting --- ecg_data_manager/modules/utils.py | 16 ++++++++-------- ecg_data_manager/modules/visualization.py | 16 ++++++---------- 2 files changed, 14 insertions(+), 18 deletions(-) diff --git a/ecg_data_manager/modules/utils.py b/ecg_data_manager/modules/utils.py index 6925698..df599c9 100644 --- a/ecg_data_manager/modules/utils.py +++ b/ecg_data_manager/modules/utils.py @@ -94,7 +94,8 @@ def fetch_symptoms_single(observation_data: dict) -> dict: Returns: dict: A dictionary with 'UserId', 'ResourceId', and 'Symptoms' if symptoms are present. - Returns an empty dictionary if no symptoms are present or if SymptomsStatus is not 'present'. + Returns an empty dictionary if no symptoms are present or if SymptomsStatus is + not 'present'. """ components = observation_data.get("component", []) user_id = observation_data.get(ColumnNames.USER_ID.value) @@ -126,19 +127,18 @@ def fetch_symptoms_single(observation_data: dict) -> dict: ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": ", ".join(symptoms), } - else: - return { - ColumnNames.USER_ID.value: user_id, - ColumnNames.RESOURCE_ID.value: resource_id, - "Symptoms": "No symptoms.", - } - else: return { ColumnNames.USER_ID.value: user_id, ColumnNames.RESOURCE_ID.value: resource_id, "Symptoms": "No symptoms.", } + return { + ColumnNames.USER_ID.value: user_id, + ColumnNames.RESOURCE_ID.value: resource_id, + "Symptoms": "No symptoms.", + } + def fetch_diagnosis_data( # pylint: disable=too-many-locals, too-many-branches db: Client, diff --git a/ecg_data_manager/modules/visualization.py b/ecg_data_manager/modules/visualization.py index 0747b6c..83c618d 100644 --- a/ecg_data_manager/modules/visualization.py +++ b/ecg_data_manager/modules/visualization.py @@ -7,11 +7,9 @@ # """ -This module provides classes and associated functions for viewing, filtering, and -analyzing ECG data. The primary class, ECGDataViewer, allows users to interact with -ECG data through a graphical interface, enabling the review, diagnosis, and visualization -of ECG recordings. The module also includes functions for plotting single lead ECGs and -configuring the appearance of the plots. +This module provides classes and functions for viewing, filtering, and analyzing ECG data. The +primary class, ECGDataViewer, allows users to interact with ECG data through a graphical interface, +enabling the review, diagnosis, and visualization of ECG recordings. """ # Standard library imports @@ -363,13 +361,14 @@ def plot_single_ecg(self, row): # pylint: disable=too-many-locals value=f"Average HR: {heart_rate} bpm" ) - symptoms_html = widgets.HTML(value=f"Symptoms: {symptoms}") + symptoms_html = widgets.HTML( + value=f"Symptoms: {symptoms}" + ) interpretation_html = widgets.HTML( value="Classification: " ) - # Conditional color for non-sinusRhythm classifications if ecg_interpretation != SINUS_RHYTHM: interpretation_html.value += ( f"{ecg_interpretation}" @@ -479,7 +478,6 @@ def hide_widgets(b): # pylint: disable=unused-argument ) ) - # Hide the widgets if not all selections have been made initials = ( self.initials_dropdown.value if self.initials_dropdown.value != WidgetStrings.OTHER.value @@ -494,10 +492,8 @@ def hide_widgets(b): # pylint: disable=unused-argument tracing_quality_dropdown.layout.visibility = "hidden" notes_textarea.layout.visibility = "hidden" - # Attach the hide_widgets function to the button's on_click event save_button.on_click(hide_widgets) - # Display the widgets widgets_box = widgets.VBox( [ diagnosis_dropdown, From e96ad52ee0c3890e0dc4754ff2fb110e86f967d5 Mon Sep 17 00:00:00 2001 From: Vicky Bikia Date: Sun, 8 Dec 2024 12:42:02 -0800 Subject: [PATCH 4/5] Linting --- ecg_data_manager/modules/visualization.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ecg_data_manager/modules/visualization.py b/ecg_data_manager/modules/visualization.py index 83c618d..fc4d313 100644 --- a/ecg_data_manager/modules/visualization.py +++ b/ecg_data_manager/modules/visualization.py @@ -507,7 +507,7 @@ def hide_widgets(b): # pylint: disable=unused-argument return widgets_box - def save_diagnosis( # pylint: disable=too-many-locals, too-many-arguments + def save_diagnosis( # pylint: disable=too-many-locals, too-many-positional-arguments self, user_id, document_id, From 82d5296abb92820f4fbff646a045b5c2355ecf5b Mon Sep 17 00:00:00 2001 From: Vicky Bikia Date: Sun, 8 Dec 2024 12:18:00 -0800 Subject: [PATCH 5/5] Linting --- ecg_data_manager/modules/visualization.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/ecg_data_manager/modules/visualization.py b/ecg_data_manager/modules/visualization.py index fc4d313..94b9f1a 100644 --- a/ecg_data_manager/modules/visualization.py +++ b/ecg_data_manager/modules/visualization.py @@ -507,7 +507,7 @@ def hide_widgets(b): # pylint: disable=unused-argument return widgets_box - def save_diagnosis( # pylint: disable=too-many-locals, too-many-positional-arguments + def save_diagnosis( # pylint: disable=too-many-locals, too-many-arguments, too-many-positional-arguments self, user_id, document_id,