Merge pull request #141 from bptlab/refactor/134-code-check-tte

Refactor/134 code check Trace Testing Environment
bptlab · May 25, 2024 · 0dee86c · 0dee86c
2 parents 6fae209 + 3f5d28d
commit 0dee86c
Show file tree

Hide file tree

Showing 9 changed files with 1,194 additions and 1,243 deletions.
diff --git a/tracex_project/db.sqlite3 b/tracex_project/db.sqlite3
diff --git a/tracex_project/extraction/fixtures/prompts_fixture.json b/tracex_project/extraction/fixtures/prompts_fixture.json
diff --git a/tracex_project/extraction/logic/modules/module_metrics_analyzer.py b/tracex_project/extraction/logic/modules/module_metrics_analyzer.py
@@ -92,7 +92,7 @@ def __rate_activity_relevance(activity: str, condition: str | None) -> str:
         return category
 
     def __rate_timestamps_correctness(
-        self, activity: str, start: pd.DateTime, end: pd.DateTime
+        self, activity: str, start, end
     ) -> Tuple[str, float]:
         messages = Prompt.objects.get(name="METRIC_TIMESTAMP_MESSAGES").text
         messages.append(

diff --git a/tracex_project/trace_comparator/comparator.py b/tracex_project/trace_comparator/comparator.py
@@ -1,41 +1,51 @@
 """The trace comparator compares the pipeline output against a ground truth and vice versa."""
 import time
+from typing import List, Tuple
 from pathlib import Path
 from django.conf import settings
+import pandas as pd
 
 from extraction.models import Prompt
 from tracex.logic.logger import log_execution_time
 from tracex.logic import utils as u, constants as c
 
 
 @log_execution_time(Path(settings.BASE_DIR / "tracex/logs/execution_time.log"))
-def compare_traces(view, pipeline_df, ground_truth_df):
-    """Executes the trace comparison."""
-    pipeline_activities = pipeline_df["activity"]
-    ground_truth_activities = ground_truth_df["activity"]
+def compare_traces(
+    view, pipeline_df: pd.DataFrame, ground_truth_df: pd.DataFrame
+) -> dict:
+    """Executes the trace comparison.
+
+    Compare the pipeline output to the ground truth and determine all matching activities. Classify every activity
+    from the ground truth that has no match as 'missing' and every activity from the pipeline output that
+    has no match as 'unexpected'. Finally, determine activities from the pipeline that are correctly
+    matched but in the wrong order.
+    """
+    pipeline_activities: pd.Series = pipeline_df["activity"]
+    ground_truth_activities: pd.Series = ground_truth_df["activity"]
 
     (
         mapping_pipeline_to_ground_truth,
         mapping_ground_truth_to_pipeline,
     ) = find_activity_mapping(view, pipeline_activities, ground_truth_activities)
-    missing_activities = find_unmapped_activities(
+    missing_activities: List[str] = find_unmapped_activities(
         ground_truth_activities, mapping_ground_truth_to_pipeline
     )
-    unexpected_activities = find_unmapped_activities(
+    unexpected_activities: List[str] = find_unmapped_activities(
         pipeline_activities, mapping_pipeline_to_ground_truth
     )
-    wrong_orders = find_wrong_orders(
+    wrong_orders: List[Tuple[str, str]] = find_wrong_orders(
         pipeline_activities, mapping_ground_truth_to_pipeline
     )
 
-    matching_percent_pipeline_to_ground_truth = find_matching_percentage(
+    matching_percent_pipeline_to_ground_truth: int = find_matching_percentage(
         pipeline_activities, mapping_pipeline_to_ground_truth
     )
-    matching_percent_ground_truth_to_pipeline = find_matching_percentage(
+    matching_percent_ground_truth_to_pipeline: int = find_matching_percentage(
         ground_truth_activities, mapping_ground_truth_to_pipeline
     )
 
-    results_dict = {
+    results: dict = {
         "mapping_pipeline_to_ground_truth": mapping_pipeline_to_ground_truth,
         "mapping_ground_truth_to_pipeline": mapping_ground_truth_to_pipeline,
         "missing_activities": missing_activities,
@@ -45,27 +55,29 @@ def compare_traces(view, pipeline_df, ground_truth_df):
         "matching_percent_ground_truth_to_pipeline": matching_percent_ground_truth_to_pipeline,
     }
 
-    return results_dict
+    return results
 
 
-def find_activity_mapping(view, pipeline_activities, ground_truth_activities):
-    """Find the activity mapping between two dataframes"""
-    total_steps = len(pipeline_activities) + len(ground_truth_activities)
-    half_progress = len(pipeline_activities)
+def find_activity_mapping(
+    view, pipeline_activities: pd.Series, ground_truth_activities: pd.Series
+) -> Tuple[List[int], List[int]]:
+    """Create a mapping of activities from the pipeline to the ground truth and vice versa."""
+    total_steps: int = len(pipeline_activities) + len(ground_truth_activities)
+    half_progress: int = len(pipeline_activities)
 
     mapping_pipeline_to_ground_truth = compare_activities(
         view,
         0,
         total_steps,
-        "Mapping Pipeline Activites to Ground Truth Activites",
+        "Mapping pipeline activities to ground truth activities",
         pipeline_activities,
         ground_truth_activities,
     )
     mapping_ground_truth_to_pipeline = compare_activities(
         view,
         half_progress,
         total_steps,
-        "Mapping Ground Truth Activites to Pipeline Activites",
+        "Mapping ground truth activities to pipeline activities",
         ground_truth_activities,
         pipeline_activities,
     )
@@ -82,14 +94,14 @@ def find_activity_mapping(view, pipeline_activities, ground_truth_activities):
 
 def compare_activities(
     view,
-    current_step,
-    total_steps,
-    status,
-    input_activities,
-    comparison_basis_activities,
-):
-    """Compare input activities with comparison basis activities."""
-    mapping_input_to_comparison = []
+    current_step: int,
+    total_steps: int,
+    status: str,
+    input_activities: pd.Series,
+    comparison_basis_activities: pd.Series,
+) -> List[Tuple[int, float]]:
+    """Compare input activities with comparison basis activities."""
+    mapping_input_to_comparison: List[Tuple[int, float]] = []
     for index, activity in enumerate(input_activities):
         update_progress(view, current_step, total_steps, status)
         find_activity(
@@ -98,18 +110,29 @@ def compare_activities(
             index,
             mapping_input_to_comparison,
         )
-        time.sleep(2)
+        time.sleep(2)  # this prevents the token limit per minute from being exceeded
         current_step += 1
 
     return mapping_input_to_comparison
 
 
 def find_activity(
-    activity, comparison_basis_activities, index, mapping_input_to_comparison
-):
-    """Compares a target activity against potential matches to identify the best match based on similarity."""
-    lower, upper = u.get_snippet_bounds(index, len(comparison_basis_activities))
-    possible_matches = []
+    activity,
+    comparison_basis_activities: pd.Series,
+    activity_index: int,
+    mapping_input_to_comparison: List[Tuple[int, float]],
+) -> None:
+    """Compares an activity against potential matches to identify the best match based on
+    similarity.
+
+    An activity from the newly made extraction is compared against each activity from the ground truth that lies within a
+    certain range. For instance, an activity with index 5 is compared to activities 3-7 from the ground truth. Both
+    activities are sent to the GPT model to determine if they are semantically similar.
+    """
+    lower, upper = u.get_snippet_bounds(
+        activity_index, len(comparison_basis_activities)
+    )
+    possible_matches: List[Tuple[int, float]] = []
     for count, second_activity in enumerate(comparison_basis_activities[lower:upper]):
         messages = Prompt.objects.get(name="COMPARE_MESSAGES").text
         messages.append(
@@ -118,34 +141,44 @@ def find_activity(
                 "content": f"First: {activity}\nSecond: {second_activity}",
             }
         )
-        response, top_logprops = u.query_gpt(messages, logprobs=True, top_logprobs=1)
-        linear_prop = u.calculate_linear_probability(top_logprops[0].logprob)
+        response, top_logprobs = u.query_gpt(messages, logprobs=True, top_logprobs=1)
+        linear_prop = u.calculate_linear_probability(top_logprobs[0].logprob)
         if "True" in response:
             possible_matches.append((lower + count, linear_prop))
-    if possible_matches:
-        best_match = max(possible_matches, key=lambda x: x[1])
-        if best_match[1] > c.THRESHOLD_FOR_MATCH:
-            mapping_input_to_comparison.append(best_match)
-            return
-    mapping_input_to_comparison.append((-1, 0))
+
+    mapping_input_to_comparison.append(
+        max(
+            (
+                (index, prob)
+                for index, prob in possible_matches
+                if prob > c.THRESHOLD_FOR_MATCH
+            ),
+            key=lambda x: x[1],
+            default=(-1, 0),
+        )
+    )
 
 
-def postprocess_mappings(mapping_data_to_groundtruth, mapping_groundtruth_to_data):
+def postprocess_mappings(
+    mapping_data_to_ground_truth: List, mapping_ground_truth_to_data: List
+) -> Tuple[List[int], List[int]]:
     """Postprocess the mappings between data and ground truth."""
-    mapping_data_to_groundtruth = fill_mapping(
-        mapping_data_to_groundtruth, mapping_groundtruth_to_data
+    mapping_data_to_ground_truth = fill_mapping(
+        mapping_data_to_ground_truth, mapping_ground_truth_to_data
     )
-    mapping_groundtruth_to_data = fill_mapping(
-        mapping_groundtruth_to_data, mapping_data_to_groundtruth
+    mapping_ground_truth_to_data = fill_mapping(
+        mapping_ground_truth_to_data, mapping_data_to_ground_truth
     )
-    mapping_data_to_groundtruth = remove_probabilities(mapping_data_to_groundtruth)
-    mapping_groundtruth_to_data = remove_probabilities(mapping_groundtruth_to_data)
+    mapping_data_to_ground_truth = remove_probabilities(mapping_data_to_ground_truth)
+    mapping_ground_truth_to_data = remove_probabilities(mapping_ground_truth_to_data)
 
-    return mapping_data_to_groundtruth, mapping_groundtruth_to_data
+    return mapping_data_to_ground_truth, mapping_ground_truth_to_data
 
 
-def fill_mapping(mapping_back_to_forth, mapping_forth_to_back):
-    """Fill the missing mappings using the reverse mapping."""
+def fill_mapping(mapping_back_to_forth: List, mapping_forth_to_back: List) -> List:
+    """Fill up missing mappings using the reverse mapping and update existing mappings if ones with higher
+    probabilities are found. If an activity has no mapping on either side, leave it as is.
+    """
     for index_forth, activity_index_forth in enumerate(mapping_back_to_forth):
         if activity_index_forth[0] == -1:
             possible_matches = []
@@ -159,42 +192,51 @@ def fill_mapping(mapping_back_to_forth, mapping_forth_to_back):
     return mapping_back_to_forth
 
 
-def remove_probabilities(mapping):
+def remove_probabilities(mapping: List[Tuple[int, float]]) -> List[int]:
     """Remove the probabilities from the mapping."""
     new_mapping = [elem[0] for elem in mapping]
 
     return new_mapping
 
 
-def find_matching_percentage(input_activities, mapping_input_to_comparison):
+def find_matching_percentage(
+    input_activities: pd.Series, mapping_input_to_comparison: list
+) -> int:
     """Calculate the percentage of matching activities."""
-    total_matching_activities = len(
-        [elem for elem in mapping_input_to_comparison if elem != -1]
+    total_matching_activities: int = sum(
+        1 for elem in mapping_input_to_comparison if elem != -1
     )
-    matching_percentage = round(
+    matching_percentage: int = round(
         total_matching_activities / input_activities.shape[0] * 100
     )
 
     return matching_percentage
 
 
-def find_unmapped_activities(activities, mapping):
-    """Find the activities that are not mapped."""
+def find_unmapped_activities(activities: pd.Series, mapping: list) -> List[str]:
+    """Find the activities that are not mapped, indicated by mapping index -1."""
     return [
         activities[index]
-        for index, match_index in enumerate(mapping)
-        if match_index == -1
+        for index, mapping_index in enumerate(mapping)
+        if mapping_index == -1
     ]
 
 
-def find_wrong_orders(df_activities, mapping_groundtruth_to_data):
-    """Find the activities that are in the wrong order."""
-    wrong_orders_indices = []
-    wrong_orders_activities = []
-    for index, first_activity_index in enumerate(mapping_groundtruth_to_data):
+def find_wrong_orders(
+    df_activities: pd.Series, mapping_ground_truth_to_data: List[int]
+) -> List[Tuple[str, str]]:
+    """Find the activities that are in the wrong order.
+
+    For every activity in the provided dataframe, the function checks if the mapped activity in the ground truth has a
+    smaller index, indicating the activity should have been found earlier. All activities and their mapped counterparts
+    from the ground truth are saved in a list and returned.
+    """
+    wrong_orders_indices: List[Tuple[int, int]] = []
+    wrong_orders_activities: List[Tuple[str, str]] = []
+    for index, first_activity_index in enumerate(mapping_ground_truth_to_data):
         if first_activity_index == -1:
             continue
-        for second_activity_index in mapping_groundtruth_to_data[index:]:
+        for second_activity_index in mapping_ground_truth_to_data[index:]:
             if second_activity_index == -1:
                 continue
             if first_activity_index > second_activity_index:
@@ -216,8 +258,8 @@ def find_wrong_orders(df_activities, mapping_groundtruth_to_data):
     return wrong_orders_activities
 
 
-def update_progress(view, current_step, total_steps, status):
-    """Update the progress of the extraction."""
+def update_progress(view, current_step: int, total_steps: int, status: str) -> None:
+    """Update the progress of the extraction, by updating the session variables."""
     if view is not None:
         percentage = round((current_step / total_steps) * 100)
         view.request.session["progress"] = percentage

diff --git a/tracex_project/trace_comparator/forms.py b/tracex_project/trace_comparator/forms.py
@@ -1,22 +1,26 @@
 """Implementation of forms for the trace comparator app."""
+from typing import List, Tuple
+
 from django import forms
 from extraction.models import PatientJourney
 
 
 class PatientJourneySelectForm(forms.Form):
-    """Form for selecting ground truth patient journey."""
+    """Form for selecting a patient journey to use in the trace testing environment."""
 
     selected_patient_journey = forms.ChoiceField(choices=[])
 
     def __init__(self, *args, **kwargs):
-        """Initializes the PatientJourneySelectForm."""
+        """Initializes the PatientJourneySelectForm with available choices."""
         super().__init__(*args, **kwargs)
         self.fields[
             "selected_patient_journey"
         ].choices = self.get_patient_journey_choices()
 
-    def get_patient_journey_choices(self):
-        """Retrieves the available patient journey choices from the database."""
+    @staticmethod
+    def get_patient_journey_choices() -> List[Tuple[str, str]]:
+        """Retrieves the available patient journey choices from the database. Available choices are those with a
+        saved ground truth."""
         patient_journeys = PatientJourney.manager.filter(
             name__contains="journey_comparison_"
         )