
Commit cd7eadd

closes #989 #988 preparing for bumping version 5.5.4

2 parents: f0ca919 + 832c520

8 files changed: +25740, -84 lines

requirement/main.txt

Lines changed: 1 addition & 0 deletions
@@ -25,6 +25,7 @@ verboselogs==1.7
 s3fs==0.4.2 # pyup: ignore
 scikit-learn==1.6.1
 matplotlib==3.5.1
+matplotlib-inline==0.1.3
 seaborn==0.11.2
 ohio==0.5.0
 aequitas==0.42.0

src/triage/component/postmodeling/base.py

Lines changed: 50 additions & 10 deletions
@@ -5,11 +5,11 @@
 import seaborn as sns
 import matplotlib.table as tab
 import matplotlib.pyplot as plt
+import itertools
 #from tabulate import tabulate

 from IPython.display import display
-import itertools
-
+from io import StringIO
 from descriptors import cachedproperty
 from sqlalchemy import create_engine
 from sklearn.calibration import calibration_curve
@@ -475,15 +475,55 @@ def mean_ratio(pos, neg):
         crosstabs_df['model_id'] = self.model_id
         crosstabs_df['matrix_uuid'] = matrix_uuid

-
         if push_to_db:
-            logging.info('Pushing the results to the DB')
+            # logging.info('Pushing the results to the DB')
+            # crosstabs_df.set_index(
+            #     ['model_id', 'matrix_uuid', 'feature', 'metric', 'threshold_type', 'threshold'], inplace=True
+            # )
+
+            # # TODO: Figure out to change the owner of the table
+            # crosstabs_df.pg_copy_to(schema='test_results', name=table_name, con=self.engine, if_exists='append')
+            logging.info(f'Pushing the results to the database, {len(crosstabs_df)} rows')
+
             crosstabs_df.set_index(
-                ['model_id', 'matrix_uuid', 'feature', 'metric', 'threshold_type', 'threshold'], inplace=True
+                ['model_id', 'matrix_uuid', 'feature', 'metric', 'threshold_type', 'threshold'],
+                inplace=True
             )
-
-            # TODO: Figure out to change the owner of the table
-            crosstabs_df.pg_copy_to(schema='test_results', name=table_name, con=self.engine, if_exists='append')
+
+            crosstabs_df = crosstabs_df.reset_index()
+
+            if not table_exists(f'test_results.{table_name}', self.engine):
+                q = f'''
+                    create schema if not exists test_results;
+
+                    create table test_results.{table_name} (
+                        model_id INTEGER,
+                        matrix_uuid TEXT,
+                        feature TEXT,
+                        metric TEXT,
+                        threshold_type TEXT,
+                        threshold FLOAT,
+                        value FLOAT
+                    );
+                '''
+                # q = _generate_create_table_sql_statement_from_df(results, f'{table_schema}.{table_name}')
+                self.engine.execute(q)
+
+            conn = self.engine.raw_connection()
+            cursor = conn.cursor()
+
+            buffer = StringIO()
+            crosstabs_df.to_csv(buffer, index=False, header=False)
+            buffer.seek(0)
+
+            columns = ', '.join(crosstabs_df.columns)
+            print(columns)
+            cursor.copy_expert(f"COPY test_results.{table_name} ({columns}) FROM STDIN WITH CSV", buffer)
+            # results.to_sql(con=db_engine, schema=table_schema, name=table_name, if_exists='append')
+            conn.commit()
+            cursor.close()
+            conn.close()

         if return_df:
             return crosstabs_df
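The hunk above replaces `pg_copy_to` with a manual Postgres COPY: the frame is serialized to CSV in memory and streamed through `copy_expert`. A minimal, self-contained sketch of that pattern (hypothetical table name, connection string, and data; assumes a psycopg2-backed SQLAlchemy engine, which is what `raw_connection()` exposes here):

    from io import StringIO

    import pandas as pd
    from sqlalchemy import create_engine

    # hypothetical connection string and frame, for illustration only
    engine = create_engine('postgresql://user:pass@localhost/triage_db')
    df = pd.DataFrame({'model_id': [1, 2], 'value': [0.4, 0.7]})

    # serialize to CSV in memory; COPY streams it in one round trip,
    # which is far faster than row-by-row INSERTs for large frames
    buffer = StringIO()
    df.to_csv(buffer, index=False, header=False)
    buffer.seek(0)

    conn = engine.raw_connection()  # underlying psycopg2 connection
    try:
        cursor = conn.cursor()
        columns = ', '.join(df.columns)
        cursor.copy_expert(f"COPY test_results.my_table ({columns}) FROM STDIN WITH CSV", buffer)
        conn.commit()
        cursor.close()
    finally:
        conn.close()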
@@ -1136,7 +1176,7 @@ def get_model_ids(self):
             and model_group_id in ('{model_groups}')
         """
         # TODO do we really need experiment_hashes here? can we query with only model_group_ids?
-
+
         # TODO: modify to remove pandas
         models = pd.read_sql(q, self.engine).to_dict(orient='records')

@@ -1197,7 +1237,7 @@ def _make_plot_grid(self, plot_type, subplot_width=3, subplot_len=None, sharey=F
         """
         fig, axes = self._get_subplots(subplot_width=subplot_width, subplot_len=subplot_len, sharey=sharey, sharex=sharex)

-        print(len(axes), len(axes[0]))
+        logging.info(f"{len(axes), len(axes[0])}")

         for j, mg in enumerate(self.models):
             for i, train_end_time in enumerate(self.models[mg]):

src/triage/component/postmodeling/experiment_summarizer.py

Lines changed: 111 additions & 66 deletions
@@ -1,15 +1,17 @@

 """ This is a module for moving the ad-hoc code we wrote in generating the modeling report"""
+import verboselogs, logging
+
+logger = verboselogs.VerboseLogger(__name__)

 import pandas as pd
 import json
 import matplotlib.pyplot as plt
 import seaborn as sns
-import logging
-from matplotlib.lines import Line2D
-
 import warnings

+from matplotlib.lines import Line2D
+
 from triage.component.timechop.plotting import visualize_chops_plotly
 from triage.component.timechop import Timechop
 from triage.component.audition.plotting import plot_cats
from triage.component.audition.plotting import plot_cats
@@ -112,7 +114,12 @@ def get_most_recent_experiment_hash(engine):

 class ExperimentReport:

-    def __init__(self, engine, experiment_hashes, performance_priority_metric, threshold, bias_priority_metric, bias_priority_groups):
+    def __init__(self, engine,
+                 experiment_hashes,
+                 performance_priority_metric='recall@',
+                 threshold="1_pct",
+                 bias_priority_metric='tpr_disparity',
+                 bias_priority_groups=None):
         self.engine = engine
         self.experiment_hashes = experiment_hashes
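With these keyword defaults, a report can now be constructed from just an engine and the experiment hashes. A hypothetical usage sketch (illustrative connection string and hash):

    from sqlalchemy import create_engine

    engine = create_engine('postgresql://user:pass@localhost/triage_db')

    # remaining arguments fall back to recall@ at 1_pct for performance
    # and tpr_disparity across all groups for bias
    report = ExperimentReport(engine, experiment_hashes=['abc123'])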
@@ -429,33 +436,51 @@ def model_performance(self, metric=None, parameter=None, generate_plot=True):
             parameter = self.threshold

         # fetch model groups
-        q = f'''
-        with models as (
+        def fetch_evaluation_values(with_parameter=True):
+            if with_parameter:
+                parameter_stmt = f"and e.parameter = '{parameter}'"
+            else:
+                parameter_stmt = ''
+
+            q = f'''
+            with models as (
+                select
+                distinct model_id,
+                train_end_time,
+                model_group_id,
+                model_type,
+                hyperparameters
+                from triage_metadata.experiment_models join triage_metadata.models using(model_hash)
+                where experiment_hash in ('{"','".join(self.experiment_hashes)}')
+            )
             select
-            distinct model_id,
-            train_end_time,
-            model_group_id,
+            m.model_id,
+            train_end_time::date as train_end_time_dt,
+            to_char(train_end_time, 'YYYY-MM-DD') as train_end_time,
             model_type,
-            hyperparameters
-            from triage_metadata.experiment_models join triage_metadata.models using(model_hash)
-            where experiment_hash in ('{"','".join(self.experiment_hashes)}')
-            )
-            select
-            m.model_id,
-            train_end_time::date as train_end_time_dt,
-            to_char(train_end_time, 'YYYY-MM-DD') as train_end_time,
-            model_type,
-            model_group_id,
-            stochastic_value as metric_value
-            from models m left join test_results.evaluations e
-            on m.model_id = e.model_id
-            and e.metric = '{metric}'
-            and e.parameter = '{parameter}'
-            and e.subset_hash = ''
-        '''
-
-
+            model_group_id,
+            stochastic_value as metric_value,
+            parameter
+            from models m left join test_results.evaluations e
+            on m.model_id = e.model_id
+            and e.metric = '{metric}'
+            {parameter_stmt}
+            and e.subset_hash = ''
+            '''
+            return q
+
+        # 1. fetch evaluation values to check if we have
+        q = fetch_evaluation_values()
         df = pd.read_sql(q, self.engine)
+        # Validate that we have value for the DEFAULT metric and parameter
+        if df.metric_value.isna().unique():
+            q = fetch_evaluation_values(with_parameter=False)
+            df = pd.read_sql(q, self.engine)
+            # fetch the first available value
+            parameter_ = df.loc[0, 'parameter']
+            self.threshold = parameter_
+            df = df[df.parameter == parameter_]
+
         df['train_end_time'] = pd.to_datetime(df.train_end_time, format='%Y-%m-%d')

         models_per_train_end_time = df.groupby(['model_group_id', 'train_end_time']).count()['model_id']
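The intent of the new control flow above: run the evaluations query with the default parameter filter first, and if no metric values come back, re-run without the filter and adopt the first parameter that does exist, storing it back on `self.threshold` so later output stays consistent. A condensed sketch of that fallback with hypothetical names; it tests emptiness with the more explicit `.isna().all()` rather than the `.isna().unique()` truthiness check in the committed code:

    import pandas as pd

    def load_metric_values(engine, build_query, default_parameter):
        # build_query(with_parameter=...) is a stand-in for fetch_evaluation_values
        df = pd.read_sql(build_query(with_parameter=True), engine)
        if df.metric_value.isna().all():
            # no evaluations at the default parameter; take whatever exists
            df = pd.read_sql(build_query(with_parameter=False), engine)
            fallback = df.loc[0, 'parameter']
            return df[df.parameter == fallback], fallback
        return df, default_parameter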
@@ -508,27 +533,45 @@ def model_performance_subsets(self, metric=None, parameter=None, generate_plot=T
         if parameter is None:
             parameter = self.threshold

-        q = f'''
-        select
-            case when e.subset_hash is null then 'full_cohort'
-            else s.config ->> 'name'
-            end as "subset",
-            e.subset_hash,
-            m.model_id,
-            m.model_group_id,
-            m.model_type,
-            m.train_end_time::date,
-            e.stochastic_value as metric_value
-        from triage_metadata.experiment_models join triage_metadata.models m using(model_hash)
-            left join test_results.evaluations e
-            on m.model_id = e.model_id
-            and e.parameter = '{parameter}'
-            and e.metric = '{metric}'
-            left join triage_metadata.subsets s on e.subset_hash = s.subset_hash
-        where experiment_hash in ('{"','".join(self.experiment_hashes)}')
-        '''
+        def fetch_evaluation_values_subsets(with_parameter=True):
+            if with_parameter:
+                parameter_stmt = f"and e.parameter = '{parameter}'"
+            else:
+                parameter_stmt = ''
+
+            q = f'''
+            select
+                case when e.subset_hash is null then 'full_cohort'
+                else s.config ->> 'name'
+                end as "subset",
+                e.subset_hash,
+                m.model_id,
+                m.model_group_id,
+                m.model_type,
+                m.train_end_time::date,
+                e.stochastic_value as metric_value,
+                parameter
+            from triage_metadata.experiment_models join triage_metadata.models m using(model_hash)
+                left join test_results.evaluations e
+                on m.model_id = e.model_id
+                and e.parameter = '{parameter}'
+                {parameter_stmt}
+                left join triage_metadata.subsets s on e.subset_hash = s.subset_hash
+            where experiment_hash in ('{"','".join(self.experiment_hashes)}')
+            '''
+
+            return q

+        q = fetch_evaluation_values_subsets()
         df = pd.read_sql(q, self.engine)
+        # Validate that we have value for the DEFAULT metric and parameter
+        if df.metric_value.isna().unique():
+            q = fetch_evaluation_values_subsets(with_parameter=False)
+            df = pd.read_sql(q, self.engine)
+            # fetch the first available value
+            parameter_ = df.loc[0, 'parameter']
+            self.threshold = parameter_
+            df = df[df.parameter == parameter_]

         if (df.empty) or (None in df.subset.unique()):
             return None
@@ -921,39 +964,41 @@ def generate_summary(self, metric=None, parameter=None, equity_metric=None):
         if equity_metric is None:
             equity_metric = self.bias_metric

-
+        logger.notice(f"Default performance parameters are set to recall@1_pct and bias metric to tpr_disparity!")
+        logger.notice("==> In case your experiment doesn't have those parameters Triage will use one of the available. <==")
         stats = self.experiment_stats()

         if stats['implemented_fewer_splits'] == 1:
-            print(f"Temporal config suggests {stats['timesplits_from_temporal_config']} temporal splits, but experiment implemented only {stats['validation_splits']} splits. Was this intentional?")
+            logger.notice(f"Temporal config suggests {stats['timesplits_from_temporal_config']} temporal splits, but experiment implemented only {stats['validation_splits']} splits. Was this intentional?")
         else:
-            print(f'Experiment contained {stats["timesplits_from_temporal_config"]} temporal splits')
+            logger.notice(f'Experiment contained {stats["timesplits_from_temporal_config"]} temporal splits')

-
-        print(f"Experiment contained {stats['as_of_times']} distinct as_of_times")
+        logger.notice(f"Experiment contained {stats['as_of_times']} distinct as_of_times")

         cohorts = self.cohorts(generate_plots=False)
-        print(f'On average, your cohorts contained around {round(cohorts.cohort_size.mean())} entities with a baserate of {round(cohorts.baserate.mean(), 3)}')
-
-        print(f"You built {stats['features']} features organized into {stats['feature_groups']} groups/blocks")
+        logger.notice(f'On average, your cohorts contained around {round(cohorts.cohort_size.mean())} entities with a baserate of {round(cohorts.baserate.mean(), 3)}')

-        print(f"Your model grid specification contained {stats['grid_size']} model types with {stats['models_needed']} individual models")
+        logger.notice(f"You built {stats['features']} features organized into {stats['feature_groups']} groups/blocks")
+
+        logger.notice(f"Your model grid specification contained {stats['grid_size']} model types with {stats['models_needed']} individual models")

         ## Models
         num_models = len(self.models())
         if num_models < stats['models_needed']:
-            print(f"However, the experiment only built {num_models} models. You are missing {stats['models_needed'] - num_models} models")
+            logger.notice(f"However, the experiment only built {num_models} models. You are missing {stats['models_needed'] - num_models} models")

         else:
-            print(f"You successfully built all the {num_models} models")
+            logger.notice(f"You successfully built all the {num_models} models")

         # Model Performance
         performance = self.model_performance(metric=metric, parameter=parameter, generate_plot=False)
         best_performance = performance.groupby(['model_group_id', 'model_type'])['metric_value'].mean().max()
         best_model_group = performance.groupby(['model_group_id', 'model_type'])['metric_value'].mean().idxmax()[0]
         best_model_type = performance.groupby(['model_group_id', 'model_type'])['metric_value'].mean().idxmax()[1]
-
-        print(f"Your models acheived a best average {metric}{parameter} of {round(best_performance, 3)} over the {stats['validation_splits']} validation splits, with the Model Group {best_model_group},{best_model_type}. Note that model selection is more nuanced than average predictive performance over time. You could use Audition for model selection.")
+
+        # because we could change the value of the default parameter in case it doesn't exist,
+        # it is safer to take it from the object itself.
+        logger.notice(f"Your models achieved a best average {self.performance_metric}{self.threshold} of {round(best_performance, 3)} over the {stats['validation_splits']} validation splits, with the Model Group {best_model_group},{best_model_type}. Note that model selection is more nuanced than average predictive performance over time. You could use Audition for model selection.")

         ## Subsets
         subset_performance = self.model_performance_subsets(metric=metric, parameter=parameter, generate_plot=False)
@@ -969,11 +1014,11 @@ def generate_summary(self, metric=None, parameter=None, equity_metric=None):
             res.append(d)

         if len(res) > 0:
-            print(f"You created {len(res)} subsets of your cohort -- {', '.join([x['subset'] for x in res])}")
+            logger.notice(f"You created {len(res)} subsets of your cohort -- {', '.join([x['subset'] for x in res])}")
             for d in res:
-                print(f"For subset '{d['subset'] }', Model Group {d['best_mod'][0]}, {d['best_mod'][1]} achieved the best average {metric}{parameter} of {d['best_perf']}")
+                logger.notice(f"For subset '{d['subset'] }', Model Group {d['best_mod'][0]}, {d['best_mod'][1]} achieved the best average {metric}{parameter} of {d['best_perf']}")
         else:
-            print("No subsets defined.")
+            logger.notice("No subsets defined.")

         ## Bias
         equity_metrics = self.efficiency_and_equity(
@@ -986,11 +1031,11 @@ def generate_summary(self, metric=None, parameter=None, equity_metric=None):
         if equity_metrics is not None:
             grpobj = equity_metrics[(equity_metrics.baserate > 0) & (equity_metrics.model_group_id == best_model_group)].groupby('attribute_name')
             for attr, gdf in grpobj:
-                print(f'Measuring biases across {attr} groups using {equity_metric} for the best performing model:')
+                logger.notice(f"Measuring biases across {attr} groups using {equity_metric} for the best performing model:")
                 d = gdf.groupby('attribute_value')[equity_metric].mean()
-                print(", ".join(f"{k}: {round(v, 3)}" for k, v, in d.to_dict().items()))
+                logger.notice(", ".join(f"{k}: {round(v, 3)}" for k, v, in d.to_dict().items()))
         else:
-            print(f"No bias audit results were found in the database for the experiment.")
+            logger.notice(f"No bias audit results were found in the database for the experiment.")


     def precision_recall_curves(self, plot_size=(3,3)):
