@@ -60,11 +60,11 @@ def fit_predict_scores(self, data: pd.DataFrame, true_objects: pd.Series = None)
6060 """Fit the model and return scores.
6161
6262 Args:
63- data (DataFrame): Workers' outputs .
64- A pandas.DataFrame containing `task`, `worker` and `output ` columns.
65- true_objects (Series): Tasks' ground truth labels .
63+ data (DataFrame): Workers' responses .
64+ A pandas.DataFrame containing `task`, `worker` and `text ` columns.
65+ true_objects (Series): Tasks' ground truth texts .
6666 A pandas.Series indexed by `task` such that `labels.loc[task]`
67- is the tasks's ground truth label .
67+ is the task's ground truth text .
6868
6969 Returns:
7070 DataFrame: Tasks' label scores.
@@ -78,11 +78,11 @@ def fit_predict(self, data: pd.DataFrame, true_objects: pd.Series = None) -> pd.
7878 """Fit the model and return aggregated texts.
7979
8080 Args:
81- data (DataFrame): Workers' outputs .
82- A pandas.DataFrame containing `task`, `worker` and `output ` columns.
83- true_objects (Series): Tasks' ground truth labels .
81+ data (DataFrame): Workers' responses .
82+ A pandas.DataFrame containing `task`, `worker` and `text ` columns.
83+ true_objects (Series): Tasks' ground truth texts .
8484 A pandas.Series indexed by `task` such that `labels.loc[task]`
85- is the tasks's ground truth label .
85+ is the task's ground truth text .
8686
8787 Returns:
8888 Series: Tasks' texts.
@@ -91,11 +91,11 @@ def fit_predict(self, data: pd.DataFrame, true_objects: pd.Series = None) -> pd.
9191 """
9292
9393 hrrasa_results = self ._hrrasa .fit_predict (self ._encode_data (data ), self ._encode_true_objects (true_objects ))
94- self .texts_ = hrrasa_results .reset_index ()[['task' , 'output' ]].set_index ('task' )
94+ self .texts_ = hrrasa_results .reset_index ()[['task' , 'output' ]].rename ( columns = { 'output' : 'text' }). set_index ('task' )
9595 return self .texts_
9696
9797 def _encode_data (self , data : pd .DataFrame ) -> pd .DataFrame :
98- data = data [['task' , 'worker' , 'output ' ]]
98+ data = data [['task' , 'worker' , 'text ' ]]. rename ( columns = { 'text' : 'output' })
9999 data ['embedding' ] = data .output .apply (self .encoder )
100100 return data
101101
0 commit comments