Spaces:

CoreyMorris
/

MMLU-by-task-Leaderboard

Running

Corey Morris committed on Aug 22, 2023

Commit

a5840fb

•

1 Parent(s): 916604b

removing models that are known to have training data contaminated with evaluations

Files changed (2) hide show

contaminated_models.txt ADDED Viewed

result_data_processor.py CHANGED Viewed

@@ -140,8 +140,20 @@ class ResultDataProcessor:
         # remove extreme outliers from column harness|truthfulqa:mc1
         data = self._remove_mc1_outliers(data)
         return data
     def rank_data(self):
         # add rank for each column to the dataframe
         # copy the data dataframe to avoid modifying the original dataframe

         # remove extreme outliers from column harness|truthfulqa:mc1
         data = self._remove_mc1_outliers(data)
+        data = self.manual_removal_of_models(data)
         return data
+    def manual_removal_of_models(self, df):
+        """Drop models listed in ``contaminated_models.txt`` from ``df``.
+
+        The list file holds one model name per line and is opened by its
+        relative path, so it is resolved against the current working
+        directory. Surrounding whitespace on each line is ignored and
+        blank lines are skipped.
+
+        Args:
+            df: DataFrame whose index labels are compared against the
+                listed model names.
+
+        Returns:
+            A DataFrame containing only the rows of ``df`` whose index
+            label does not appear in the list file.
+
+        Raises:
+            FileNotFoundError: If ``contaminated_models.txt`` is missing.
+        """
+        # Explicit encoding keeps decoding independent of the host locale.
+        with open('contaminated_models.txt', encoding='utf-8') as f:
+            # Strip each entry so trailing spaces or '\r' cannot make a
+            # listed model silently fail to match; skip empty lines.
+            contaminated_models = {
+                line.strip() for line in f if line.strip()
+            }
+        # Keep only rows whose index label is not in the removal list.
+        return df[~df.index.isin(contaminated_models)]
     def rank_data(self):
         # add rank for each column to the dataframe
         # copy the data dataframe to avoid modifying the original dataframe