(#343)(skip-models)(skip-preps)(skip-embs)

hosseinfani · hosseinfani · commit 7648236e92f9 · 2026-03-09T14:29:59.000-04:00
diff --git a/src/Adila b/src/Adila
@@ -1 +1 @@
-Subproject commit 577b78b783060c94544f61ef5a67bfda66b8a4e5
+Subproject commit eb5dc44c83c4940c0754387a81c4498670abc4f3
diff --git a/src/main.py b/src/main.py
@@ -117,10 +117,6 @@ def run(cfg):
         # if a list, all see the exact splits of teams.
         # if individual, they see different teams in splits. But as we show the average results, no big deal, esp., as we do n-fold
         models = {}
-        # model names t* will follow the streaming scenario
-        # model names *_ts have timestamp (year) as a single added feature
-        # model names *_ts2v learn temporal skill vectors via d2v when each doc is a stream of (skills: year of the team)
-        # non-temporal (no streaming scenario, bag of teams)
         assert len(cfg.models.instances) > 0, f'{opentf.textcolor["red"]}No model instance for training! Check ./src/__config__.yaml and models.instances ... {opentf.textcolor["reset"]}'
 
         # Get command-line overrides for models. Kinda tricky as we dynamically override a subconfig.
@@ -145,7 +141,7 @@ def run(cfg):
             # t2v object knows the embedding method and ...
             skill_vecs = t2v.get_dense_vecs(teamsvecs, vectype='skill')
             assert skill_vecs.shape[0] == teamsvecs['skill'].shape[0], f'{opentf.textcolor["red"]}Incorrect number of embeddings for teams subset of skills!{opentf.textcolor["reset"]}'
-            teamsvecs['original_skill'] = teamsvecs['skill'] #to accomodate skill_coverage metric and future use cases like in nmt
+            teamsvecs['original_skill'] = teamsvecs['skill'] #to accommodate skill_coverage metric and future use cases like in nmt
             teamsvecs['skill'] = skill_vecs
 
         for m in cfg.models.instances:
@@ -189,8 +185,9 @@ def run(cfg):
     log.info(f'{opentf.textcolor["green"]}Aggregating the test results under {cfg.data.output} per splits from test.pred.eval.mean.csv files ... {opentf.textcolor["reset"]}')
     aggregate(cfg.data.output)
 
-# sample runs for different configs, including different prep, embeddings, model training, ..., are available as unit-test in
+# sample runs for different configs, including different prep, embeddings, model training, ..., see unit-tests and scripts in
 # ./github/workflows/*.yml
+# ./ipynb/*.ipynb
 
 # To run on compute canada servers you can use the following command: (time is in minutes)
 #sbatch --account=def-hfani --mem=96000MB --time=2880 computecanada.sh
diff --git a/src/mdl/ntf.py b/src/mdl/ntf.py
@@ -105,6 +105,20 @@ def plot_roc(self, splits, on_train=False):
             # plt.show()
 
     def adila(self, teamsvecs, splits, faircfg):
+        def _avg_per_fold(files):
+            """For each kind in (fair, utility), average `<file>.eval.<kind>.mean.csv` over the folds and save it under the same name without the `f<fold>.` prefix; raises ValueError unless exactly one file matches each fold."""
+            from pathlib import Path
+            pd = opentf.install_import('pandas')
+            files = [f for f in files if not re.search(r'\.e\d+\.', os.path.basename(f))] #filter out per epoch files
+            for kind in ['fair', 'utility']:
+                dfs = []
+                for fold in splits['folds'].keys():
+                    fold_file = [f'{f}.eval.{kind}.mean.csv' for f in files if Path(f).name.startswith(f'f{fold}.')]
+                    if len(fold_file) != 1: raise ValueError(f'Expected one file for fold {fold} ({kind}), found {len(fold_file)}!')
+                    dfs.append(pd.read_csv(fold_file[0], index_col=0))
+                    out = Path(fold_file[0]).with_name(Path(fold_file[0]).name[len(f'f{fold}.'):]) # strip the fold prefix from the file name only; str.replace on the whole path could also hit parent folders
+                pd.concat(dfs).groupby(level=0).mean().to_csv(out) # rows sharing an index label across folds are averaged; concat raises ValueError when there is no fold
+
         from Adila.src.adila import Adila
         from Adila.src.main import _
         if not scipy.sparse.issparse(teamsvecs['skill']): teamsvecs['skill'] = teamsvecs['original_skill']  # to accomodate dense emb vecs of skills
@@ -116,4 +130,5 @@ def adila(self, teamsvecs, splits, faircfg):
                     stats, minorities, ratios = adila.prep(self.output, notion, attribute, is_popular_alg, faircfg.is_popular_coef, plot)
                     if notion == 'dp' and faircfg.dp_ratio: ratios = [1 - faircfg.ratio if attribute == 'popularity' else faircfg.ratio]
                     for algorithm in faircfg.algorithm:
-                        _(adila, self.output, minorities, ratios, algorithm, faircfg.k_max, faircfg.alpha, faircfg.acceleration, faircfg.eval)
+                        outputs = _(adila, self.output, minorities, ratios, algorithm, faircfg.k_max, faircfg.alpha, faircfg.acceleration, faircfg.eval)
+                        _avg_per_fold(outputs) # ideally, all the outputs should be in the same folder/path.