X-Git-Url: https://code.communitydata.science/cdsc_reddit.git/blobdiff_plain/4cb7eeec80c5a9c8f49339acd378c515e290ed81..65deba5e4e4ad9e3f23e82573491f7d6b190e644:/clustering/lsi_base.py diff --git a/clustering/lsi_base.py b/clustering/lsi_base.py index 45cc49b..80b7101 100644 --- a/clustering/lsi_base.py +++ b/clustering/lsi_base.py @@ -18,11 +18,12 @@ class lsi_grid_sweep(grid_sweep): self.subsweep = subsweep inpath = Path(inpath) if lsi_dimensions == 'all': - lsi_paths = list(inpath.glob("*")) + lsi_paths = list(inpath.glob("*.feather")) else: - lsi_paths = [inpath / (dim + '.feather') for dim in lsi_dimensions] + lsi_paths = [inpath / (str(dim) + '.feather') for dim in lsi_dimensions] - lsi_nums = [p.stem for p in lsi_paths] + print(lsi_paths) + lsi_nums = [int(p.stem) for p in lsi_paths] self.hasrun = False self.subgrids = [self.subsweep(lsi_path, outpath, lsi_dim, *args, **kwargs) for lsi_dim, lsi_path in zip(lsi_nums, lsi_paths)] self.jobs = list(chain(*map(lambda gs: gs.jobs, self.subgrids)))