Bump pmlb to 1.0.1.post3 and load all_summary_stats.tsv only through
pkgutil.get_data, removing the try/except that first tried the relative
path 'pmlb/all_summary_stats.tsv'. The bytes returned by get_data are now
decoded as UTF-8 and wrapped in StringIO before being passed to
pandas.read_csv.

NOTE(review): pkgutil.get_data is documented to return None when the
package loader does not support get_data; data.decode would then raise
AttributeError. Confirm that failure mode is acceptable.

diff --git a/pmlb/_version.py b/pmlb/_version.py
index c206b429d..cc271b1cd 100644
--- a/pmlb/_version.py
+++ b/pmlb/_version.py
@@ -23,4 +23,4 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 
 """
 
-__version__ = '1.0.1.post2'
+__version__ = '1.0.1.post3'
diff --git a/pmlb/dataset_lists.py b/pmlb/dataset_lists.py
index ae3cd2f0b..66dcf26cc 100644
--- a/pmlb/dataset_lists.py
+++ b/pmlb/dataset_lists.py
@@ -23,13 +23,10 @@ SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
 
 """
 import pathlib, pandas
-
-try: # used in repo
-    df_summary = pandas.read_csv('pmlb/all_summary_stats.tsv', sep='\t')
-except: # used in pypi pkg
-    import pkgutil
-    data = pkgutil.get_data('pmlb', 'all_summary_stats.tsv')
-    df_summary = pandas.read_csv(data , sep='\t')
+from io import StringIO
+import pkgutil
+data = pkgutil.get_data('pmlb', 'all_summary_stats.tsv')
+df_summary = pandas.read_csv(StringIO(data.decode("utf-8")) , sep='\t')
 regression_dataset_names = df_summary.query('task=="regression"')['dataset'].tolist()
 classification_dataset_names = df_summary.query('task=="classification"')['dataset'].tolist()
 dataset_names = regression_dataset_names + classification_dataset_names