From c56d2b1a0ecf4e0d8efa4ea76e8cae3decc788d5 Mon Sep 17 00:00:00 2001 From: =?UTF-8?q?Lu=C3=A3=20Bida=20Vacaro?= <82233055+luabida@users.noreply.github.com> Date: Fri, 3 Feb 2023 10:56:10 -0300 Subject: [PATCH] fix(sinan): remove hardcoded data path when extracting from pysus (#113) bugfix --- pysus/online_data/SINAN.py | 2 +- pysus/online_data/__init__.py | 16 ++++++++++------ 2 files changed, 11 insertions(+), 7 deletions(-) diff --git a/pysus/online_data/SINAN.py b/pysus/online_data/SINAN.py index cd9e3750..9b0b16f0 100644 --- a/pysus/online_data/SINAN.py +++ b/pysus/online_data/SINAN.py @@ -151,7 +151,7 @@ def download(disease, year, return_chunks=False, data_path="/tmp/pysus"): if not Path(out).exists(): logger.debug(f"{fname} file not found. Proceeding to download..") try: - _fetch_file(fname, sus_path, "DBC", return_df=False) + _fetch_file(fname, sus_path, "DBC", return_df=False, data_path=data_path) logger.info(f"{fname} downloaded at {data_path}") except Exception as e: diff --git a/pysus/online_data/__init__.py b/pysus/online_data/__init__.py index 9e175f65..37990ddd 100644 --- a/pysus/online_data/__init__.py +++ b/pysus/online_data/__init__.py @@ -34,7 +34,11 @@ def cache_contents(): def _fetch_file( - fname: str, path: str, ftype: str, return_df: bool = True + fname: str, + path: str, + ftype: str, + return_df: bool = True, + data_path: str = '/tmp/pysus' ) -> pd.DataFrame: """ Fetch a single file. @@ -48,27 +52,27 @@ def _fetch_file( ftp.login() ftp.cwd(path) - Path('/tmp/pysus').mkdir(exist_ok=True) + Path(data_path).mkdir(exist_ok=True) try: - ftp.retrbinary(f"RETR {fname}", open(f'/tmp/pysus/{fname}', "wb").write) + ftp.retrbinary(f"RETR {fname}", open(f'{Path(data_path) / fname}', "wb").write) except Exception: raise Exception("File {} not available on {}".format(fname, path)) if return_df: - df = get_dataframe(f'/tmp/pysus/{fname}', ftype) + df = get_dataframe(fname, ftype, data_path) return df else: return pd.DataFrame() -def get_dataframe(fname: str, ftype: str) -> pd.DataFrame: +def get_dataframe(fname: str, ftype: str, data_path: str = '/tmp/pysus') -> pd.DataFrame: """ Return a dataframe read fom temporary file on disk. :param fname: temporary file name :param ftype: 'DBC' or 'DBF' :return: DataFrame """ - fname = f'/tmp/pysus/{fname}' + fname = Path(data_path) / fname if ftype == "DBC": df = read_dbc(fname, encoding="iso-8859-1", raw=False)