Skip to content

Commit

Permalink
Include -y option to cli
Browse files Browse the repository at this point in the history
  • Loading branch information
luabida committed Dec 21, 2023
1 parent db02048 commit 2cada3e
Show file tree
Hide file tree
Showing 3 changed files with 58 additions and 18 deletions.
4 changes: 2 additions & 2 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -66,8 +66,8 @@ To use Episcanner Downloader, follow these steps:
```shell
cd dist/
./episcanner -h
./episcanner -s RJ -d dengue -o /tmp -f duckdb
./episcanner --all -d zika -o /tmp -f csv parquet --verbose
./episcanner -y 2023 -s RJ -d dengue -o /tmp -f duckdb
./episcanner -y 2021 2022 2023 --all -d zika -f csv parquet --verbose
```
*Replace <source> with the desired source (e.g., 'MG', or '--all' to download all states) and <diseases> with the specific diseases you want to download (e.g., 'dengue chikungunya'). Specify the <output_directory> where the data should be saved.*

Expand Down
68 changes: 53 additions & 15 deletions src/scanner/cli.py
Original file line number Diff line number Diff line change
@@ -1,17 +1,31 @@
"""
python src/scanner/cli.py -a -d dengue zika -f csv -v
python src/scanner/cli.py -y 2023 -a -d dengue zika -f csv -v
python src/scanner/cli.py -s SP RJ DF -d dengue zika -f csv parquet duckdb
python src/scanner/cli.py -y 2010 -s SP RJ DF -d dengue zika -f csv parquet duckdb
python src/scanner/cli.py -s SP -d zika -f csv -o /tmp
python src/scanner/cli.py -y 2020 2021 2022 -s SP -d zika -f csv -o /tmp
"""

import argparse
import datetime

from src.scanner.scanner import EpiScanner
from src.scanner.utils import CACHEPATH, STATES


class YearsAction(argparse.Action):
def __call__(self, parser, namespace, values, option_string=None):
cur_year = datetime.datetime.now().year
for value in values:
if int(value) < 2010 or int(value) > cur_year:
raise argparse.ArgumentError(
self,
f"Invalid year: {value}. "
f"Options: 2010 to {cur_year}",
)
setattr(namespace, self.dest, list(map(lambda x: x.lower(), values)))


class StatesAction(argparse.Action):
def __call__(self, parser, namespace, values, option_string=None):
for value in values:
Expand Down Expand Up @@ -49,6 +63,19 @@ def app():
description="Export EpiScanner data to duckdb, csv and parquet"
)

parser.add_argument(
"-y",
"--years",
nargs="+",
action=StatesAction,
help="""
Years to be scanned.
Example:
-y 2011 2022
""",
required=True,
)

parser.add_argument(
"-s",
"--states",
Expand Down Expand Up @@ -117,16 +144,27 @@ def app():
"-s/--states OR -a/--all"
)

for disease in args.diseases:
for format in args.file_format:
if args.all:
for state in STATES:
EpiScanner(disease, state, args.verbose).export(
format, args.output_dir
for year in args.years:
for disease in args.diseases:
for format in args.file_format:
if args.all:
for state in STATES:
EpiScanner(
disease=disease,
uf=state,
year=year,
verbose=args.verbose
).export(
to=format, output_dir=args.output_dir
)
break

for state in args.states:
EpiScanner(
disease=disease,
uf=state,
year=year,
verbose=args.verbose
).export(
to=format, output_dir=args.output_dir
)
break

for state in args.states:
EpiScanner(disease, state, args.verbose).export(
format, args.output_dir
)
4 changes: 3 additions & 1 deletion src/scanner/scanner.py
Original file line number Diff line number Diff line change
Expand Up @@ -145,7 +145,7 @@ def export(
self._to_duckdb(output_dir)
file = output_dir / "episcanner.duckdb"

logger.info(f"Data exported successfully to {file}")
logger.info(f"{self.uf} data for {self.year} wrote to {file}")
except (FileNotFoundError, PermissionError) as e:
raise ValueError(f"Failed to write file: {e}")
except Exception as e:
Expand Down Expand Up @@ -318,6 +318,8 @@ def _to_duckdb(self, output_dir: str):
).fetchone()[0]

if rows > 0:
if self.verbose:
logger.warning(f"Overriding data for {self.year}")
con.execute(
f"DELETE FROM '{table_name}'"
f" WHERE year = {self.year}"
Expand Down

0 comments on commit 2cada3e

Please sign in to comment.