srun -t 1:00:00 -p datamover --mem=1G --pty bash -l
cd <this repo>/bin
./submit_parse.py ../yaml/uniprotkb-prod.yaml
srun -t 1:00:00 -p datamover --mem=64G -c 8 --pty bash -l
cd <this repo>
python -m uniprot_log_file_parser.merge \
'/hps/nobackup/martin/uniprot/users/dlrice/rest-log-parquets/prod/uniprotkb/parquet'
cd <this repo>
python -m uniprot_log_file_parser.parse_to_parquet \
--out_dir '/path/to/save/parquet/files' \
--log_path '/path/to/file.log'
cd <this repo>
python -m uniprot_log_file_parser.parse_to_parquet \
--out_dir '/path/to/save/parquet/files' \
--log_path '/path/to/legacy/file.log' \
--legacy
- Create a single configuration file in YAML
- Create a single point of execution for parse submission
- Create a Slurm job for the merge step