diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml index f258d8dda..757033acc 100644 --- a/.pre-commit-config.yaml +++ b/.pre-commit-config.yaml @@ -1,6 +1,8 @@ --- ci: autoupdate_schedule: quarterly + autofix_prs: false + submodules: false repos: - repo: https://github.com/pre-commit/pre-commit-hooks diff --git a/experiments/data/prepare_chemrxiv.py b/experiments/data/prepare_chemrxiv.py index 3e161b2c3..5a1735756 100644 --- a/experiments/data/prepare_chemrxiv.py +++ b/experiments/data/prepare_chemrxiv.py @@ -39,5 +39,5 @@ # execute gpt-neox processing gpt_tool_path = f"{args.gptneox_dir}/tools/preprocess_data.py" os.system( - f"python {gpt_tool_path} --input {data_path} --output-prefix {save_path}/data --vocab /fsx/pile/20B_tokenizer.json --dataset-impl mmap --tokenizer-type HFTokenizer --append-eod" + f"python {gpt_tool_path} --input {data_path} --output-prefix {save_path}/data --vocab /fsx/pile/20B_tokenizer.json --dataset-impl mmap --tokenizer-type HFTokenizer --append-eod" # noqa: E501 )