Skip to content

Commit

Permalink
fixes
Browse files: browse the repository at this point in the history
  • Loading branch information
deepanker13 committed Dec 20, 2023
1 parent f5572d8 commit db1ebce
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 7 deletions.
7 changes: 2 additions & 5 deletions sdk/python/kubeflow/trainer/hf_dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,9 @@ FROM pytorch/pytorch:2.0.1-cuda11.7-cudnn8-runtime
# Copy the Python package and its source code into the container
COPY . /app

# Copy the requirements.txt file into the container
COPY requirements.txt /app/requirements.txt

# Install any needed packages specified in requirements.txt
RUN pip install --no-cache-dir -r requirements.txt
RUN pip install --no-cache-dir -r /app/requirements.txt

# Run hf_llm_training.py when the container launches
ENTRYPOINT ["python", "hf_llm_training.py"]
ENTRYPOINT ["python", "/app/hf_llm_training.py"]

4 changes: 2 additions & 2 deletions sdk/python/kubeflow/trainer/hf_llm_training.py
Original file line number Diff line number Diff line change
Expand Up @@ -81,7 +81,7 @@ def parse_arguments():
parser.add_argument("--token_dir", help="directory containing tokenizer")
parser.add_argument("--dataset_dir", help="directory contaning dataset")
parser.add_argument("--peft_config", help="peft_config")
parser.add_argument("--train_params", help="hugging face training parameters")
parser.add_argument("--train_parameters", help="hugging face training parameters")

return parser.parse_args()

Expand All @@ -91,4 +91,4 @@ def parse_arguments():
model, tokenizer = setup_model_and_tokenizer(args.token_dir, args.model_dir)
train_data, eval_data = load_and_preprocess_data(args.dataset_dir, tokenizer)
model = setup_peft_model(model, args.peft_config)
train_model(model, train_data, eval_data, tokenizer, args)
train_model(model, train_data, eval_data, tokenizer, args.train_parameters)

0 comments on commit db1ebce

Please sign in to comment.