Skip to content

Commit

Permalink
Update fms-hf-tuning e2e test
Browse files Browse the repository at this point in the history
Signed-off-by: ted chang <htchang@us.ibm.com>
  • Loading branch information
tedhtchang committed Apr 9, 2024
1 parent f46d74d commit 1eb5fb1
Show file tree
Hide file tree
Showing 3 changed files with 8 additions and 4 deletions.
4 changes: 4 additions & 0 deletions test/e2e/config.json
Original file line number Diff line number Diff line change
@@ -1,4 +1,8 @@
{
+"accelerate_launch_args": {
+"num_processes": 2,
+"cpu": true
+},
"model_name_or_path": "bigscience/bloom-560m",
"training_data_path": "/etc/config/twitter_complaints_small.json",
"output_dir": "/tmp/out",
Expand Down
6 changes: 3 additions & 3 deletions test/e2e/kfto_kueue_sft_test.go
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
-//go:build ignore
+//go:build tuning_e2e

/*
Copyright 2023.
Expand Down Expand Up @@ -94,9 +94,9 @@ func TestPytorchjobWithSFTtrainer(t *testing.T) {
Containers: []corev1.Container{
{
Name: "pytorch",
-Image: "quay.io/tedchang/sft-trainer:dev",
+Image: "quay.io/modh/fms-hf-tuning:5d8789723ec58ac1bc9c2df704395f162fed974a",
ImagePullPolicy: corev1.PullIfNotPresent,
-Command: []string{"python", "/app/launch_training.py"},
+Command: []string{"python", "/app/accelerate_launch.py"},
Env: []corev1.EnvVar{
{
Name: "SFT_TRAINER_CONFIG_JSON_PATH",
Expand Down
2 changes: 1 addition & 1 deletion test/e2e/setup.sh
Original file line number Diff line number Diff line change
Expand Up @@ -19,4 +19,4 @@ docker build -t ${KFTO_IMG} -f ${BASE_DIR}/build/images/training-operator/Docker

echo "Load training operator image into cluster"
kind load --name training-operator-cluster docker-image training-operator:dev
-KFTO_IMG=training-operator:dev make deploy
+IMG=training-operator:dev make deploy

0 comments on commit 1eb5fb1

Please sign in to comment.