Skip to content

Commit 1eb5fb1

Browse files
committed
Update fms-hf-tuning e2e test
Signed-off-by: ted chang <[email protected]>
1 parent f46d74d commit 1eb5fb1

File tree

3 files changed: 8 additions and 4 deletions.

test/e2e/config.json

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,8 @@
 {
+"accelerate_launch_args": {
+"num_processes": 2,
+"cpu": true
+},
 "model_name_or_path": "bigscience/bloom-560m",
 "training_data_path": "/etc/config/twitter_complaints_small.json",
 "output_dir": "/tmp/out",

test/e2e/kfto_kueue_sft_test.go

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
-//go:build ignore
+//go:build tuning_e2e

 /*
 Copyright 2023.
@@ -94,9 +94,9 @@ func TestPytorchjobWithSFTtrainer(t *testing.T) {
 Containers: []corev1.Container{
 {
 Name: "pytorch",
-Image: "quay.io/tedchang/sft-trainer:dev",
+Image: "quay.io/modh/fms-hf-tuning:5d8789723ec58ac1bc9c2df704395f162fed974a",
 ImagePullPolicy: corev1.PullIfNotPresent,
-Command: []string{"python", "/app/launch_training.py"},
+Command: []string{"python", "/app/accelerate_launch.py"},
 Env: []corev1.EnvVar{
 {
 Name: "SFT_TRAINER_CONFIG_JSON_PATH",

test/e2e/setup.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -19,4 +19,4 @@ docker build -t ${KFTO_IMG} -f ${BASE_DIR}/build/images/training-operator/Docker

 echo "Load training operator image into cluster"
 kind load --name training-operator-cluster docker-image training-operator:dev
-KFTO_IMG=training-operator:dev make deploy
+IMG=training-operator:dev make deploy

0 commit comments

Comments
 (0)