Skip to content

Commit

Permalink
fix(ci): roberta fixes for single card. fixes for img2text
Browse files Browse the repository at this point in the history
  • Loading branch information
imangohari1 committed Aug 7, 2024
1 parent b3384cc commit 66959b1
Show file tree
Hide file tree
Showing 5 changed files with 13 additions and 13 deletions.
4 changes: 2 additions & 2 deletions tests/baselines/gpt2_xl.json
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,7 @@
"deepspeed": {
"learning_rate": 4e-4,
"train_batch_size": 16,
- "perplexity": 13.0461,
+ "perplexity": 13.23775,
"train_runtime": 190.696,
"train_samples_per_second": 89.877,
"extra_arguments": [
Expand All @@ -40,4 +40,4 @@
}
}
}
- }
+ }
4 changes: 2 additions & 2 deletions tests/baselines/gpt_neox_20b.json
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,7 @@
"deepspeed": {
"learning_rate": 5e-5,
"train_batch_size": 2,
- "perplexity": 8.0545,
+ "perplexity": 8.166753,
"train_runtime": 721.5428,
"train_samples_per_second": 7.571,
"extra_arguments": [
Expand All @@ -20,4 +20,4 @@
}
}
}
- }
+ }
6 changes: 3 additions & 3 deletions tests/baselines/roberta_base.json
Original file line number Diff line number Diff line change
Expand Up @@ -56,8 +56,8 @@
"learning_rate": 7e-5,
"train_batch_size": 64,
"eval_f1": 91.5253,
- "train_runtime": 105.6042,
- "train_samples_per_second": 907.395,
+ "train_runtime": 120.6563,
+ "train_samples_per_second": 847.504,
"extra_arguments": [
"--max_seq_length 384",
"--use_hpu_graphs_for_inference"
Expand Down Expand Up @@ -95,4 +95,4 @@
}
}
}
- }
+ }
6 changes: 3 additions & 3 deletions tests/baselines/roberta_large.json
Original file line number Diff line number Diff line change
Expand Up @@ -56,8 +56,8 @@
"learning_rate": 3e-5,
"train_batch_size": 32,
"eval_f1": 94.5886,
- "train_runtime": 342.1653,
- "train_samples_per_second": 284.873,
+ "train_runtime": 361.4789,
+ "train_samples_per_second": 266.47,
"extra_arguments": [
"--max_seq_length 384",
"--use_hpu_graphs_for_inference"
Expand Down Expand Up @@ -95,4 +95,4 @@
}
}
}
- }
+ }
6 changes: 3 additions & 3 deletions tests/test_image_to_text_example.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,14 +15,14 @@
MODELS_TO_TEST = {
"bf16": [
("llava-hf/llava-1.5-7b-hf", 1, 87.2901500056982),
- ("llava-hf/llava-1.5-13b-hf", 1, 54.41252589197953),
+ ("llava-hf/llava-1.5-13b-hf", 1, 51.04717105443364),
("llava-hf/llava-v1.6-mistral-7b-hf", 1, 33.17984878151546),
("llava-hf/llava-v1.6-vicuna-7b-hf", 1, 35.00608681379742),
("llava-hf/llava-v1.6-vicuna-13b-hf", 1, 23.527610042925),
],
"fp8": [
- ("llava-hf/llava-1.5-7b-hf", 1, 123.00953973789325),
- ("llava-hf/llava-1.5-13b-hf", 1, 82.81132373492122),
+ ("llava-hf/llava-1.5-7b-hf", 1, 115.48515989461843),
+ ("llava-hf/llava-1.5-13b-hf", 1, 78.2635142547838),
("llava-hf/llava-v1.6-mistral-7b-hf", 1, 45.011551008367084),
("llava-hf/llava-v1.6-vicuna-7b-hf", 1, 45.18544502949674),
("llava-hf/llava-v1.6-vicuna-13b-hf", 1, 30.9535718774675),
Expand Down

0 comments on commit 66959b1

Please sign in to comment.