From 31dd3aebb4172b3d9ee0c0785c926c2641d0db24 Mon Sep 17 00:00:00 2001 From: PingqiLi Date: Mon, 4 Mar 2024 10:18:24 +0800 Subject: [PATCH 1/2] fix: add warmup to the training config of squeezenet_1.0 to make the training stable. --- configs/squeezenet/README.md | 12 ++++++------ configs/squeezenet/squeezenet_1.0_ascend.yaml | 2 +- mindcv/models/squeezenet.py | 2 +- 3 files changed, 8 insertions(+), 8 deletions(-) diff --git a/configs/squeezenet/README.md b/configs/squeezenet/README.md index e29bdd45c..2717f1709 100644 --- a/configs/squeezenet/README.md +++ b/configs/squeezenet/README.md @@ -25,12 +25,12 @@ Our reproduced model performance on ImageNet-1K is reported as follows.
-| Model | Context | Top-1 (%) | Top-5 (%) | Params (M) | Recipe | Download | -|---------------|---------|-----------|-----------|------------|---------------------------------------------------------------------------------------------------------|---------------------------------------------------------------------------------------------| -| squeezenet1_0 | D910x8-G | 59.01 | 81.01 | 1.25 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.0_ascend.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0-e2d78c4a.ckpt) | -| squeezenet1_0 | GPUx8-G | 58.83 | 81.08 | 1.25 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.0_gpu.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0_gpu-685f5941.ckpt) | -| squeezenet1_1 | D910x8-G | 58.44 | 80.84 | 1.24 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.1_ascend.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_1-da256d3a.ckpt) | -| squeezenet1_1 | GPUx8-G | 59.18 | 81.41 | 1.24 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.1_gpu.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_1_gpu-0e33234a.ckpt) | +| Model | Context | Top-1 (%) | Top-5 (%) | Params (M) | Recipe | Download | +|---------------|---------|-----------|-----------|------------|---------------------------------------------------------------------------------------------------------|--------------------------------------------------------------------------------------------------------| +| squeezenet1_0 | D910x8-G | 58.67 | 80.61 | 1.25 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.0_ascend.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0-eb911778.ckpt) | +| squeezenet1_0 | GPUx8-G | 58.83 | 81.08 | 1.25 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.0_gpu.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0_gpu-685f5941.ckpt) | +| squeezenet1_1 | D910x8-G | 58.44 | 80.84 | 1.24 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.1_ascend.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_1-da256d3a.ckpt) | +| squeezenet1_1 | GPUx8-G | 59.18 | 81.41 | 1.24 | [yaml](https://github.com/mindspore-lab/mindcv/blob/main/configs/squeezenet/squeezenet_1.1_gpu.yaml) | [weights](https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_1_gpu-0e33234a.ckpt) |
diff --git a/configs/squeezenet/squeezenet_1.0_ascend.yaml b/configs/squeezenet/squeezenet_1.0_ascend.yaml index cb2df5061..aed5d70b5 100644 --- a/configs/squeezenet/squeezenet_1.0_ascend.yaml +++ b/configs/squeezenet/squeezenet_1.0_ascend.yaml @@ -40,7 +40,7 @@ label_smoothing: 0.1 scheduler: 'warmup_cosine_decay' min_lr: 0.0 lr: 0.1 -warmup_epochs: 0 +warmup_epochs: 5 decay_epochs: 200 # optimizer diff --git a/mindcv/models/squeezenet.py b/mindcv/models/squeezenet.py index 48fc3d113..b70a21644 100644 --- a/mindcv/models/squeezenet.py +++ b/mindcv/models/squeezenet.py @@ -29,7 +29,7 @@ def _cfg(url="", **kwargs): default_cfgs = { - "squeezenet1_0": _cfg(url="https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0-e2d78c4a.ckpt"), + "squeezenet1_0": _cfg(url="https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_0-eb911778.ckpt"), "squeezenet1_1": _cfg(url="https://download.mindspore.cn/toolkits/mindcv/squeezenet/squeezenet1_1-da256d3a.ckpt"), } From e2c38b901366feeff4fe255a3be70cbab796e834 Mon Sep 17 00:00:00 2001 From: PingqiLi Date: Mon, 18 Mar 2024 17:34:06 +0800 Subject: [PATCH 2/2] fix the config of squeezenet_1.0 to avoid overflow --- configs/squeezenet/squeezenet_1.0_ascend.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/configs/squeezenet/squeezenet_1.0_ascend.yaml b/configs/squeezenet/squeezenet_1.0_ascend.yaml index aed5d70b5..79c06bbdb 100644 --- a/configs/squeezenet/squeezenet_1.0_ascend.yaml +++ b/configs/squeezenet/squeezenet_1.0_ascend.yaml @@ -30,7 +30,7 @@ keep_checkpoint_max: 10 ckpt_save_dir: './ckpt' epoch_size: 200 dataset_sink_mode: True -amp_level: 'O2' +amp_level: 'O0' # loss loss: 'CE'