Skip to content

Latest commit

 

History

History
118 lines (114 loc) · 4.09 KB

README.md

File metadata and controls

118 lines (114 loc) · 4.09 KB

VOVNet

This is a reasonably clean implementation of a classifier using VOVNet (https://arxiv.org/abs/1904.09730). It is a very simple architecture that nevertheless produces very good accuracy, and it is especially useful for object detection applications.

The following ImageNet checkpoints are included:

Higher accuracies should be possible; this was one of the very first attempts to train these models. Training was done with SGD, EMA, and label-smoothed cross-entropy (smooth CE).

Detailed parameters:

def _nesterov_sgd_kwargs():
    """Return a fresh copy of the SGD settings shared by every model below."""
    return {"momentum": 0.9, "weight_decay": 2e-5, "nesterov": True}


def _cosine_schedule_kwargs(peak_lr):
    """Return a fresh copy of the cosine-schedule settings.

    Only ``peak_lr`` differs between models; every other value is the same
    for all five configurations.
    """
    return {
        "num_cycles": 1,
        "peak_lr": peak_lr,
        "min_lr": 1e-7,
        "total_lr_decay": 0.1,
        "initial_warmup_step_fraction": 0.0,
        "cycle_warmup_step_fraction": 0.1,
    }


# Training hyper-parameters, keyed by model name.
# Across models only batch_size, epochs and peak_lr change.
CONFIGS = {
    "vovnet19": {
        "dropout": 0.2,
        "batch_size": 512,
        "loss": "smooth_ce",
        "loss_kwargs": {"smoothing": 0.1},
        "epochs": 50,
        "optimizer": "sgd",
        "optimizer_kwargs": _nesterov_sgd_kwargs(),
        "scheduler": "cosine",
        "scheduler_kwargs": _cosine_schedule_kwargs(peak_lr=3.0),
        "trainer_kwargs": {"use_ema": True},
    },
    "vovnet27_slim": {
        "dropout": 0.2,
        "batch_size": 400,
        "loss": "smooth_ce",
        "loss_kwargs": {"smoothing": 0.1},
        "epochs": 100,
        "optimizer": "sgd",
        "optimizer_kwargs": _nesterov_sgd_kwargs(),
        "scheduler": "cosine",
        "scheduler_kwargs": _cosine_schedule_kwargs(peak_lr=2.0),
        "trainer_kwargs": {"use_ema": True},
    },
    "vovnet39": {
        "dropout": 0.2,
        "batch_size": 300,
        "loss": "smooth_ce",
        "loss_kwargs": {"smoothing": 0.1},
        "epochs": 100,
        "optimizer": "sgd",
        "optimizer_kwargs": _nesterov_sgd_kwargs(),
        "scheduler": "cosine",
        "scheduler_kwargs": _cosine_schedule_kwargs(peak_lr=2.0),
        "trainer_kwargs": {"use_ema": True},
    },
    "vovnet57": {
        "dropout": 0.2,
        "batch_size": 256,
        "epochs": 100,
        "loss": "smooth_ce",
        "loss_kwargs": {"smoothing": 0.1},
        "optimizer": "sgd",
        "optimizer_kwargs": _nesterov_sgd_kwargs(),
        "scheduler": "cosine",
        "scheduler_kwargs": _cosine_schedule_kwargs(peak_lr=2.0),
        "trainer_kwargs": {"use_ema": True},
    },
    "vovnet99": {
        "dropout": 0.2,
        "batch_size": 160,
        "epochs": 100,
        "loss": "smooth_ce",
        "loss_kwargs": {"smoothing": 0.1},
        "optimizer": "sgd",
        "optimizer_kwargs": _nesterov_sgd_kwargs(),
        "scheduler": "cosine",
        "scheduler_kwargs": _cosine_schedule_kwargs(peak_lr=0.8),
        "trainer_kwargs": {"use_ema": True},
    },
}

After each of these runs, I recommend a second run, also with EMA, at roughly 1/50th of the peak learning rate (`peak_lr`), to take up the remaining slack on accuracy.