generated from dlibml/dlib-template-project
-
Notifications
You must be signed in to change notification settings - Fork 1
/
repvgg.h
82 lines (68 loc) · 4.65 KB
/
repvgg.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
#ifndef RepVGG_H
#define RepVGG_H
#include <dlib/dnn.h>
namespace repvgg
{
// clang-format off
using namespace dlib;
// ACT can be any activation layer.
// a_n, a_d: a multiplier numerator and denominator, respectively.
// b_n, b_d: b multiplier numerator and denominator, respectively.
template <template <typename> class ACT, long a_n, long a_d, long b_n, long b_d>
struct def
{
static const long filters_0 = std::min<long>(64, 64 * a_n / a_d);
static const long filters_1 = 64 * a_n / a_d;
static const long filters_2 = 128 * a_n / a_d;
static const long filters_3 = 256 * a_n / a_d;
static const long filters_4 = 512 * b_n / b_d;
// padded convolution
template <long num_filters, long ks, int s, typename SUBNET>
using pcon = add_layer<con_<num_filters, ks, ks, s, s, ks/2, ks/2>, SUBNET>;
// batch norm + padded convolution
template <long num_filters, long ks, int s, typename SUBNET>
using bcon = bn_con<pcon<num_filters, ks, s, SUBNET>>;
// RepVGG block: 3x3 & 1x1 convolutions
template <long num_filters, int s, typename SUBNET>
using repvggblock = add_prev2<bcon<num_filters, 1, s, skip1<tag2<bcon<num_filters, 3, s, tag1<SUBNET>>>>>>;
// RepVGG block + identity (with batch norm): tag1 is the input of the RepVGG block defined above
template <long num_filters, typename SUBNET>
using repvggblock_id = add_prev3<bn_con<skip1<tag3<repvggblock<num_filters, 1, SUBNET>>>>>;
template <typename SUBNET> using repvggblock_id_1 = ACT<repvggblock_id<filters_1, SUBNET>>;
template <typename SUBNET> using repvggblock_id_2 = ACT<repvggblock_id<filters_2, SUBNET>>;
template <typename SUBNET> using repvggblock_id_3 = ACT<repvggblock_id<filters_3, SUBNET>>;
template <typename SUBNET> using iblock_1 = ACT<pcon<filters_1, 3, 1, SUBNET>>;
template <typename SUBNET> using iblock_2 = ACT<pcon<filters_2, 3, 1, SUBNET>>;
template <typename SUBNET> using iblock_3 = ACT<pcon<filters_3, 3, 1, SUBNET>>;
template <size_t nb_3, size_t nb_2, size_t nb_1, typename INPUT>
using tbackbone = ACT<repvggblock<filters_4, 2,
repeat<nb_3, repvggblock_id_3, ACT<repvggblock<filters_3, 2,
repeat<nb_2, repvggblock_id_2, ACT<repvggblock<filters_2, 2,
repeat<nb_1, repvggblock_id_1, ACT<repvggblock<filters_1, 2,
ACT<repvggblock<filters_0, 2, INPUT>>>>>>>>>>>>>;
template <size_t nb_3, size_t nb_2, size_t nb_1, typename INPUT>
using ibackbone = ACT<pcon<filters_4, 3, 2,
repeat<nb_3, iblock_3, ACT<pcon<filters_3, 3, 2,
repeat<nb_2, iblock_2, ACT<pcon<filters_2, 3, 2,
repeat<nb_1, iblock_1, ACT<pcon<filters_1, 3, 2,
ACT<pcon<filters_0, 3, 2, INPUT>>>>>>>>>>>>>;
};
template <long num_filters, typename SUBNET>
using classification_head = loss_multiclass_log<fc<num_filters, avg_pool_everything<SUBNET>>>;
using train_a0 = classification_head<1000, def<relu, 3, 4, 5, 2>::tbackbone<13, 3, 1, input_rgb_image>>;
using infer_a0 = classification_head<1000, def<relu, 3, 4, 5, 2>::ibackbone<13, 3, 1, input_rgb_image>>;
using train_a1 = classification_head<1000, def<relu, 1, 1, 5, 2>::tbackbone<13, 3, 1, input_rgb_image>>;
using infer_a1 = classification_head<1000, def<relu, 1, 1, 5, 2>::ibackbone<13, 3, 1, input_rgb_image>>;
using train_a2 = classification_head<1000, def<relu, 3, 2, 11, 4>::tbackbone<13, 3, 1, input_rgb_image>>;
using infer_a2 = classification_head<1000, def<relu, 3, 2, 11, 4>::ibackbone<13, 3, 1, input_rgb_image>>;
using train_b0 = classification_head<1000, def<relu, 1, 1, 5, 2>::tbackbone<15, 5, 3, input_rgb_image>>;
using infer_b0 = classification_head<1000, def<relu, 1, 1, 5, 2>::ibackbone<15, 5, 3, input_rgb_image>>;
using train_b1 = classification_head<1000, def<relu, 2, 1, 4, 1>::tbackbone<15, 5, 3, input_rgb_image>>;
using infer_b1 = classification_head<1000, def<relu, 2, 1, 4, 1>::ibackbone<15, 5, 3, input_rgb_image>>;
using train_b2 = classification_head<1000, def<relu, 5, 2, 5, 1>::tbackbone<15, 5, 3, input_rgb_image>>;
using infer_b2 = classification_head<1000, def<relu, 5, 2, 5, 1>::ibackbone<15, 5, 3, input_rgb_image>>;
using train_b3 = classification_head<1000, def<relu, 5, 2, 5, 1>::tbackbone<15, 5, 3, input_rgb_image>>;
using infer_b3 = classification_head<1000, def<relu, 3, 1, 5, 1>::ibackbone<15, 5, 3, input_rgb_image>>;
// clang-format on
} // namespace repvgg
#endif // RepVGG_H