Adding ShuffleNet model #258

Open · wants to merge 17 commits into master · Changes from 2 commits
160 changes: 160 additions & 0 deletions src/convnets/shufflenet.jl
@@ -0,0 +1,160 @@
using Flux

"""
ChannelShuffle(x, g)

Channel shuffle operation from 'ShuffleNet: An Extremely Efficient Convolutional Neural Network for Mobile Devices'
([reference](https://arxiv.org/abs/1707.01083)).

# Arguments

- `x`: 4D input array (width, height, channels, batch)
- `g`: number of groups
"""
function ChannelShuffle(x::Array{Float32, 4}, g::Int)
Member:

Suggested change
function ChannelShuffle(x::Array{Float32, 4}, g::Int)
function channel_shuffle(x::AbstractArray{Float32, 4}, g::Int)

This type constraint is too restrictive. If ChannelShuffle works for all number types then it should reflect that. Generally all utility functions in Metalhead need to be GPU-compatible too. The renaming is a suggestion for how to make this function more "Julian": since it's not a callable type (which would be PascalCase) but a plain function. Lastly, how does this handle 3D inputs?

Author:

I didn't think about it when writing the function; for 3D inputs (a batch of grey images) it would be necessary to artificially create a channel dimension.

width, height, channels, batch = size(x)
channels_per_group = channels÷g
if (channels % g) == 0
Member:

Suggested change
if (channels % g) == 0
if channels % g == 0

We have a JuliaFormatter config in this repo, so make sure to run that before pushing your code.

Author:

Applied.

x = reshape(x, (width, height, g, channels_per_group, batch))
x = permutedims(x,(1,2,4,3,5))
x = reshape(x, (width, height, channels, batch))
end
return x
end
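The generic, snake_case variant proposed in the review can be sketched in isolation (a minimal sketch assuming only Base; the `channel_shuffle` name follows the suggestion, and the early divisibility error is an assumption, since the original silently returns the input unshuffled):

```julia
# Element-type agnostic via AbstractArray, mirroring the original's
# reshape -> permutedims -> reshape, but failing loudly when the channel
# count is not divisible by the number of groups.
function channel_shuffle(x::AbstractArray{T, 4}, g::Int) where {T}
    width, height, channels, batch = size(x)
    channels % g == 0 || error("channels ($channels) must be divisible by groups ($g)")
    x = reshape(x, width, height, g, channels ÷ g, batch)
    x = permutedims(x, (1, 2, 4, 3, 5))
    return reshape(x, width, height, channels, batch)
end
```

With four channels and two groups, channels (1, 2, 3, 4) come out as (1, 3, 2, 4): channels from the two groups are interleaved, which is exactly the mixing the ShuffleNet paper relies on between group convolutions.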

"""
ShuffleUnit(in_channels::Integer, out_channels::Integer, groups::Integer, downsample::Bool, ignore_group::Bool)

Shuffle Unit from 'ShuffleNet: An Extremely Efficient Convolutional Neural Network for Mobile Devices'
([reference](https://arxiv.org/abs/1707.01083)).

# Arguments

- `in_channels`: number of input channels
- `out_channels`: number of output channels
- `groups`: number of groups
- `downsample`: apply downsampling if true
- `ignore_group`: ignore group convolution if true
"""
function ShuffleUnit(in_channels::Integer, out_channels::Integer, groups::Integer, downsample::Bool, ignore_group::Bool)
mid_channels = out_channels ÷ 4
groups = ignore_group ? 1 : groups
strd = downsample ? 2 : 1

if downsample
out_channels -= in_channels
end

m = Chain(Conv((1,1), in_channels => mid_channels; groups,pad=SamePad()),
BatchNorm(mid_channels),
NNlib.relu,
Member:

Suggested change
BatchNorm(mid_channels),
NNlib.relu,
BatchNorm(mid_channels, relu),

relu is already in scope because of using NNlib, and fusing it into the preceding norm is slightly more efficient. Also, is the activation function not configurable for ShuffleNet?

Author:

Changed.

x -> ChannelShuffle(x, groups),
Member:

Suggested change
x -> ChannelShuffle(x, groups),
Base.Fix2(channel_shuffle, groups),

Will be easier on the compiler.

Author:

Changed.

DepthwiseConv((3,3), mid_channels => mid_channels; bias=false, stride=strd, pad=SamePad()),
BatchNorm(mid_channels),
NNlib.relu,
Conv((1,1), mid_channels => out_channels; groups, pad=SamePad()),
BatchNorm(out_channels),
NNlib.relu)

if downsample
m = Parallel((mx, x) -> cat(mx, x, dims=3),m, MeanPool((3,3); pad=SamePad(), stride=2))
Member:

Suggested change
m = Parallel((mx, x) -> cat(mx, x, dims=3),m, MeanPool((3,3); pad=SamePad(), stride=2))
m = Parallel(cat_channels, m, MeanPool((3,3); pad=SamePad(), stride=2))

We have cat_channels for this exact case.

Author:

Changed.

else
m = SkipConnection(m, +)
end
return m
end
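The `Base.Fix2` suggestion in the review thread can be seen on its own: `Base.Fix2(f, y)` is a named, concretely typed callable equivalent to `x -> f(x, y)`, so every `ShuffleUnit` construction reuses one struct type instead of minting a fresh anonymous-closure type each time, which is easier on the compiler. A small stand-alone illustration:

```julia
# Base.Fix2(f, y) behaves like x -> f(x, y), but its type depends only on
# f and y's types, so identical partial applications share a concrete type.
shift_by_3 = Base.Fix2(+, 3)   # acts like x -> x + 3
shift_by_3(39)                  # 42

# Two Fix2 values built the same way have the same type; two syntactically
# identical anonymous closures each get their own type.
typeof(Base.Fix2(+, 3)) == typeof(Base.Fix2(+, 3))   # true
```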

"""
ShuffleNet(channels, init_block_channels::Integer, groups, num_classes; in_channels=3)

ShuffleNet model from 'ShuffleNet: An Extremely Efficient Convolutional Neural Network for Mobile Devices'
([reference](https://arxiv.org/abs/1707.01083)).

# Arguments

- `channels`: list of channels per layer
- `init_block_channels`: number of output channels from the first layer
- `groups`: number of groups
- `num_classes`: number of classes
- `in_channels`: number of input channels
"""
function ShuffleNet(channels, init_block_channels::Integer, groups, num_classes; in_channels=3)
features = []

append!(features, [Conv((3,3), in_channels => init_block_channels; stride=2, pad=SamePad()),
BatchNorm(init_block_channels),
NNlib.relu,
MaxPool((3,3); stride=2, pad=SamePad())])

in_channels::Integer = init_block_channels

for (i, num_channels) in enumerate(channels)
stage = []
for (j, out_channels) in enumerate(num_channels)
downsample = j==1
ignore_group = i==1 && j==1
out_ch::Integer = trunc(out_channels)
push!(stage, ShuffleUnit(in_channels, out_ch, groups, downsample, ignore_group))
in_channels = out_ch
end
append!(features, stage)
end

model = Chain(features...)

return Chain(model, GlobalMeanPool(), Flux.flatten, Dense(in_channels => num_classes))
Member:

Suggested change
return Chain(model, GlobalMeanPool(), Flux.flatten, Dense(in_channels => num_classes))
return Chain(model, GlobalMeanPool(), MLUtils.flatten, Dense(in_channels => num_classes))

The general modus operandi of this library has been to create named types for the top-level model and wrap the underlying Chain with them. You can see this pattern in the files for any of the other exported models.

As for the suggestion: flatten is only imported into Flux, not defined there. It's preferable to use a symbol from the library that actually defines it when that library is available (which MLUtils is, being a dep of Metalhead).

Author:

Could I see an example? Sorry, I'm still a newbie with Julia. I looked at the rest of the convnets and tried to code in a similar style, but there are still things I haven't fully understood.

end
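The wrapper pattern the reviewer refers to might look roughly like this (an illustrative sketch, not Metalhead's actual definition; the `ShuffleNetModel` name and `layers` field are hypothetical):

```julia
# A named top-level type wrapping the underlying Chain, as the other exported
# Metalhead convnets do. Names here are illustrative only.
struct ShuffleNetModel{T}
    layers::T
end

# Calling the model simply delegates to the wrapped Chain.
(m::ShuffleNetModel)(x) = m.layers(x)

# In Metalhead this would additionally need `Flux.@functor ShuffleNetModel`
# so parameter collection and GPU movement can see through the wrapper.
```

The payoff of the named type is dispatch and pretty-printing: methods like `backbone(m)` or `classifier(m)` can be defined per model, which a bare `Chain` does not allow.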

"""
shufflenet(groups, width_scale, num_classes; in_channels=3)

Wrapper for ShuffleNet. Create a ShuffleNet model from 'ShuffleNet: An Extremely Efficient Convolutional Neural Network for Mobile Devices'
([reference](https://arxiv.org/abs/1707.01083)).

# Arguments

- `groups`: number of groups
- `width_scale`: scaling factor for number of channels
- `num_classes`: number of classes
- `in_channels`: number of input channels
"""
function shufflenet(groups, width_scale, num_classes; in_channels=3)
init_block_channels = 24
layers = [4, 8, 4]

if groups == 1
channels_per_layers = [144, 288, 576]
elseif groups == 2
channels_per_layers = [200, 400, 800]
elseif groups == 3
channels_per_layers = [240, 480, 960]
elseif groups == 4
channels_per_layers = [272, 544, 1088]
elseif groups == 8
channels_per_layers = [384, 768, 1536]
else
return error("The number of groups is not supported. Groups = ", groups)
end

channels = []
for i in eachindex(layers)
char = [channels_per_layers[i]]
new = repeat(char, layers[i])
push!(channels, new)
end

if width_scale != 1.0
channels = channels*width_scale

init_block_channels::Integer = trunc(init_block_channels * width_scale)
end

net = ShuffleNet(
    channels,
    init_block_channels,
    groups,
    num_classes;
    in_channels)

return net
end
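To make the channel bookkeeping above concrete, this is the `channels` list the loop builds for `groups = 3` (the same logic as the loop, rewritten as a comprehension for illustration):

```julia
# For groups = 3: each stage repeats its per-layer channel count layers[i]
# times, giving 4 + 8 + 4 = 16 ShuffleUnits in total.
channels_per_layers = [240, 480, 960]
layers = [4, 8, 4]
channels = [repeat([channels_per_layers[i]], layers[i]) for i in eachindex(layers)]
```

Each inner vector feeds one stage of `ShuffleNet`, where the first unit of every stage downsamples and the first unit of the first stage additionally skips group convolution.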