当前位置：首页 > news >正文

轻量级关键点 blaze pose 2025

news 2025/6/10 5:24:06

BlazePose-Lite(1.7M Params)

BlazePose-Full(3.4M Params)

网络代码和预训练模型：

BlazePose-Lite(1.7M Params)

Arch	AP	Ap .5	AP .75	AP (M)	AP (L)	AR	AR .5	AR .75	AR (M)	AR (L)
BlazePose	0.623	0.883	0.714	0.616	0.684	0.679	0.898	0.748	0.648	0.726

BlazePose-Full(3.4M Params)

Arch	AP	Ap .5	AP .75	AP (M)	AP (L)	AR	AR .5	AR .75	AR (M)	AR (L)
BlazePose-Full	0.653	0.894	0.725	0.625	0.697	0.690	0.906	0.754	0.654	0.743

网络代码和预训练模型：

GitHub - jacke121/BlazePose_torch: pytorch implement of google blazePose

GitHub - WangChyanhassth-2say/BlazePose_torch: pytorch implement of google blazePose

提供了预训练，full模型7.09M，lite 6.8M

推理速度9ms

# ------------------------------------------------------------------------------
# BlazePose:
# Written by me(460717505@qq.com)
# ------------------------------------------------------------------------------
# ------------------------------------------------------------------------------
# The SimDR and SA-SimDR part:
# Written by Yanjie Li (lyj20@mails.tsinghua.edu.cn)
# ------------------------------------------------------------------------------
import timeimport torch
import torch.nn as nn
import torch.nn.functional as F
from einops import rearrange, repeatclass h_sigmoid(nn.Module):def __init__(self):super(h_sigmoid, self).__init__()def forward(self, x):return F.relu6(x + 3.) / 6.class h_swish(nn.Module):def __init__(self, inplace=True):super(h_swish, self).__init__()self.sigmoid = h_sigmoid()def forward(self, x):return x * self.sigmoid(x)class SwishLinear(nn.Module):def __init__(self, inp, oup):super(SwishLinear, self).__init__()self.linear = nn.Sequential(nn.Linear(inp, oup),nn.BatchNorm1d(oup),)def forward(self, x):return self.linear(x)class Reshape(nn.Module):def __init__(self, *args):super(Reshape, self).__init__()self.shape = argsdef forward(self, x):return x.view((x.size(0),)+self.shape)class SEModule(nn.Module):def __init__(self, channel, reduction=4):super(SEModule, self).__init__()self.avg_pool = nn.AdaptiveAvgPool2d(1)self.fc = nn.Sequential(nn.Linear(channel, channel // reduction, bias=False),nn.ReLU(inplace=True),nn.Linear(channel // reduction, channel, bias=False),h_sigmoid()# nn.Sigmoid())def forward(self, x):b, c, _, _ = x.size()y = self.avg_pool(x).view(b, c)y = self.fc(y).view(b, c, 1, 1)return x * y.expand_as(x)class Identity(nn.Module):def __init__(self, channel):super(Identity, self).__init__()def forward(self, x):return xclass BlazeBlock(nn.Module):def __init__(self, in_channels, out_channels, stride=1, kernel_size=3):super(BlazeBlock, self).__init__()self.use_pooling = stride == 2self.channel_pad = out_channels - in_channelsif self.use_pooling:self.pool = nn.MaxPool2d(kernel_size=2, stride=2)padding = 0else:padding = 1self.depth_conv = nn.Conv2d(in_channels, in_channels, kernel_size=kernel_size, stride=stride,padding=padding, groups=in_channels)self.pointwise_conv = nn.Conv2d(in_channels, out_channels, kernel_size=1, stride=1, padding=0)self.relu = nn.ReLU6(inplace=True)def forward(self, x):if self.use_pooling:conv_input = F.pad(x, [0, 1, 0, 1], "constant", 0)x = self.pool(x)else:conv_input = xconv_out = self.depth_conv(conv_input)conv_out = self.pointwise_conv(conv_out)if self.channel_pad > 0:x = F.pad(x, [0, 0, 0, 0, 0, self.channel_pad], "constant", 0)return self.relu(conv_out + x)class MobileBottleneck(nn.Module):def __init__(self, inp, oup, kernel, stride, exp, se=False, nl='RE'):super(MobileBottleneck, self).__init__()assert stride in [1, 2]assert kernel in [3, 5]padding = (kernel - 1) // 2self.use_res_connect = stride == 1 and inp == oupconv_layer = nn.Conv2dnorm_layer = nn.BatchNorm2dif nl == 'RE':nlin_layer = nn.ReLU6 # or ReLUelif nl == 'HS':nlin_layer = h_swishelse:raise NotImplementedErrorif se:SELayer = SEModuleelse:SELayer = Identityself.conv = nn.Sequential(# pwconv_layer(inp, exp, 1, 1, 0, bias=False),norm_layer(exp),nlin_layer(inplace=True),# dwconv_layer(exp, exp, kernel, stride, padding, groups=exp, bias=False),norm_layer(exp),SELayer(exp),nlin_layer(inplace=True),# pw-linearconv_layer(exp, oup, 1, 1, 0, bias=False),norm_layer(oup),)def forward(self, x):if self.use_res_connect:return x + self.conv(x)else:return self.conv(x)class BlazePose(nn.Module):def __init__(self, num_keypoints: int):super(BlazePose, self).__init__()self.num_keypoints = num_keypoints# stem layersself.conv1 = nn.Sequential(nn.Conv2d(3, 16, 3, 2, 1, bias=False),nn.BatchNorm2d(16),h_swish())# MobileBottleneck: input:(inp, oup, k, s, exp, se, li)self.conv2_b1 = MobileBottleneck(16, 16, 3, 1, 72, False, 'RE')self.conv3_b1 = MobileBottleneck(32, 32, 5, 1, 120, True, 'RE')self.conv4_b1 = MobileBottleneck(64, 64, 3, 1, 200, False, 'HS')self.conv4_b2 = MobileBottleneck(64, 64, 3, 1, 184, False, 'HS')self.conv5_b1 = MobileBottleneck(128, 128, 3, 1, 480, True, 'HS')self.conv5_b2 = MobileBottleneck(128, 128, 3, 1, 672, True, 'HS')self.conv6_b1 = MobileBottleneck(192, 192, 5, 1, 960, True, 'HS')self.conv12_a1 = MobileBottleneck(32, 32, 5, 1, 120, True, 'RE')self.conv13_a1 = MobileBottleneck(64, 64, 3, 1, 200, False, 'HS')self.conv13_a2 = MobileBottleneck(64, 64, 3, 1, 184, False, 'HS')self.conv14_a1 = MobileBottleneck(128, 128, 3, 1, 480, True, 'HS')self.conv14_a2 = MobileBottleneck(128, 128, 3, 1, 672, True, 'HS')self.conv15_a1 = MobileBottleneck(192, 192, 5, 1, 960, True, 'HS')# blaze blocksself.conv2 = BlazeBlock(16, 16, 1)self.conv3 = BlazeBlock(16, 32, 2)self.conv4 = BlazeBlock(32, 64, 2)self.conv5 = BlazeBlock(64, 128, 2)self.conv6 = BlazeBlock(128, 192, 2)self.conv12 = BlazeBlock(32, 64, 2)self.conv13 = BlazeBlock(64, 128, 2)self.conv14 = BlazeBlock(128, 192, 2)self.conv7_ = nn.Sequential(nn.Conv2d(192, 32, 3, 1, 1, bias=False),nn.BatchNorm2d(32),h_swish())self.conv8_ = nn.Sequential(nn.Conv2d(128, 32, 3, 1, 1, bias=False),nn.BatchNorm2d(32),h_swish())self.conv9_ = nn.Sequential(nn.Conv2d(64, 32, 3, 1, 1, bias=False),nn.BatchNorm2d(32),h_swish())# up sample layerself.upsample0 = nn.Upsample(scale_factor=2, mode='bilinear',align_corners=True)self.upsample1 = nn.Upsample(scale_factor=2, mode='bilinear',align_corners=True)self.upsample2 = nn.Upsample(scale_factor=2, mode='bilinear',align_corners=True)# last several layersself.conv15 = nn.Sequential(nn.Conv2d(192, self.num_keypoints, 1, 1, 0, bias=False),nn.Sigmoid())self.mlp_head_x = nn.Linear(64, int(256 * 2))self.mlp_head_y = nn.Linear(64, int(256 * 2))def forward(self, x):# stem layersx = self.conv1(x)x = self.conv2(x)x = self.conv2_b1(x)# blazeblocks and mobilebottlenecks# naming differently for the skip connectiony0 = self.conv3(x)y0 = self.conv3_b1(y0)y1 = self.conv4(y0)y1 = self.conv4_b1(y1)y1 = self.conv4_b2(y1)y2 = self.conv5(y1)y2 = self.conv5_b1(y2)y2 = self.conv5_b2(y2)y3 = self.conv6(y2)y3 = self.conv6_b1(y3)# heatmap branchx3 = self.conv7_(y3)x2 = self.conv8_(y2) + self.upsample2(x3)x1 = self.conv9_(y1) + self.upsample1(x2)x0 = y0 + self.upsample0(x1)# regression branch# simDR style# using .detach() to cut the propagaton to the layers beforex = x0.detach() + y0.detach()x = self.conv12_a1(x)x = self.conv12(x) + y1.detach()x = self.conv13_a1(x)x = self.conv13_a2(x)x = self.conv13(x) + y2.detach()x = self.conv14_a1(x)x = self.conv14_a2(x)x = self.conv14(x) + y3.detach()x = self.conv15_a1(x)x = self.conv15(x)x = rearrange(x, 'b c h w -> b c (h w)')pred_x = self.mlp_head_x(x)pred_y = self.mlp_head_y(x)return (pred_x, pred_y)def _initialize_weights(self):# weight initializationfor m in self.modules():if isinstance(m, nn.Conv2d):nn.init.kaiming_normal_(m.weight, mode='fan_out')if m.bias is not None:nn.init.zeros_(m.bias)elif isinstance(m, nn.BatchNorm2d):nn.init.ones_(m.weight)nn.init.zeros_(m.bias)elif isinstance(m, nn.Linear):nn.init.normal_(m.weight, 0, 0.01)if m.bias is not None:nn.init.zeros_(m.bias)if __name__ == '__main__':# from torchsummaryX import summarymodel = BlazePose(17)model=model.cuda()model.eval()for i in range(10):dummy_input = torch.rand(1, 3, 256, 256).cuda()start = time.time()out=model(dummy_input)print(out[0].shape,time.time()-start)

查看全文

http://www.xdnf.cn/news/945829.html