intracl.py 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121
  1. import paddle
  2. from paddle import nn
  3. # refer from: https://github.com/ViTAE-Transformer/I3CL/blob/736c80237f66d352d488e83b05f3e33c55201317/mmdet/models/detectors/intra_cl_module.py
  4. class IntraCLBlock(nn.Layer):
  5. def __init__(self, in_channels=96, reduce_factor=4):
  6. super(IntraCLBlock, self).__init__()
  7. self.channels = in_channels
  8. self.rf = reduce_factor
  9. weight_attr = paddle.nn.initializer.KaimingUniform()
  10. self.conv1x1_reduce_channel = nn.Conv2D(
  11. self.channels, self.channels // self.rf, kernel_size=1, stride=1, padding=0
  12. )
  13. self.conv1x1_return_channel = nn.Conv2D(
  14. self.channels // self.rf, self.channels, kernel_size=1, stride=1, padding=0
  15. )
  16. self.v_layer_7x1 = nn.Conv2D(
  17. self.channels // self.rf,
  18. self.channels // self.rf,
  19. kernel_size=(7, 1),
  20. stride=(1, 1),
  21. padding=(3, 0),
  22. )
  23. self.v_layer_5x1 = nn.Conv2D(
  24. self.channels // self.rf,
  25. self.channels // self.rf,
  26. kernel_size=(5, 1),
  27. stride=(1, 1),
  28. padding=(2, 0),
  29. )
  30. self.v_layer_3x1 = nn.Conv2D(
  31. self.channels // self.rf,
  32. self.channels // self.rf,
  33. kernel_size=(3, 1),
  34. stride=(1, 1),
  35. padding=(1, 0),
  36. )
  37. self.q_layer_1x7 = nn.Conv2D(
  38. self.channels // self.rf,
  39. self.channels // self.rf,
  40. kernel_size=(1, 7),
  41. stride=(1, 1),
  42. padding=(0, 3),
  43. )
  44. self.q_layer_1x5 = nn.Conv2D(
  45. self.channels // self.rf,
  46. self.channels // self.rf,
  47. kernel_size=(1, 5),
  48. stride=(1, 1),
  49. padding=(0, 2),
  50. )
  51. self.q_layer_1x3 = nn.Conv2D(
  52. self.channels // self.rf,
  53. self.channels // self.rf,
  54. kernel_size=(1, 3),
  55. stride=(1, 1),
  56. padding=(0, 1),
  57. )
  58. # base
  59. self.c_layer_7x7 = nn.Conv2D(
  60. self.channels // self.rf,
  61. self.channels // self.rf,
  62. kernel_size=(7, 7),
  63. stride=(1, 1),
  64. padding=(3, 3),
  65. )
  66. self.c_layer_5x5 = nn.Conv2D(
  67. self.channels // self.rf,
  68. self.channels // self.rf,
  69. kernel_size=(5, 5),
  70. stride=(1, 1),
  71. padding=(2, 2),
  72. )
  73. self.c_layer_3x3 = nn.Conv2D(
  74. self.channels // self.rf,
  75. self.channels // self.rf,
  76. kernel_size=(3, 3),
  77. stride=(1, 1),
  78. padding=(1, 1),
  79. )
  80. self.bn = nn.BatchNorm2D(self.channels)
  81. self.relu = nn.ReLU()
  82. def forward(self, x):
  83. x_new = self.conv1x1_reduce_channel(x)
  84. x_7_c = self.c_layer_7x7(x_new)
  85. x_7_v = self.v_layer_7x1(x_new)
  86. x_7_q = self.q_layer_1x7(x_new)
  87. x_7 = x_7_c + x_7_v + x_7_q
  88. x_5_c = self.c_layer_5x5(x_7)
  89. x_5_v = self.v_layer_5x1(x_7)
  90. x_5_q = self.q_layer_1x5(x_7)
  91. x_5 = x_5_c + x_5_v + x_5_q
  92. x_3_c = self.c_layer_3x3(x_5)
  93. x_3_v = self.v_layer_3x1(x_5)
  94. x_3_q = self.q_layer_1x3(x_5)
  95. x_3 = x_3_c + x_3_v + x_3_q
  96. x_relation = self.conv1x1_return_channel(x_3)
  97. x_relation = self.bn(x_relation)
  98. x_relation = self.relu(x_relation)
  99. return x + x_relation
  100. def build_intraclblock_list(num_block):
  101. IntraCLBlock_list = nn.LayerList()
  102. for i in range(num_block):
  103. IntraCLBlock_list.append(IntraCLBlock())
  104. return IntraCLBlock_list