upfirdn2d.py

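# upfirdn2d: upsample by integer factors, apply a 2D FIR filter, then
# downsample, with padding applied between the upsampling and filtering steps.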
import os

import torch
from torch.nn import functional as F
from torch.autograd import Function
from torch.utils.cpp_extension import load


module_path = os.path.dirname(__file__)
upfirdn2d_op = load(
    'upfirdn2d',
    sources=[
        os.path.join(module_path, 'upfirdn2d.cpp'),
        os.path.join(module_path, 'upfirdn2d_kernel.cu'),
    ],
)
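# The classes below wrap the compiled op for autograd. The backward pass is
# itself an upfirdn2d call: it uses the spatially flipped kernel, swaps the
# up and down factors, and pads with g_pad so the gradient comes back at the
# original input resolution.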
class UpFirDn2dBackward(Function):
    @staticmethod
    def forward(
        ctx, grad_output, kernel, grad_kernel, up, down, pad, g_pad, in_size, out_size
    ):
        up_x, up_y = up
        down_x, down_y = down
        g_pad_x0, g_pad_x1, g_pad_y0, g_pad_y1 = g_pad

        grad_output = grad_output.reshape(-1, out_size[0], out_size[1], 1)

        # Gradient of upfirdn2d is upfirdn2d with the flipped kernel,
        # up/down swapped, and the gradient padding g_pad.
        grad_input = upfirdn2d_op.upfirdn2d(
            grad_output,
            grad_kernel,
            down_x,
            down_y,
            up_x,
            up_y,
            g_pad_x0,
            g_pad_x1,
            g_pad_y0,
            g_pad_y1,
        )
        grad_input = grad_input.view(in_size[0], in_size[1], in_size[2], in_size[3])

        ctx.save_for_backward(kernel)

        pad_x0, pad_x1, pad_y0, pad_y1 = pad

        ctx.up_x = up_x
        ctx.up_y = up_y
        ctx.down_x = down_x
        ctx.down_y = down_y
        ctx.pad_x0 = pad_x0
        ctx.pad_x1 = pad_x1
        ctx.pad_y0 = pad_y0
        ctx.pad_y1 = pad_y1
        ctx.in_size = in_size
        ctx.out_size = out_size

        return grad_input

    @staticmethod
    def backward(ctx, gradgrad_input):
        kernel, = ctx.saved_tensors

        gradgrad_input = gradgrad_input.reshape(-1, ctx.in_size[2], ctx.in_size[3], 1)

        # Double backward: re-apply the forward op with the original kernel.
        gradgrad_out = upfirdn2d_op.upfirdn2d(
            gradgrad_input,
            kernel,
            ctx.up_x,
            ctx.up_y,
            ctx.down_x,
            ctx.down_y,
            ctx.pad_x0,
            ctx.pad_x1,
            ctx.pad_y0,
            ctx.pad_y1,
        )
        # gradgrad_out = gradgrad_out.view(ctx.in_size[0], ctx.out_size[0], ctx.out_size[1], ctx.in_size[3])
        gradgrad_out = gradgrad_out.view(
            ctx.in_size[0], ctx.in_size[1], ctx.out_size[0], ctx.out_size[1]
        )

        return gradgrad_out, None, None, None, None, None, None, None, None
class UpFirDn2d(Function):
    @staticmethod
    def forward(ctx, input, kernel, up, down, pad):
        up_x, up_y = up
        down_x, down_y = down
        pad_x0, pad_x1, pad_y0, pad_y1 = pad

        kernel_h, kernel_w = kernel.shape
        batch, channel, in_h, in_w = input.shape
        ctx.in_size = input.shape

        # The compiled op works on (N, H, W, minor) blocks; fold channels into
        # the batch dimension and treat each channel as a single-minor image.
        input = input.reshape(-1, in_h, in_w, 1)

        ctx.save_for_backward(kernel, torch.flip(kernel, [0, 1]))

        # Output size after upsampling, padding, filtering, and downsampling.
        out_h = (in_h * up_y + pad_y0 + pad_y1 - kernel_h) // down_y + 1
        out_w = (in_w * up_x + pad_x0 + pad_x1 - kernel_w) // down_x + 1
        ctx.out_size = (out_h, out_w)

        ctx.up = (up_x, up_y)
        ctx.down = (down_x, down_y)
        ctx.pad = (pad_x0, pad_x1, pad_y0, pad_y1)

        # Padding for the gradient pass (the transposed operation).
        g_pad_x0 = kernel_w - pad_x0 - 1
        g_pad_y0 = kernel_h - pad_y0 - 1
        g_pad_x1 = in_w * up_x - out_w * down_x + pad_x0 - up_x + 1
        g_pad_y1 = in_h * up_y - out_h * down_y + pad_y0 - up_y + 1

        ctx.g_pad = (g_pad_x0, g_pad_x1, g_pad_y0, g_pad_y1)

        out = upfirdn2d_op.upfirdn2d(
            input, kernel, up_x, up_y, down_x, down_y, pad_x0, pad_x1, pad_y0, pad_y1
        )
        # out = out.view(major, out_h, out_w, minor)
        out = out.view(-1, channel, out_h, out_w)

        return out

    @staticmethod
    def backward(ctx, grad_output):
        kernel, grad_kernel = ctx.saved_tensors

        grad_input = UpFirDn2dBackward.apply(
            grad_output,
            kernel,
            grad_kernel,
            ctx.up,
            ctx.down,
            ctx.pad,
            ctx.g_pad,
            ctx.in_size,
            ctx.out_size,
        )

        return grad_input, None, None, None, None
def upfirdn2d(input, kernel, up=1, down=1, pad=(0, 0)):
    out = UpFirDn2d.apply(
        input, kernel, (up, up), (down, down), (pad[0], pad[1], pad[0], pad[1])
    )

    return out
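# A minimal usage sketch (not part of the original module): upsample a batch
# of images by 2 with a normalized binomial blur kernel. The shapes, kernel
# values, and pad choice below are illustrative assumptions only.
#
#     k = torch.tensor([1., 3., 3., 1.])
#     k = torch.outer(k, k)
#     k = k / k.sum()
#     x = torch.randn(4, 3, 64, 64, device='cuda')
#     y = upfirdn2d(x, k.to(x), up=2, down=1, pad=(2, 1))
#     # y.shape == (4, 3, 128, 128): (64 * 2 + 2 + 1 - 4) // 1 + 1 = 128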
def upfirdn2d_native(
    input, kernel, up_x, up_y, down_x, down_y, pad_x0, pad_x1, pad_y0, pad_y1
):
    _, in_h, in_w, minor = input.shape
    kernel_h, kernel_w = kernel.shape

    # Upsample: insert up - 1 zeros after each sample along each spatial axis.
    out = input.view(-1, in_h, 1, in_w, 1, minor)
    out = F.pad(out, [0, 0, 0, up_x - 1, 0, 0, 0, up_y - 1])
    out = out.view(-1, in_h * up_y, in_w * up_x, minor)

    # Pad (or crop, when the padding is negative) the upsampled image.
    out = F.pad(
        out, [0, 0, max(pad_x0, 0), max(pad_x1, 0), max(pad_y0, 0), max(pad_y1, 0)]
    )
    out = out[
        :,
        max(-pad_y0, 0) : out.shape[1] - max(-pad_y1, 0),
        max(-pad_x0, 0) : out.shape[2] - max(-pad_x1, 0),
        :,
    ]

    # Filter: F.conv2d is a cross-correlation, so flip the kernel to get a
    # true convolution with the original FIR kernel.
    out = out.permute(0, 3, 1, 2)
    out = out.reshape(
        [-1, 1, in_h * up_y + pad_y0 + pad_y1, in_w * up_x + pad_x0 + pad_x1]
    )
    w = torch.flip(kernel, [0, 1]).view(1, 1, kernel_h, kernel_w)
    out = F.conv2d(out, w)
    out = out.reshape(
        -1,
        minor,
        in_h * up_y + pad_y0 + pad_y1 - kernel_h + 1,
        in_w * up_x + pad_x0 + pad_x1 - kernel_w + 1,
    )
    out = out.permute(0, 2, 3, 1)

    # Downsample by striding.
    return out[:, ::down_y, ::down_x, :]
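# A rough CPU sketch of the native path (illustrative only; note the
# (batch, height, width, minor) layout this helper expects, unlike the NCHW
# layout taken by the public upfirdn2d wrapper):
#
#     x = torch.randn(4, 32, 32, 1)
#     k = torch.ones(3, 3) / 9.0          # 3x3 box blur
#     y = upfirdn2d_native(x, k, 1, 1, 1, 1, 1, 1, 1, 1)
#     # y.shape == (4, 32, 32, 1): padding of 1 keeps the size for a 3x3 kernel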