Torch截断一部分后是否能梯度回传

复制代码
import torch

from torch import optim 
import torch.nn as nn
 
 
class g(nn.Module):
    def __init__(self):
        super(g, self).__init__()
        self.k = nn.Conv2d(in_channels=2, out_channels=1, kernel_size=1, padding=0, bias=False)
 
    def forward(self, z):
        return self.k(z)

 
 
c = 2
h = 5
w = 5
z = torch.rand( (1,c , h , w)).float().view(1, c, h, w)*100
z.requires_grad = True
k = g()

optim = optim.Adam(k.parameters(), lr=1)
optim.zero_grad()
r = k(z)
r= r[:,:,:3,:3]
r = r.sum()
loss = (r - 1) * (r - 1)

for name,v in k.named_parameters():
    print(name,v) 
print(z)
print("*********************")
 
loss.backward()
optim.step()
for name,v in k.named_parameters():
    print(name,v) 
print(z)

输出:

tensor(\[\[\[-0.0464],

\[ 0.4256]]], requires_grad=True)

tensor(\[\[\[65.6508, 65.0099, 38.5205, 78.4769, 31.6377,

27.1530, 5.7923, 23.9614, 59.5419, 3.5597,

69.9373, 29.7657, 91.4004, 85.5130, 65.2210,

62.6357, 23.9004, 95.3394, 59.5155, 48.1762,

98.7728, 97.2193, 66.3625, 65.0421, 22.0612],

\[19.3582, 2.4226, 47.2068, 20.1124, 31.9324,

23.4966, 5.0654, 12.4682, 35.3092, 90.3394,

8.4709, 91.5994, 79.7592, 93.8652, 92.6337,

49.0805, 63.9460, 81.2459, 63.4729, 77.1670,

17.8333, 18.6162, 44.9271, 44.8790, 3.6609]]], requires_grad=True)

*********************

k.weight Parameter containing:

tensor(\[\[\[-1.0464],

\[-0.5744]]], requires_grad=True)

tensor(\[\[\[65.6508, 65.0099, 38.5205, 78.4769, 31.6377,

27.1530, 5.7923, 23.9614, 59.5419, 3.5597,

69.9373, 29.7657, 91.4004, 85.5130, 65.2210,

62.6357, 23.9004, 95.3394, 59.5155, 48.1762,

98.7728, 97.2193, 66.3625, 65.0421, 22.0612],

\[19.3582, 2.4226, 47.2068, 20.1124, 31.9324,

23.4966, 5.0654, 12.4682, 35.3092, 90.3394,

8.4709, 91.5994, 79.7592, 93.8652, 92.6337,

49.0805, 63.9460, 81.2459, 63.4729, 77.1670,

17.8333, 18.6162, 44.9271, 44.8790, 3.6609]]], requires_grad=True)

相关推荐
biter down1 小时前
从 0 到 1 搭建 Python 接口自动化测试框架(博客系统实战)
开发语言·python
肖永威2 小时前
Python多业务并行计算框架插件化演进:从硬编码到动态注册
python·插件化·并行计算·动态注册
yz_aiks2 小时前
Linux Jar包配置Systemd自启动实战:从排查到配置全流程
linux·python·jar·自启动·systemd
不知名的老吴3 小时前
线程的生命周期之线程“插队“
java·开发语言·python
xsc6996754 小时前
从零搭建大模型与智能体平台 - 完整技术详解
python
无风听海5 小时前
多租户系统中的 OIDC:Discovery 端点与联合登录的深度实践
后端·python·flask
CTA终结者6 小时前
期货量化主力换月程序怎么移仓:天勤 underlying_symbol 与任务切换
python·区块链
马士兵教育6 小时前
Java还有前景吗?Java+AI大模型学习路线及项目?
java·人工智能·python·学习·机器学习
KaMeidebaby6 小时前
卡梅德生物技术快报|纯化重组蛋白实操详解
人工智能·python·tcp/ip·算法·机器学习
Cloud_Shy6186 小时前
解读《Effective Python 3rd Edition》:从练气到老魔(第五章 Item 30 - 32)
开发语言·人工智能·笔记·python·学习方法