PyTorch:对网络输出做切片(只截取一部分)后,梯度是否仍能回传

代码:
import torch

from torch import optim 
import torch.nn as nn
 
 
class g(nn.Module):
    """Minimal module wrapping one bias-free 1x1 convolution (2 -> 1 channels)."""

    def __init__(self):
        super().__init__()
        # 1x1 kernel, no padding, no bias: the only learnable parameters are
        # the two per-channel weights stored in ``k.weight``.
        self.k = nn.Conv2d(2, 1, kernel_size=1, padding=0, bias=False)

    def forward(self, z):
        """Run ``z`` through the convolution and return the result."""
        out = self.k(z)
        return out

 
 
# Demo: does the gradient still flow back to the convolution weights when only
# a slice of the network output contributes to the loss?
c = 2
h = 5
w = 5

# Random input scaled by 100. The tensor is created directly with the target
# shape and dtype, so no extra .float()/.view() round-trip is needed.
z = torch.rand((1, c, h, w), dtype=torch.float32) * 100
z.requires_grad_(True)
k = g()

# Named `optimizer` so the imported `optim` module is not overwritten.
optimizer = optim.Adam(k.parameters(), lr=1)
optimizer.zero_grad()

r = k(z)
r = r[:, :, :3, :3]  # keep only the top-left 3x3 patch of the output
r = r.sum()
loss = (r - 1) * (r - 1)

# Parameters and input before the update.
for name, v in k.named_parameters():
    print(name, v)
print(z)
print("*********************")

loss.backward()
optimizer.step()

# Parameters and input after the update. A changed weight shows that the
# gradient passed back through the slice. `z` was never handed to the
# optimizer, so the step itself does not modify it.
for name, v in k.named_parameters():
    print(name, v)
print(z)

输出:

k.weight Parameter containing:
tensor([[[[-0.0464]],

         [[ 0.4256]]]], requires_grad=True)
tensor([[[[65.6508, 65.0099, 38.5205, 78.4769, 31.6377],
          [27.1530,  5.7923, 23.9614, 59.5419,  3.5597],
          [69.9373, 29.7657, 91.4004, 85.5130, 65.2210],
          [62.6357, 23.9004, 95.3394, 59.5155, 48.1762],
          [98.7728, 97.2193, 66.3625, 65.0421, 22.0612]],

         [[19.3582,  2.4226, 47.2068, 20.1124, 31.9324],
          [23.4966,  5.0654, 12.4682, 35.3092, 90.3394],
          [ 8.4709, 91.5994, 79.7592, 93.8652, 92.6337],
          [49.0805, 63.9460, 81.2459, 63.4729, 77.1670],
          [17.8333, 18.6162, 44.9271, 44.8790,  3.6609]]]], requires_grad=True)
*********************
k.weight Parameter containing:
tensor([[[[-1.0464]],

         [[-0.5744]]]], requires_grad=True)
tensor([[[[65.6508, 65.0099, 38.5205, 78.4769, 31.6377],
          [27.1530,  5.7923, 23.9614, 59.5419,  3.5597],
          [69.9373, 29.7657, 91.4004, 85.5130, 65.2210],
          [62.6357, 23.9004, 95.3394, 59.5155, 48.1762],
          [98.7728, 97.2193, 66.3625, 65.0421, 22.0612]],

         [[19.3582,  2.4226, 47.2068, 20.1124, 31.9324],
          [23.4966,  5.0654, 12.4682, 35.3092, 90.3394],
          [ 8.4709, 91.5994, 79.7592, 93.8652, 92.6337],
          [49.0805, 63.9460, 81.2459, 63.4729, 77.1670],
          [17.8333, 18.6162, 44.9271, 44.8790,  3.6609]]]], requires_grad=True)

相关推荐
renhongxia110 分钟前
大模型微调RAG、LORA、强化学习
人工智能·深度学习·算法·语言模型
dundunmm22 分钟前
【论文阅读】SIMBA: single-cell embedding along with features(1)
论文阅读·深度学习·神经网络·embedding·生物信息·单细胞·多组学
BYSJMG31 分钟前
计算机大数据毕业设计推荐:基于Spark的气候疾病传播可视化分析系统【Hadoop、python、spark】
大数据·hadoop·python·信息可视化·spark·django·课程设计
抠头专注python环境配置2 小时前
OCR库pytesseract安装保姆级教程
python·ocr·conda
山烛2 小时前
矿物分类系统开发笔记(二):模型训练[删除空缺行]
人工智能·笔记·python·机器学习·分类·数据挖掘
大得3692 小时前
django生成迁移文件,执行生成到数据库
后端·python·django
大志说编程2 小时前
LangChain框架入门17: 手把手教你创建LLM工具
python·langchain·ai编程
R-G-B3 小时前
【P38 6】OpenCV Python——图片的运算(算术运算、逻辑运算)加法add、subtract减法、乘法multiply、除法divide
人工智能·python·opencv·图片的运算·图片加法add·图片subtract减法·图片乘法multiply
数据智能老司机3 小时前
MCP 实战——全局视角:为什么 MCP 将成为 AI 的颠覆者
python·llm·mcp
在星空下3 小时前
Fastapi-Vue3-Admin
前端·python·fastapi