循环神经网络RNN、RNNCell、GRUCell

python 复制代码
###################### RNNCell的使用 ####################################

#初始化完全一样
# input_size - The number of expected features in the input x
# hidden_size - The number of features in the hidden state h
# num_layers - Number of recurrent layers, default 1

#但是forward是不一样的
#ht = rnncell(xt,ht_1)
x = torch.randn(10, 1, 100)
rnnCell = nn.RNNCell(input_size=100, hidden_size=30)
ht = torch.zeros(1, 30)
out = []
for xt in x:
    ht = rnnCell(xt, ht)
    out.append(ht)
print('输出总时间步:', len(out),',每个时间步输出的形状:',out[0].shape)


#####################lstm使用#########################
# 多层RNN的例子
rnn = nn.LSTM(input_size=100, hidden_size=20, num_layers=4)
print(rnn)
x = torch.randn(10, 3, 100)
out, (h, c) = rnn(x)
print(out.shape, h.shape, c.shape)
#输出
#torch.Size([10, 3, 20]) torch.Size([4, 3, 20]) torch.Size([4, 3, 20])

x = torch.rand(3,3,4)
id = [0,1]
c = x[id].transpose(0,1)
print(x)
print(c)
print(c.shape)
#实例:正弦曲线预测

input_size = 1
hidden_size = 256
output_size = 1
class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.rnn = nn.LSTM(input_size=input_size, hidden_size=hidden_size, num_layers=2)
        self.linear = nn.Linear(hidden_size, output_size)

    def forward(self, x):
        _, (h, c) = self.rnn(x)
        h = h[-1]
        h = self.linear(h)
        return h


model = Net()
criterion = nn.MSELoss()
optimizer = torch.optim.Adam(model.parameters(), lr=0.001)


num_time_steps =200
start = 0 #在0-3之间随机初始化
time_steps = np.linspace(start, start+20, num_time_steps)
data = np.sin(time_steps)
data = data.reshape(num_time_steps)

horizon_len = 10 #用于估计的时间序列长度
list = [1, 2, 3]


for iter in range(500):
    batch_size = 32
    s = random.sample(range(num_time_steps-horizon_len-1), batch_size)
    train_data_x = []
    train_data_y = []
    for s_i in s:
        train_data_x.append(data[s_i:s_i+horizon_len])
        train_data_y.append(data[s_i + horizon_len])
    train_data_x = torch.tensor(train_data_x, dtype=torch.float32).T
    train_data_x = train_data_x.unsqueeze(2).to(torch.float32)
    train_data_y = torch.tensor(train_data_y, dtype=torch.float64).reshape(-1, batch_size, 1).to(torch.float32)


    output = model(train_data_x)

    loss = criterion(output, train_data_y)
    model.zero_grad()
    loss.backward()
    optimizer.step()

    if iter % 50 == 0:
        print("Iteration: {} loss {}".format(iter, loss.item()))


num_time_steps =200
start = 0
time_steps = np.linspace(start, start+20, num=num_time_steps)
data = np.sin(time_steps)

predictions1 = []

h = torch.zeros(1, 1, hidden_size)
c = torch.zeros(1, 1, hidden_size)

input = deque(data[0:horizon_len], maxlen=horizon_len)
predictions1.extend(data[0:horizon_len])
for i in range(horizon_len, len(data)*5):
    input_tensor = torch.tensor(input).to(torch.float32)
    input_tensor = input_tensor.view(horizon_len, 1, 1)
    pred= model(input_tensor)
    input.append(pred.detach().numpy().ravel()[0])
    predictions1.append(pred.detach().numpy().ravel()[0])

plt.figure()
plt.plot(data)
plt.plot(predictions1)
plt.legend(['sin wave','pred1'])
plt.show()
相关推荐
yLDeveloper9 小时前
从模型评估、梯度难题到科学初始化:一步步解析深度学习的训练问题
深度学习
Coder_Boy_9 小时前
技术让开发更轻松的底层矛盾
java·大数据·数据库·人工智能·深度学习
2401_836235869 小时前
中安未来SDK15:以AI之眼,解锁企业档案的数字化基因
人工智能·科技·深度学习·ocr·生活
njsgcs9 小时前
llm使用 AgentScope-Tuner 通过 RL 训练 FrozenLake 智能体
人工智能·深度学习
2的n次方_10 小时前
CANN ascend-transformer-boost 架构解析:融合注意力算子管线、长序列分块策略与图引擎协同机制
深度学习·架构·transformer
人工智能培训10 小时前
具身智能视觉、触觉、力觉、听觉等信息如何实时对齐与融合?
人工智能·深度学习·大模型·transformer·企业数字化转型·具身智能
pp起床12 小时前
Gen_AI 补充内容 Logit Lens 和 Patchscopes
人工智能·深度学习·机器学习
阿杰学AI13 小时前
AI核心知识91——大语言模型之 Transformer 架构(简洁且通俗易懂版)
人工智能·深度学习·ai·语言模型·自然语言处理·aigc·transformer
芷栀夏13 小时前
CANN ops-math:筑牢 AI 神经网络底层的高性能数学运算算子库核心实现
人工智能·深度学习·神经网络
Yeats_Liao16 小时前
评估体系构建:基于自动化指标与人工打分的双重验证
运维·人工智能·深度学习·算法·机器学习·自动化