循环神经网络RNN、RNNCell、GRUCell

# Python source; imports needed by the snippets below.
import random
from collections import deque

import matplotlib.pyplot as plt
import numpy as np
import torch
from torch import nn
###################### Using RNNCell ####################################

# nn.RNNCell is constructed here with:
#   input_size  - the number of expected features in the input x
#   hidden_size - the number of features in the hidden state h
#
# Its forward pass handles one time step at a time, ht = rnncell(xt, ht_1),
# so the walk over the sequence is written out by hand below.
x = torch.randn(10, 1, 100)
rnn_cell = nn.RNNCell(input_size=100, hidden_size=30)
ht = torch.zeros(1, 30)  # initial hidden state, width equals hidden_size
out = []
for step in range(x.size(0)):
    # Feed the slice for this step together with the previous hidden state.
    ht = rnn_cell(x[step], ht)
    out.append(ht)
print('输出总时间步:', len(out),',每个时间步输出的形状:',out[0].shape)


##################### Using LSTM #########################
# Multi-layer example: an LSTM with four stacked layers.
rnn = nn.LSTM(100, 20, num_layers=4)
print(rnn)
x = torch.randn(10, 3, 100)
# The module returns the per-step outputs plus a (hidden, cell) state pair.
out, state = rnn(x)
h, c = state
print(out.shape, h.shape, c.shape)
# Printed shapes:
# torch.Size([10, 3, 20]) torch.Size([4, 3, 20]) torch.Size([4, 3, 20])

# Indexing demo: select entries 0 and 1 along the first dimension with an
# index list, then swap the first two dimensions of the selection.
x = torch.rand(3, 3, 4)
rows = [0, 1]  # named `rows` so the builtin `id` is not shadowed
c = x[rows].transpose(0, 1)  # (2, 3, 4) -> (3, 2, 4)
print(x)
print(c)
print(c.shape)
# Example: sine-wave prediction.

# Layer sizes read by the Net model defined below: input feature count,
# LSTM hidden width, and output feature count.
input_size, hidden_size, output_size = 1, 256, 1
class Net(nn.Module):
    """Two-layer LSTM followed by a linear read-out.

    Layer sizes are taken from the module-level ``input_size``,
    ``hidden_size`` and ``output_size`` values when an instance is built.
    """

    def __init__(self):
        super().__init__()
        self.rnn = nn.LSTM(input_size, hidden_size, num_layers=2)
        self.linear = nn.Linear(in_features=hidden_size, out_features=output_size)

    def forward(self, x):
        """Project the last layer's final hidden state through ``linear``.

        ``x`` is handed to ``nn.LSTM`` unchanged; the per-step outputs and the
        cell state are discarded. For the sequence-first batched input used in
        this file, ``(seq_len, batch, input_size)``, the result has shape
        ``(batch, output_size)``.
        """
        _, (final_hidden, _) = self.rnn(x)
        top_layer = final_hidden[-1]  # hidden state of the topmost LSTM layer
        return self.linear(top_layer)


# Training objects: the network, a mean-squared-error loss, and an Adam
# optimizer over every parameter of the network.
model = Net()
criterion = nn.MSELoss()
optimizer = torch.optim.Adam(params=model.parameters(), lr=1e-3)


# Training series: num_time_steps evenly spaced samples of sin(t) over
# [start, start + 20].
num_time_steps = 200
start = 0  # fixed left edge of the sampled interval
time_steps = np.linspace(start, start + 20, num_time_steps)
data = np.sin(time_steps)  # already 1-D with length num_time_steps

horizon_len = 10  # length of the time-series window used for each estimate


# Train for 500 steps on randomly drawn windows of the series.
batch_size = 32

# Convert the series to float32 once instead of on every iteration.
series = torch.as_tensor(data, dtype=torch.float32)
window_offsets = torch.arange(horizon_len)

for step in range(500):
    # Draw batch_size distinct window start indices. The upper bound keeps
    # start + horizon_len (the target index) inside the series.
    starts = torch.tensor(
        random.sample(range(num_time_steps - horizon_len - 1), batch_size)
    )

    # Inputs: gather every window as (batch_size, horizon_len), then lay it
    # out as (horizon_len, batch_size, 1) for the LSTM.
    train_data_x = series[starts.unsqueeze(1) + window_offsets].T.unsqueeze(2)
    # Targets: the sample right after each window, shaped (batch_size, 1) to
    # match the model output exactly so MSELoss never has to broadcast.
    train_data_y = series[starts + horizon_len].reshape(batch_size, 1)

    output = model(train_data_x)
    loss = criterion(output, train_data_y)

    optimizer.zero_grad()
    loss.backward()
    optimizer.step()

    if step % 50 == 0:
        print("Iteration: {} loss {}".format(step, loss.item()))


# Rebuild the reference sine series that the rollout is compared against.
num_time_steps = 200
start = 0
time_steps = np.linspace(start, start + 20, num=num_time_steps)
data = np.sin(time_steps)

rollout_factor = 5  # predict out to five times the length of the series

# Seed the sliding window with the first horizon_len true samples; maxlen
# makes every append drop the oldest value automatically.
window = deque(data[0:horizon_len], maxlen=horizon_len)
predictions1 = []
predictions1.extend(data[0:horizon_len])

# Autoregressive rollout: each prediction is fed back in as the newest input.
# No gradients are needed here, so autograd tracking is switched off.
with torch.no_grad():
    for _ in range(horizon_len, len(data) * rollout_factor):
        input_tensor = torch.tensor(np.asarray(window), dtype=torch.float32)
        input_tensor = input_tensor.view(horizon_len, 1, 1)
        next_value = model(input_tensor).item()
        window.append(next_value)
        predictions1.append(next_value)

# Plot the true series against the seeded window plus the model's rollout.
plt.figure()
plt.plot(data)
plt.plot(predictions1)
plt.legend(['sin wave','pred1'])
plt.show()
相关推荐
江上鹤.1486 分钟前
Day 50 CBAM 注意力机制
人工智能·深度学习
人工智能培训13 分钟前
深度学习—卷积神经网络(1)
人工智能·深度学习·神经网络·机器学习·cnn·知识图谱·dnn
CoovallyAIHub1 小时前
纯视觉的终结?顶会趋势:不会联觉(多模态)的CV不是好AI
深度学习·算法·计算机视觉
懷淰メ1 小时前
python3GUI--基于深度学习的人脸识别管理系统(详细图文介绍)
人工智能·深度学习·人脸识别·pyqt·人脸·识别系统·人脸管理
CoovallyAIHub1 小时前
一文读懂大语言模型家族:LLM、MLLM、LMM、VLM核心概念全解析
深度学习·算法·计算机视觉
Keep_Trying_Go2 小时前
文生图算法C4Synth: Cross-Caption Cycle-Consistent Text-to-Image Synthesis详解
人工智能·pytorch·深度学习·计算机视觉·文生图
智算菩萨2 小时前
【Python机器学习】交叉验证与超参数调优:自动化寻优之旅
人工智能·深度学习·机器学习
汤姆yu2 小时前
基于深度学习的交通标志识别系统
人工智能·深度学习
Small___ming3 小时前
【人工智能基础】深度学习归一化层完全指南:从入门到精通
人工智能·深度学习·归一化
亚里随笔4 小时前
激活被遗忘的训练信号:ERPO框架如何让大模型在数学推理中更进一步
深度学习·llm·rl·agentic·grpo