How to make the equivalent of a TensorFlow Sequential model in PyTorch?

Question

I have a simple shallow model in TensorFlow for multiclass classification.

    model = tf.keras.models.Sequential([
        tf.keras.layers.Dense(64, input_shape=(384,), activation="relu"),
        tf.keras.layers.Dense(36, activation="softmax", use_bias=False)
    ])
    model.summary()

    Model: "sequential_5"
    _________________________________________________________________
     Layer (type)                Output Shape              Param #
    =================================================================
     dense_13 (Dense)            (None, 64)                24640
     dense_14 (Dense)            (None, 36)                2304

I want to replicate it in PyTorch, applying softmax in the forward function.

    # base model - it works but gives v low accuracy. need to add more layers.
    class LR(torch.nn.Module):
        def __init__(self, n_features):
            super(LR, self).__init__()
            self.lr = torch.nn.Linear(n_features, 36)
            nn.ReLU()

        def forward(self, x):
            out = torch.softmax(self.lr(x), dim=1, dtype=None)
            return out

    # parameters
    n_features = 384
    n_classes = 36

    optim = torch.optim.SGD(model.parameters(), lr=0.1)
    criterion = torch.nn.CrossEntropyLoss()
    accuracy_fn = Accuracy(task="multiclass", num_classes=36)

I have tried modifying my base model like so, but it gives me an error later on.

    class LR(torch.nn.Module):
        def __init__(self, n_features):
            super(LR, self).__init__()
            self.lr = torch.nn.Linear(n_features, 64)
            self.lr = nn.ReLU()
            self.lr = torch.nn.Linear(64, 36)

        def forward(self, x):
            out = torch.softmax(self.lr(x), dim=1, dtype=None)
            return out

    epochs = 15

    def train(model, optim, criterion, x, y, epochs=epochs):
        for e in range(1, epochs + 1):
            optim.zero_grad()
            out = model(x)
            loss = criterion(out, y)
            loss.backward()
            optim.step()
            print(f"Loss at epoch {e}: {loss.data}")
        return model

    model = LR(n_features)
    model = train(model, optim, criterion, X_train, y_train)

    ---------------------------------------------------------------------------
    RuntimeError                              Traceback (most recent call last)
    Cell In[175], line 18
         12 # acc = accuracy_fn(out, y)
         13 # acc.backward()
         14 # optim.step()
         15 # print(f"Acc at epoch {e}: {acc.data}")
         16 return model
    ---> 18 model = train(model, optim, criterion, X_train, y_train)

    Cell In[175], line 6, in train(model, optim, criterion, x, y, epochs)
          4 for e in range(1, epochs + 1):
          5     optim.zero_grad()
    ----> 6     out = model(x)
          7     loss = criterion(out, y)
          8     loss.backward()

    File /usr/local/lib/python3.10/site-packages/torch/nn/modules/module.py:1501, in Module._call_impl(self, *args, **kwargs)
       1496 # If we don't have any hooks, we want to skip the rest of the logic in
       1497 # this function, and just call forward.
       1498 if not (self._backward_hooks or self._backward_pre_hooks or self._forward_hooks or self._forward_pre_hooks
       1499         or _global_backward_pre_hooks or _global_backward_hooks
       1500         or _global_forward_hooks or _global_forward_pre_hooks):
    -> 1501     return forward_call(*args, **kwargs)
       1502 # Do not call functions when jit is used
       1503 full_backward_hooks, non_full_backward_hooks = [], []

    Cell In[172], line 10, in LR.forward(self, x)
          9 def forward(self, x):
    ---> 10     out = torch.softmax(self.lr(x), dim=1, dtype=None)
         11     return out

    File /usr/local/lib/python3.10/site-packages/torch/nn/modules/module.py:1501, in Module._call_impl(self, *args, **kwargs)
       1496 # If we don't have any hooks, we want to skip the rest of the logic in
       1497 # this function, and just call forward.
       1498 if not (self._backward_hooks or self._backward_pre_hooks or self._forward_hooks or self._forward_pre_hooks
       1499         or _global_backward_pre_hooks or _global_backward_hooks
       1500         or _global_forward_hooks or _global_forward_pre_hooks):
    -> 1501     return forward_call(*args, **kwargs)
       1502 # Do not call functions when jit is used
       1503 full_backward_hooks, non_full_backward_hooks = [], []

    File /usr/local/lib/python3.10/site-packages/torch/nn/modules/linear.py:114, in Linear.forward(self, input)
        113 def forward(self, input: Tensor) -> Tensor:
    --> 114     return F.linear(input, self.weight, self.bias)

    RuntimeError: mat1 and mat2 shapes cannot be multiplied (155648x384 and 64x36)

My data shapes are:

    X_train.shape
    torch.Size([155648, 384])
    y_train.shape
    torch.Size([155648])

Can someone give me a hand with my LR class and train function?

Answer 1

Score: 2

In your Torch model, you have overwritten the self.lr attribute twice.

    class LR(torch.nn.Module):
        def __init__(self, n_features):
            super(LR, self).__init__()
            self.lr = torch.nn.Linear(n_features, 64)
            self.lr = nn.ReLU()                # lr is overwritten here
            self.lr = torch.nn.Linear(64, 36)  # and here

So you end up with a model that is just this:

    class LR(torch.nn.Module):
        def __init__(self, n_features):
            super(LR, self).__init__()
            self.lr = torch.nn.Linear(64, 36)
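
You can see this directly (a quick sketch, not part of the original answer; `m` is just an illustrative name) by instantiating the question's LR class and inspecting it. Each assignment to self.lr de-registers the previous submodule, so only the final Linear layer remains:

    # Instantiate the LR class from the question; only the last self.lr assignment survives.
    m = LR(384)
    print(m.lr)                       # Linear(in_features=64, out_features=36, bias=True)
    print(len(list(m.parameters())))  # 2 -- just that layer's weight and bias tensors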

If you want the equivalent of the Keras model, you can use:

    from torch import nn

    model = nn.Sequential(
        nn.Linear(384, 64),
        nn.ReLU(),
        nn.Linear(64, 36, bias=False),
        nn.Softmax(dim=1)  # dim=1: softmax over the class dimension
    )
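
As a quick sanity check (a sketch added here, assuming the layer sizes above), the parameter counts of this PyTorch model line up with the Keras summary in the question:

    # Linear(384, 64) has 384*64 + 64 = 24640 parameters, and
    # Linear(64, 36, bias=False) has 64*36 = 2304, matching the Keras summary.
    for name, p in model.named_parameters():
        print(name, tuple(p.shape), p.numel())
    print("total:", sum(p.numel() for p in model.parameters()))  # 26944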

If you want to build a class for your model, you can use:

    import torch.nn as nn

    class Model(nn.Module):
        def __init__(self):
            super().__init__()
            self.L1 = nn.Linear(384, 64)  # no trailing comma here, or L1 becomes a tuple
            self.RLU = nn.ReLU()
            self.L2 = nn.Linear(64, 36, bias=False)

        def forward(self, x):
            x = self.L1(x)
            x = self.RLU(x)
            x = self.L2(x)
            return x

I left off the softmax because CrossEntropyLoss applies a log-softmax on its own. If you are making predictions, you can apply a softmax separately.
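
For example, a minimal training/prediction sketch under that setup (assuming the X_train and y_train tensors from the question; the epoch count and learning rate are taken from the question's code) might look like this:

    import torch
    import torch.nn as nn

    model = Model()
    optim = torch.optim.SGD(model.parameters(), lr=0.1)
    criterion = nn.CrossEntropyLoss()  # expects raw logits plus integer class labels

    for e in range(1, 16):
        optim.zero_grad()
        logits = model(X_train)            # no softmax inside the model
        loss = criterion(logits, y_train)  # log-softmax happens inside the loss
        loss.backward()
        optim.step()

    # Only at prediction time, convert logits to probabilities explicitly.
    with torch.no_grad():
        probs = torch.softmax(model(X_train), dim=1)
        preds = probs.argmax(dim=1)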

Answer 2

Score: 2

Using Sequential, you could do the following:

    class LR(torch.nn.Module):
        def __init__(self, n_features):
            super(LR, self).__init__()
            self.lr = torch.nn.Sequential(
                torch.nn.Linear(n_features, 64),
                torch.nn.ReLU(),
                torch.nn.Linear(64, 36, bias=False),
                torch.nn.Softmax(dim=1),
            )

        def forward(self, x):
            return self.lr(x)

This could be used with, e.g.,

    x = torch.ones(1, 1000)
    lr = LR(x.shape[1])
    lr(x)
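
With the dimensions from the question (a sketch; torch.randn stands in for the real X_train), the output comes out as one row of 36 class probabilities per sample:

    # Hypothetical shape check using the question's n_features=384 and 155648 samples.
    x = torch.randn(155648, 384)
    model = LR(384)
    out = model(x)
    print(out.shape)  # torch.Size([155648, 36])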
