Mu Li's Dive into Deep Learning, Part 11: Deep Learning Computation
The code is as follows, one script per section of the chapter:
# Layers and blocks
import torch
from torch import nn
from torch.nn import functional as F

# Custom block
class MLP(nn.Module):
    def __init__(self):
        super().__init__()
        self.hidden = nn.Linear(20, 256)
        self.out = nn.Linear(256, 10)

    def forward(self, X):
        return self.out(F.relu(self.hidden(X)))

# Custom sequential block
class MySequential(nn.Module):
    def __init__(self, *args):
        super().__init__()
        for i, module in enumerate(args):
            # Registering in _modules lets PyTorch discover the submodules' parameters
            self._modules[str(i)] = module

    def forward(self, X):
        for block in self._modules.values():
            X = block(X)
        return X

# Executing code in the forward pass
class FixedHiddenMLP(nn.Module):
    def __init__(self):
        super().__init__()
        # Constant weights that are never updated during training
        self.rand_weight = torch.rand((20, 20), requires_grad=False)
        self.linear = nn.Linear(20, 20)

    def forward(self, X):
        X = self.linear(X)
        X = F.relu(torch.mm(X, self.rand_weight) + 1)
        # Reuse the same layer: both calls share one set of parameters
        X = self.linear(X)
        # Control flow in forward: halve X until its L1 norm is at most 1
        while X.abs().sum() > 1:
            X /= 2
        return X.sum()

class NestMLP(nn.Module):
    def __init__(self):
        super().__init__()
        self.net = nn.Sequential(nn.Linear(20, 64), nn.ReLU(),
                                 nn.Linear(64, 32), nn.ReLU())
        self.linear = nn.Linear(32, 16)

    def forward(self, X):
        return self.linear(self.net(X))

if __name__ == "__main__":
    X = torch.rand(2, 20)
    # net = MLP()
    # Calling an nn.Module subclass invokes its forward method
    # print(net(X))
    # net = MySequential(nn.Linear(20, 256), nn.ReLU(), nn.Linear(256, 10))
    # net(X)
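Since every block is itself an nn.Module, blocks nest freely inside other blocks. A minimal sketch in the spirit of the chapter, assuming it runs in the same script so the classes above are in scope (the variable name chimera is my own):

# Sketch: composing the blocks above inside nn.Sequential.
# Shapes chain as 20 -> 16 -> 20 -> scalar, matching each block's in/out sizes.
chimera = nn.Sequential(NestMLP(), nn.Linear(16, 20), FixedHiddenMLP())
X = torch.rand(2, 20)
print(chimera(X))  # a scalar, because FixedHiddenMLP returns X.sum()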
# Parameter management
import torch
from torch import nn

def block1():
    return nn.Sequential(nn.Linear(4, 8), nn.ReLU(),
                         nn.Linear(8, 4), nn.ReLU())

def block2():
    net = nn.Sequential()
    for i in range(4):
        net.add_module(f'block {i}', block1())
    return net

def init_normal(m):
    if type(m) == nn.Linear:
        nn.init.normal_(m.weight, mean=0, std=0.01)
        nn.init.zeros_(m.bias)

def init_constant(m):
    if type(m) == nn.Linear:
        nn.init.constant_(m.weight, 1)
        nn.init.zeros_(m.bias)

def my_init(m):
    if type(m) == nn.Linear:
        print("Init", *[(name, param.shape)
                        for name, param in m.named_parameters()][0])
        # uniform_ initializes from a uniform distribution over [-10, 10)
        nn.init.uniform_(m.weight, -10, 10)
        # Element-wise mask: keep weights with absolute value >= 5, zero out the rest
        m.weight.data *= m.weight.data.abs() >= 5

if __name__ == "__main__":
    net = nn.Sequential(nn.Linear(4, 8), nn.ReLU(), nn.Linear(8, 1))
    X = torch.rand(size=(2, 4))
    # print(net(X))
    # print(net[2].state_dict())
    # print(type(net[2].bias), net[2].bias, net[2].bias.data, net[2].bias.grad is None)
    # print(*[(name, param.shape) for name, param in net.named_parameters()])
    # print(net.state_dict()['2.bias'].data)
    # rgnet = nn.Sequential(block2(), nn.Linear(4, 1))
    # print(rgnet(X))
    # print(rgnet)
    # print(rgnet[0][1][0].bias.data)
    # net.apply(init_normal)
    # print(net[0].weight.data[0], net[0].bias.data[0])
    net.apply(my_init)
    print(net[0].weight[:2])
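One thing this script does not show is parameter tying: if the same layer object appears at several positions in a network, those positions share one set of parameters and gradients accumulate across them. A minimal sketch, assuming it runs in the same script (variable names shared and tied are my own):

# Sketch: a shared layer used twice inside one network
shared = nn.Linear(8, 8)
tied = nn.Sequential(nn.Linear(4, 8), nn.ReLU(),
                     shared, nn.ReLU(),
                     shared, nn.ReLU(),
                     nn.Linear(8, 1))
tied(torch.rand(2, 4))
# Mutating one occurrence mutates the other: they are the same tensor
tied[2].weight.data[0, 0] = 100
print(tied[2].weight.data[0] == tied[4].weight.data[0])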
# Custom layers
import torch
import torch.nn.functional as F
from torch import nn

# A layer without parameters: subtracts the mean from its input
class CenteredLayer(nn.Module):
    def __init__(self):
        super().__init__()

    def forward(self, X):
        return X - X.mean()

# A layer with parameters: a fully connected layer built from scratch
class MyLinear(nn.Module):
    def __init__(self, in_units, units):
        super().__init__()
        self.weight = nn.Parameter(torch.randn(in_units, units))
        self.bias = nn.Parameter(torch.randn(units,))

    def forward(self, X):
        # Use the parameters directly (not .data) so autograd tracks them
        linear = torch.matmul(X, self.weight) + self.bias
        return F.relu(linear)

if __name__ == "__main__":
    # layer = CenteredLayer()
    # print(layer(torch.FloatTensor([1, 2, 3, 4, 5])))
    # net = nn.Sequential(nn.Linear(8, 128), CenteredLayer())
    # Y = net(torch.rand(4, 8))
    # print(Y.mean())
    linear = MyLinear(5, 3)
    print(linear.weight)
    print(linear(torch.rand(2, 5)))
    net = nn.Sequential(MyLinear(64, 8), MyLinear(8, 1))
    print(net(torch.rand(2, 64)))
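A quick way to confirm that MyLinear's hand-registered nn.Parameter tensors actually participate in autograd is to backpropagate through a dummy loss. A minimal sketch, assuming it runs in the same script with the forward pass written against self.weight rather than self.weight.data:

# Sketch: verify gradients reach the custom parameters
layer = MyLinear(5, 3)
loss = layer(torch.rand(2, 5)).sum()
loss.backward()
print(layer.weight.grad.shape)  # torch.Size([5, 3]) once gradients flow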
# File I/O: saving and loading tensors and model parameters
import torch
from torch import nn
from torch.nn import functional as F

class MLP(nn.Module):
    def __init__(self):
        super().__init__()
        self.hidden = nn.Linear(20, 256)
        self.output = nn.Linear(256, 10)

    def forward(self, x):
        return self.output(F.relu(self.hidden(x)))

if __name__ == "__main__":
    x = torch.arange(4)
    # torch.save(x, 'x-file')
    # x2 = torch.load('x-file', weights_only=True)
    # print(x2)
    y = torch.zeros(4)
    # torch.save([x, y], 'x-files')
    # x2, y2 = torch.load('x-files', weights_only=True)
    # print(x2, y2)
    # mydict = {'x': x, 'y': y}
    # torch.save(mydict, 'mydict')
    # mydict2 = torch.load('mydict', weights_only=True)
    # print(mydict2)
    net = MLP()
    X = torch.randn(size=(2, 20))
    Y = net(X)
    # Save only the parameters, then restore them into a fresh instance
    torch.save(net.state_dict(), 'mlp.params')
    clone = MLP()
    clone.load_state_dict(torch.load('mlp.params', weights_only=True))
    clone.eval()
    Y_clone = clone(X)
    print(Y_clone == Y)
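Note that state_dict stores only tensors, not the architecture, so the class definition (here MLP) must be available when reloading. If the parameters were saved on a GPU, torch.load's map_location argument remaps them onto another device. A minimal sketch reusing the file name from the script above:

# Sketch: load saved parameters onto the CPU regardless of where they were saved
state = torch.load('mlp.params', map_location=torch.device('cpu'),
                   weights_only=True)
clone = MLP()
clone.load_state_dict(state)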
# GPUs and device selection
import torch

def try_gpu(i=0):
    """Return gpu(i) if it exists, otherwise fall back to the CPU."""
    if torch.cuda.device_count() >= i + 1:
        return torch.device(f'cuda:{i}')
    return torch.device('cpu')

def try_all_gpus():
    """Return all available GPUs, or [cpu] if there is no GPU."""
    devices = [torch.device(f'cuda:{i}')
               for i in range(torch.cuda.device_count())]
    return devices if devices else [torch.device('cpu')]

if __name__ == "__main__":
    print(torch.device('cpu'), torch.device('cuda'))
    print(torch.cuda.device_count())
    x = torch.tensor([1, 2, 3])
    print(x.device)  # newly created tensors live on the CPU by default
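The helpers above only pick a device; actually using one means placing both the data and the model's parameters there, since operands of an operation must live on the same device. A minimal sketch, assuming try_gpu from the script above is in scope:

# Sketch: place a tensor and a model on the chosen device
from torch import nn

device = try_gpu()
X = torch.ones(2, 3, device=device)              # create the tensor directly on the device
net = nn.Sequential(nn.Linear(3, 1)).to(device)  # move the parameters to the device
print(net(X).device)                             # the output lives on the same device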