亚欧色一区w666天堂,色情一区二区三区免费看,少妇特黄A片一区二区三区,亚洲人成网站999久久久综合,国产av熟女一区二区三区

點贊

評論

原創

pytorch-訓練全流程

2024-11-14 09:41:58

import torch

# Re-seed PyTorch's default RNG with a non-deterministic value, so the random
# batches drawn by generate_data() differ from run to run.
torch.seed()


class PolRegression(torch.nn.Module):
    """Polynomial regression expressed as a single linear layer.

    The caller supplies the polynomial features as input columns; the layer
    learns one weight per feature plus a bias and emits one value per row.
    """

    def __init__(self, input_dim):
        """Build the layer mapping ``input_dim`` features to one output."""
        super().__init__()
        self.linear = torch.nn.Linear(input_dim, 1)

    def forward(self, x):
        """Apply the linear layer to ``x`` and return the result."""
        prediction = self.linear(x)
        return prediction


def generate_data(batch_size=32):
    """Sample one batch for fitting y = 2x^3 + 3x^2 + 4x + 5.

    Args:
        batch_size: Number of samples to draw.

    Returns:
        A tuple ``(x_data, y)``. ``x_data`` has shape (batch_size, 3) with
        columns x, x**2, x**3. ``y`` has shape (batch_size, 1) and holds the
        polynomial value plus Gaussian noise divided by 100.
    """
    # Integer-valued inputs in [-5, 4] (randint's upper bound is exclusive);
    # multiplying by 1.0 promotes them to floating point.
    x = torch.randint(-5, 5, (batch_size,)) * 1.0
    # Turn x into a column so every term below is (batch_size, 1).
    x = x.unsqueeze(1)

    # The noise is drawn as (batch_size, 1) on purpose: a 1-D (batch_size,)
    # tensor would broadcast against the column to (batch_size, batch_size).
    noise = torch.randn(batch_size, 1) / 100
    y = 2.0 * x ** 3 + 3.0 * x ** 2 + 4.0 * x + 5.0 + noise

    x_data = torch.cat([x ** power for power in range(1, 4)], 1)

    return x_data, y


# Default checkpoint file. rotate_save_file() keeps older versions next to it
# as poly-regression-model.1.pth, poly-regression-model.2.pth, ...
checkpoint_path = 'poly-regression-model.pth'


def train(num_epoch=1000):
    """Fit PolRegression on freshly generated batches, resuming if possible.

    The model and an Adam optimizer are created, then read_checkpoint() is
    asked to restore their state from ``checkpoint_path`` (or one of its
    rotated versions). Training continues from the returned epoch, writing a
    checkpoint every 10 epochs and once more at the end when the last epoch
    has not been checkpointed yet.

    Args:
        num_epoch: Epoch number at which training stops. Each "epoch" here is
            one optimizer step on one generated batch of 32 samples.

    Raises:
        SystemExit: With code 1 whenever the epoch number is a multiple of
            10240; this deliberately simulates a crash to exercise resuming.
    """
    device = "cuda" if torch.cuda.is_available() else "cpu"
    model = PolRegression(3).to(device)

    loss_func = torch.nn.MSELoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=0.01)

    # Restores state in place; 0 means no usable checkpoint was found.
    start_epoch = read_checkpoint(model, optimizer, checkpoint_path)
    # Tracks the newest epoch known to be on disk so the final save below
    # does not rotate a duplicate of a checkpoint that was just written.
    last_saved_epoch = start_epoch
    for i in range(start_epoch, num_epoch):
        epoch = i + 1
        x, y = generate_data(32)
        x = x.to(device)
        y = y.to(device)

        predicted = model(x)
        loss = loss_func(predicted, y)
        loss.backward()
        optimizer.step()
        optimizer.zero_grad()
        print(f"Epoch {epoch} , loss {loss.item()}")

        if epoch % 10 == 0:
            write_checkpoint(epoch, model, optimizer, checkpoint_path)
            last_saved_epoch = epoch

        if epoch % 10240 == 0:
            print("just for simulator panic")  # simulate a crash
            # Same effect as exit(1) without relying on the `site` builtin.
            raise SystemExit(1)

    print(f'weight: {model.linear.weight.data}')
    print(f'bias: {model.linear.bias.data}')
    # Skip the final save when the state on disk is already at (or beyond)
    # num_epoch; saving again would only push a real backup out of rotation
    # or label a longer-trained state with a smaller epoch number.
    if last_saved_epoch < num_epoch:
        write_checkpoint(num_epoch, model, optimizer, checkpoint_path)


def save_checkpoint(epoch, model, optimizer, path):
    """Serialize the training state to ``path`` without exposing a partial file.

    Args:
        epoch: Epoch number stored under the ``"epoch"`` key.
        model: Object whose ``state_dict()`` is stored under
            ``"model_state_dict"``.
        optimizer: Object whose ``state_dict()`` is stored under
            ``"optimizer_state_dict"``.
        path: Destination file path.

    Raises:
        Whatever ``torch.save`` or ``os.replace`` raise; in that case the
        file previously at ``path`` is left untouched.
    """
    state = {
        "epoch": epoch,
        "model_state_dict": model.state_dict(),
        "optimizer_state_dict": optimizer.state_dict(),
    }
    # Write to a sibling temp file and swap it in afterwards, so a failure
    # while serializing never truncates the checkpoint already at `path`.
    tmp_path = f"{os.fspath(path)}.tmp"
    try:
        torch.save(state, tmp_path)
        os.replace(tmp_path, path)
    except BaseException:
        # Do not leave a half-written temp file behind.
        if os.path.exists(tmp_path):
            os.remove(tmp_path)
        raise


import os
import shutil


def rotate_save_file(file_path, max_versions=5):
    """Move ``file_path`` to version 1, shifting existing versions up by one.

    Versions live next to the original and are named ``<base>.<n><ext>``.
    Nothing happens when ``file_path`` does not exist.

    Args:
        file_path: File to rotate away.
        max_versions: Highest version number that is written; versions
            1 .. max_versions - 1 are each moved one slot up.
    """
    if os.path.exists(file_path):
        directory, name = os.path.split(file_path)
        stem, suffix = os.path.splitext(name)

        def versioned(number):
            # Path of the numbered backup beside the original file.
            return os.path.join(directory, f"{stem}.{number}{suffix}")

        # Walk from the highest version down so no backup is overwritten
        # before it has itself been moved.
        for version in reversed(range(1, max_versions)):
            source = versioned(version)
            if os.path.exists(source):
                shutil.move(source, versioned(version + 1))

        # Finally the current file becomes version 1.
        shutil.move(file_path, versioned(1))


def write_checkpoint(epoch, model, optimizer, path):
    """Rotate the checkpoint currently at ``path``, then save a new one there.

    Args:
        epoch: Epoch number to record in the checkpoint.
        model: Model whose state is saved.
        optimizer: Optimizer whose state is saved.
        path: Checkpoint file to rotate and then rewrite.
    """
    # Rotate the file that is about to be overwritten, i.e. `path` itself
    # rather than the module-level default checkpoint location.
    rotate_save_file(path)
    save_checkpoint(epoch, model, optimizer, path)


def load_checkpoint(model, optimizer, path):
    """Restore model and optimizer state from the checkpoint at ``path``.

    Args:
        model: Module that receives ``checkpoint["model_state_dict"]``.
        optimizer: Optimizer that receives
            ``checkpoint["optimizer_state_dict"]``.
        path: Checkpoint file to read.

    Returns:
        The value stored under ``checkpoint["epoch"]``.

    Raises:
        KeyError: If one of the three expected keys is missing.
        Exception: Anything ``torch.load`` or the ``load_state_dict`` calls
            raise, e.g. for a truncated or incompatible file.
    """
    # Deserialize onto the device the model already lives on, so a checkpoint
    # written on a GPU can still be resumed on a CPU-only machine.
    first_param = next(iter(model.parameters()), None)
    if first_param is not None:
        target_device = first_param.device
    else:
        target_device = torch.device("cpu")
    # NOTE(review): torch.load unpickles the file; only load checkpoints
    # that come from a trusted source.
    checkpoint = torch.load(path, map_location=target_device)
    model.load_state_dict(checkpoint["model_state_dict"])
    optimizer.load_state_dict(checkpoint["optimizer_state_dict"])
    epoch = checkpoint["epoch"]
    print(f"checkpoint loaded, starting at epoch {epoch}")
    return epoch


def read_checkpoint(model, optimizer, checkpoint_path, max_versions=5):
    """Load the first usable checkpoint, trying the main file and then versions.

    Candidates are tried in order: ``checkpoint_path`` itself, followed by
    ``<base>.1<ext>`` up to ``<base>.<max_versions><ext>`` in the same
    directory. A candidate that fails to load is reported and skipped.

    Args:
        model: Passed through to load_checkpoint().
        optimizer: Passed through to load_checkpoint().
        checkpoint_path: Path of the main checkpoint file.
        max_versions: Highest version number to try.

    Returns:
        The epoch returned by load_checkpoint() for the first candidate that
        loads, or 0 when none does.
    """
    folder, filename = os.path.split(checkpoint_path)
    stem, suffix = os.path.splitext(filename)

    # Index 0 stands for the main file; higher indices are the numbered versions.
    candidates = [
        checkpoint_path if number == 0
        else os.path.join(folder, f"{stem}.{number}{suffix}")
        for number in range(max_versions + 1)
    ]

    for candidate in candidates:
        if not os.path.exists(candidate):
            continue
        try:
            resumed_epoch = load_checkpoint(model, optimizer, candidate)
        except Exception as e:
            # Best effort: an unreadable file just means trying an older one.
            print(f"{candidate} have exception {e}")
            continue
        print(f"load {candidate} success")
        return resumed_epoch

    print("not found checkpoint, starting training from scratch.")
    return 0


def test_


'''
Broadcasting demo: adding a (batch_size,) tensor to a (batch_size, 1) tensor
broadcasts to (batch_size, batch_size) -- see the third size printed below.

import torch

batch_size = 10
x = torch.randint(-5, 5, (batch_size,)) * 1.0  # 改成float
x = x.unsqueeze(1)
print(x.size())

y = 2 * x
print(y.size())

y = 2 * x + torch.randn(batch_size)
print(y.size())

z = torch.randn((batch_size, 1))
print(z.size())
'''

'''
torch.Size([10, 1])
torch.Size([10, 1])
torch.Size([10, 10])
torch.Size([10, 1])

'''

0條評論

作者已關閉評論

Top123

32文章數

0點贊數

3粉絲數

Top123

32 文章 | 3 粉絲

Top123

32文章數

0點贊數

3粉絲數

Top123

32 文章 | 3 粉絲

原創

pytorch-訓練全流程

2024-11-14 09:41:58

import torch

# Re-seed PyTorch's default RNG with a non-deterministic value, so the random
# batches drawn by generate_data() differ from run to run.
torch.seed()


class PolRegression(torch.nn.Module):
    """Polynomial regression expressed as a single linear layer.

    The caller supplies the polynomial features as input columns; the layer
    learns one weight per feature plus a bias and emits one value per row.
    """

    def __init__(self, input_dim):
        """Build the layer mapping ``input_dim`` features to one output."""
        super().__init__()
        self.linear = torch.nn.Linear(input_dim, 1)

    def forward(self, x):
        """Apply the linear layer to ``x`` and return the result."""
        prediction = self.linear(x)
        return prediction


def generate_data(batch_size=32):
    """Sample one batch for fitting y = 2x^3 + 3x^2 + 4x + 5.

    Args:
        batch_size: Number of samples to draw.

    Returns:
        A tuple ``(x_data, y)``. ``x_data`` has shape (batch_size, 3) with
        columns x, x**2, x**3. ``y`` has shape (batch_size, 1) and holds the
        polynomial value plus Gaussian noise divided by 100.
    """
    # Integer-valued inputs in [-5, 4] (randint's upper bound is exclusive);
    # multiplying by 1.0 promotes them to floating point.
    x = torch.randint(-5, 5, (batch_size,)) * 1.0
    # Turn x into a column so every term below is (batch_size, 1).
    x = x.unsqueeze(1)

    # The noise is drawn as (batch_size, 1) on purpose: a 1-D (batch_size,)
    # tensor would broadcast against the column to (batch_size, batch_size).
    noise = torch.randn(batch_size, 1) / 100
    y = 2.0 * x ** 3 + 3.0 * x ** 2 + 4.0 * x + 5.0 + noise

    x_data = torch.cat([x ** power for power in range(1, 4)], 1)

    return x_data, y


# Default checkpoint file. rotate_save_file() keeps older versions next to it
# as poly-regression-model.1.pth, poly-regression-model.2.pth, ...
checkpoint_path = 'poly-regression-model.pth'


def train(num_epoch=1000):
    """Fit PolRegression on freshly generated batches, resuming if possible.

    The model and an Adam optimizer are created, then read_checkpoint() is
    asked to restore their state from ``checkpoint_path`` (or one of its
    rotated versions). Training continues from the returned epoch, writing a
    checkpoint every 10 epochs and once more at the end when the last epoch
    has not been checkpointed yet.

    Args:
        num_epoch: Epoch number at which training stops. Each "epoch" here is
            one optimizer step on one generated batch of 32 samples.

    Raises:
        SystemExit: With code 1 whenever the epoch number is a multiple of
            10240; this deliberately simulates a crash to exercise resuming.
    """
    device = "cuda" if torch.cuda.is_available() else "cpu"
    model = PolRegression(3).to(device)

    loss_func = torch.nn.MSELoss()
    optimizer = torch.optim.Adam(model.parameters(), lr=0.01)

    # Restores state in place; 0 means no usable checkpoint was found.
    start_epoch = read_checkpoint(model, optimizer, checkpoint_path)
    # Tracks the newest epoch known to be on disk so the final save below
    # does not rotate a duplicate of a checkpoint that was just written.
    last_saved_epoch = start_epoch
    for i in range(start_epoch, num_epoch):
        epoch = i + 1
        x, y = generate_data(32)
        x = x.to(device)
        y = y.to(device)

        predicted = model(x)
        loss = loss_func(predicted, y)
        loss.backward()
        optimizer.step()
        optimizer.zero_grad()
        print(f"Epoch {epoch} , loss {loss.item()}")

        if epoch % 10 == 0:
            write_checkpoint(epoch, model, optimizer, checkpoint_path)
            last_saved_epoch = epoch

        if epoch % 10240 == 0:
            print("just for simulator panic")  # simulate a crash
            # Same effect as exit(1) without relying on the `site` builtin.
            raise SystemExit(1)

    print(f'weight: {model.linear.weight.data}')
    print(f'bias: {model.linear.bias.data}')
    # Skip the final save when the state on disk is already at (or beyond)
    # num_epoch; saving again would only push a real backup out of rotation
    # or label a longer-trained state with a smaller epoch number.
    if last_saved_epoch < num_epoch:
        write_checkpoint(num_epoch, model, optimizer, checkpoint_path)


def save_checkpoint(epoch, model, optimizer, path):
    """Serialize the training state to ``path`` without exposing a partial file.

    Args:
        epoch: Epoch number stored under the ``"epoch"`` key.
        model: Object whose ``state_dict()`` is stored under
            ``"model_state_dict"``.
        optimizer: Object whose ``state_dict()`` is stored under
            ``"optimizer_state_dict"``.
        path: Destination file path.

    Raises:
        Whatever ``torch.save`` or ``os.replace`` raise; in that case the
        file previously at ``path`` is left untouched.
    """
    state = {
        "epoch": epoch,
        "model_state_dict": model.state_dict(),
        "optimizer_state_dict": optimizer.state_dict(),
    }
    # Write to a sibling temp file and swap it in afterwards, so a failure
    # while serializing never truncates the checkpoint already at `path`.
    tmp_path = f"{os.fspath(path)}.tmp"
    try:
        torch.save(state, tmp_path)
        os.replace(tmp_path, path)
    except BaseException:
        # Do not leave a half-written temp file behind.
        if os.path.exists(tmp_path):
            os.remove(tmp_path)
        raise


import os
import shutil


def rotate_save_file(file_path, max_versions=5):
    """Move ``file_path`` to version 1, shifting existing versions up by one.

    Versions live next to the original and are named ``<base>.<n><ext>``.
    Nothing happens when ``file_path`` does not exist.

    Args:
        file_path: File to rotate away.
        max_versions: Highest version number that is written; versions
            1 .. max_versions - 1 are each moved one slot up.
    """
    if os.path.exists(file_path):
        directory, name = os.path.split(file_path)
        stem, suffix = os.path.splitext(name)

        def versioned(number):
            # Path of the numbered backup beside the original file.
            return os.path.join(directory, f"{stem}.{number}{suffix}")

        # Walk from the highest version down so no backup is overwritten
        # before it has itself been moved.
        for version in reversed(range(1, max_versions)):
            source = versioned(version)
            if os.path.exists(source):
                shutil.move(source, versioned(version + 1))

        # Finally the current file becomes version 1.
        shutil.move(file_path, versioned(1))


def write_checkpoint(epoch, model, optimizer, path):
    """Rotate the checkpoint currently at ``path``, then save a new one there.

    Args:
        epoch: Epoch number to record in the checkpoint.
        model: Model whose state is saved.
        optimizer: Optimizer whose state is saved.
        path: Checkpoint file to rotate and then rewrite.
    """
    # Rotate the file that is about to be overwritten, i.e. `path` itself
    # rather than the module-level default checkpoint location.
    rotate_save_file(path)
    save_checkpoint(epoch, model, optimizer, path)


def load_checkpoint(model, optimizer, path):
    """Restore model and optimizer state from the checkpoint at ``path``.

    Args:
        model: Module that receives ``checkpoint["model_state_dict"]``.
        optimizer: Optimizer that receives
            ``checkpoint["optimizer_state_dict"]``.
        path: Checkpoint file to read.

    Returns:
        The value stored under ``checkpoint["epoch"]``.

    Raises:
        KeyError: If one of the three expected keys is missing.
        Exception: Anything ``torch.load`` or the ``load_state_dict`` calls
            raise, e.g. for a truncated or incompatible file.
    """
    # Deserialize onto the device the model already lives on, so a checkpoint
    # written on a GPU can still be resumed on a CPU-only machine.
    first_param = next(iter(model.parameters()), None)
    if first_param is not None:
        target_device = first_param.device
    else:
        target_device = torch.device("cpu")
    # NOTE(review): torch.load unpickles the file; only load checkpoints
    # that come from a trusted source.
    checkpoint = torch.load(path, map_location=target_device)
    model.load_state_dict(checkpoint["model_state_dict"])
    optimizer.load_state_dict(checkpoint["optimizer_state_dict"])
    epoch = checkpoint["epoch"]
    print(f"checkpoint loaded, starting at epoch {epoch}")
    return epoch


def read_checkpoint(model, optimizer, checkpoint_path, max_versions=5):
    """Load the first usable checkpoint, trying the main file and then versions.

    Candidates are tried in order: ``checkpoint_path`` itself, followed by
    ``<base>.1<ext>`` up to ``<base>.<max_versions><ext>`` in the same
    directory. A candidate that fails to load is reported and skipped.

    Args:
        model: Passed through to load_checkpoint().
        optimizer: Passed through to load_checkpoint().
        checkpoint_path: Path of the main checkpoint file.
        max_versions: Highest version number to try.

    Returns:
        The epoch returned by load_checkpoint() for the first candidate that
        loads, or 0 when none does.
    """
    folder, filename = os.path.split(checkpoint_path)
    stem, suffix = os.path.splitext(filename)

    # Index 0 stands for the main file; higher indices are the numbered versions.
    candidates = [
        checkpoint_path if number == 0
        else os.path.join(folder, f"{stem}.{number}{suffix}")
        for number in range(max_versions + 1)
    ]

    for candidate in candidates:
        if not os.path.exists(candidate):
            continue
        try:
            resumed_epoch = load_checkpoint(model, optimizer, candidate)
        except Exception as e:
            # Best effort: an unreadable file just means trying an older one.
            print(f"{candidate} have exception {e}")
            continue
        print(f"load {candidate} success")
        return resumed_epoch

    print("not found checkpoint, starting training from scratch.")
    return 0


def test_


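'''
Broadcasting demo: adding a (batch_size,) tensor to a (batch_size, 1) tensor
broadcasts to (batch_size, batch_size) -- see the third size printed below.
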
import torch

batch_size = 10
x = torch.randint(-5, 5, (batch_size,)) * 1.0  # 改成float
x = x.unsqueeze(1)
print(x.size())

y = 2 * x
print(y.size())

y = 2 * x + torch.randn(batch_size)
print(y.size())

z = torch.randn((batch_size, 1))
print(z.size())
'''

'''
torch.Size([10, 1])
torch.Size([10, 1])
torch.Size([10, 10])
torch.Size([10, 1])

'''

文章來自個人專欄

文章 | 訂閱

0條評論

作者已關閉評論

亚欧色一区w666天堂,色情一区二区三区免费看,少妇特黄A片一区二区三区,亚洲人成网站999久久久综合,国产av熟女一区二区三区

智算服務

應用商城

定價

合作伙伴

開發者

支持與服務

了解天翼云

pytorch-訓練全流程

pytorch-訓練全流程

亚欧色一区w666天堂,色情一区二区三区免费看,少妇特黄A片一区二区三区,亚洲人成网站999久久久综合,国产av熟女一区二区三区

活動

智算服務

應用商城

定價

合作伙伴

開發者

支持與服務

了解天翼云

pytorch-訓練全流程

pytorch-訓練全流程