Pytorch学习 12 深度学习基础网络手动搭建与快速实现

2021-04-13

深度学习 | 机器学习

Pytorch 为什么看起来更加复杂？

只有在处理非结构化、海量数据时，才能看出 Pytorch 的优势。频繁使用类，其实也是为了能够更加灵活地创建不同类型的神经网络模型。

一、回归类数据集创建方法

回归类模型的数据，特征和标签都是连续型数值。

2. 创建生成回归类数据函数

# 随机模块
import random

# 绘图模块
import matplotlib as mpl
import matplotlib.pyplot as plt

# numpy
import numpy as np

# pytorch
import torch
from torch import nn, optim
import torch.functional as F
from torch.utils.data import Dataset, TensorDataset, DataLoader

def tensorGenReg(num_examples = 1000, w = [2, -1, 1], bias = True, delta = 0.01, deg = 1):
    """Generate a synthetic regression data set.

    Features are drawn from a standard normal distribution. Labels are the
    weighted sum of the features raised element-wise to the power ``deg``,
    plus the intercept (when requested) and Gaussian noise scaled by ``delta``.

    :param num_examples: number of rows to generate
    :param w: coefficient sequence; when ``bias`` is True its last entry is the intercept
    :param bias: whether the last entry of ``w`` is an intercept
    :param delta: scale applied to the standard-normal noise added to the labels
    :param deg: power applied element-wise to the features before weighting
    :return: ``(features, labels)``. ``features`` has ``len(w)`` columns; with an
             intercept the last column is all ones. ``labels`` has a single column.
             The returned features are the raw (un-powered) draws.
    """
    # Kept as an equality test (not plain truthiness) so that only True/1
    # select the intercept path, exactly as before.
    with_intercept = bias == True
    num_inputs = len(w) - 1 if with_intercept else len(w)

    # First random draw: the raw features.
    inputs = torch.randn(num_examples, num_inputs)
    coefs = torch.tensor(w[:-1] if with_intercept else w).reshape(-1, 1).float()

    powered = torch.pow(inputs, deg)
    if num_inputs == 1:
        # Single feature: element-wise product broadcasts to one column.
        clean = powered * coefs
    else:
        clean = torch.mm(powered, coefs)

    if with_intercept:
        intercept = torch.tensor(w[-1]).float()
        clean = clean + intercept
        # Append a column of ones so the intercept can be learned as a weight.
        features = torch.cat((inputs, torch.ones(len(inputs), 1)), 1)
    else:
        features = inputs

    # Second random draw: the label noise.
    labels = clean + torch.randn(size = clean.shape) * delta
    return features, labels

二、分类数据集创建方法

和回归模型的数据不同，分类模型数据的标签是离散值

1. 手动创建分类数据集

回顾：torch.normal(4, 2, size=(10, 3)) 会生成一个 10 行 3 列、均值为 4、标准差为 2 的正态分布随机张量。

影响中心点位置的因素：

生成点时的均值差别越大，簇之间的距离越远

生成点时的标准差越大，离散程度越高

2. 创建生成分类数据函数

同样，我们将上述创建分类数据集的过程封装为一个函数。这里需要注意的是，我们希望找到一个变量可以控制数据整体离散程度，也就是后续建模的难易程度。这里我们规定，如果每个分类数据集中心点较近、且每个类别的点内部方差较大，则数据集整体离散程度较高，反之离散程度较低。在实际函数创建过程中，我们也希望能够找到对应的参数，方便进行自主调节。

# 随机模块
import random

# 绘图模块
import matplotlib as mpl
import matplotlib.pyplot as plt

# numpy
import numpy as np

# pytorch
import torch
from torch import nn, optim
import torch.functional as F
from torch.utils.data import Dataset, TensorDataset, DataLoader

def tensorGenCla(num_examples = 500, num_inputs = 2, num_class = 3, deg_disperison = [4, 2], bias = False):
    """Generate a synthetic classification data set made of Gaussian clusters.

    One cluster is drawn per class. Every feature of class ``i`` is sampled
    from a normal distribution with mean ``i * mean_ - k`` and standard
    deviation ``std_``, where ``k`` shifts the class means so that they are
    symmetric around 0 (e.g. -4, 0, 4 for three classes with ``mean_ = 4``).

    :param num_examples: number of rows generated PER CLASS; the result has
                         ``num_class * num_examples`` rows
    :param num_inputs: number of feature columns
    :param num_class: number of classes (labels are ``0 .. num_class - 1``)
    :param deg_disperison: two-element sequence ``[mean_, std_]``; ``mean_`` is the
                           spacing between neighbouring class means, ``std_`` is the
                           standard deviation of every cluster
    :param bias: when true, a column of ones is appended to the features
    :return: ``(features, labels)``; ``features`` is a float 2-D tensor, ``labels``
             is a long tensor with a single column, rows ordered class by class
    """
    mean_ = deg_disperison[0]                 # spacing between class means
    std_ = deg_disperison[1]                  # standard deviation of each cluster
    # Centring offset: the class means i*mean_ - k (i = 0..num_class-1) average to
    # mean_*(num_class-1)/2 - k, so this value of k centres the clusters on 0.
    # (The previous "+ 1" pushed every cluster to the non-positive side.)
    k = mean_ * (num_class - 1) / 2

    lf = []                                   # per-class feature tensors
    ll = []                                   # per-class label tensors
    for i in range(num_class):
        lf.append(torch.normal(i * mean_ - k, std_, size=(num_examples, num_inputs)))
        ll.append(torch.full((num_examples, 1), i, dtype=torch.long))

    features = torch.cat(lf).float()
    labels = torch.cat(ll)

    if bias:
        # Column of ones so a model can learn the intercept as an ordinary weight.
        features = torch.cat((features, torch.ones(len(features), 1)), 1)

    return features, labels

三、创建小批量切分函数

1. 手动生成数据

def data_iter(batch_size, features, labels):
    """Split a data set into shuffled mini-batches.

    The row order is shuffled with Python's ``random`` module, then cut into
    consecutive slices of ``batch_size`` indices.

    :param batch_size: maximum number of rows per mini-batch
    :param features: feature tensor, selected along dimension 0
    :param labels: label tensor, selected along dimension 0 with the same indices
    :return: list of ``[features_batch, labels_batch]`` pairs, one per slice;
             the last pair is smaller when the row count is not a multiple
             of ``batch_size``
    """
    total = len(features)
    order = list(range(total))
    random.shuffle(order)

    batches = []
    for start in range(0, total, batch_size):
        # List slicing clamps at the end, so the final batch is simply shorter.
        picked = torch.tensor(order[start:start + batch_size])
        feature_batch = torch.index_select(features, 0, picked)
        label_batch = torch.index_select(labels, 0, picked)
        batches.append([feature_batch, label_batch])
    return batches

四、Python模块编写

torchLearning.py

# 随机模块
import random

# 绘图模块
import matplotlib as mpl
import matplotlib.pyplot as plt

# numpy
import numpy as np

# pytorch
import torch
from torch import nn, optim
import torch.functional as F
from torch.utils.data import Dataset, TensorDataset, DataLoader


def tensorGenReg(num_examples=1000, w=[2, -1, 1], bias=True, delta=0.01, deg=1):
    """Generate a synthetic regression data set.

    Features are drawn from a standard normal distribution. Labels are the
    weighted sum of the features raised element-wise to the power ``deg``,
    plus the intercept (when requested) and Gaussian noise scaled by ``delta``.

    :param num_examples: number of rows to generate
    :param w: coefficient sequence; when ``bias`` is True its last entry is the intercept
    :param bias: whether the last entry of ``w`` is an intercept
    :param delta: scale applied to the standard-normal noise added to the labels
    :param deg: power applied element-wise to the features before weighting
    :return: ``(features, labels)``. ``features`` has ``len(w)`` columns; with an
             intercept the last column is all ones. ``labels`` has a single column.
             The returned features are the raw (un-powered) draws.
    """
    # Kept as an equality test (not plain truthiness) so that only True/1
    # select the intercept path, exactly as before.
    with_intercept = bias == True
    num_inputs = len(w) - 1 if with_intercept else len(w)

    # First random draw: the raw features.
    inputs = torch.randn(num_examples, num_inputs)
    coefs = torch.tensor(w[:-1] if with_intercept else w).reshape(-1, 1).float()

    powered = torch.pow(inputs, deg)
    if num_inputs == 1:
        # Single feature: element-wise product broadcasts to one column.
        clean = powered * coefs
    else:
        clean = torch.mm(powered, coefs)

    if with_intercept:
        intercept = torch.tensor(w[-1]).float()
        clean = clean + intercept
        # Append a column of ones so the intercept can be learned as a weight.
        features = torch.cat((inputs, torch.ones(len(inputs), 1)), 1)
    else:
        features = inputs

    # Second random draw: the label noise.
    labels = clean + torch.randn(size=clean.shape) * delta
    return features, labels


def tensorGenCla(num_examples=500, num_inputs=2, num_class=3, deg_disperison=[4, 2], bias=False):
    """Generate a synthetic classification data set made of Gaussian clusters.

    One cluster is drawn per class. Every feature of class ``i`` is sampled
    from a normal distribution with mean ``i * mean_ - k`` and standard
    deviation ``std_``, where ``k`` shifts the class means so that they are
    symmetric around 0 (e.g. -4, 0, 4 for three classes with ``mean_ = 4``).

    :param num_examples: number of rows generated PER CLASS; the result has
                         ``num_class * num_examples`` rows
    :param num_inputs: number of feature columns
    :param num_class: number of classes (labels are ``0 .. num_class - 1``)
    :param deg_disperison: two-element sequence ``[mean_, std_]``; ``mean_`` is the
                           spacing between neighbouring class means, ``std_`` is the
                           standard deviation of every cluster
    :param bias: when true, a column of ones is appended to the features
    :return: ``(features, labels)``; ``features`` is a float 2-D tensor, ``labels``
             is a long tensor with a single column, rows ordered class by class
    """
    mean_ = deg_disperison[0]  # spacing between class means
    std_ = deg_disperison[1]  # standard deviation of each cluster
    # Centring offset: the class means i*mean_ - k (i = 0..num_class-1) average to
    # mean_*(num_class-1)/2 - k, so this value of k centres the clusters on 0.
    # (The previous "+ 1" pushed every cluster to the non-positive side.)
    k = mean_ * (num_class - 1) / 2

    lf = []  # per-class feature tensors
    ll = []  # per-class label tensors
    for i in range(num_class):
        lf.append(torch.normal(i * mean_ - k, std_, size=(num_examples, num_inputs)))
        ll.append(torch.full((num_examples, 1), i, dtype=torch.long))

    features = torch.cat(lf).float()
    labels = torch.cat(ll)

    if bias:
        # Column of ones so a model can learn the intercept as an ordinary weight.
        features = torch.cat((features, torch.ones(len(features), 1)), 1)

    return features, labels


def data_iter(batch_size, features, labels):
    """Split a data set into shuffled mini-batches.

    The row order is shuffled with Python's ``random`` module, then cut into
    consecutive slices of ``batch_size`` indices.

    :param batch_size: maximum number of rows per mini-batch
    :param features: feature tensor, selected along dimension 0
    :param labels: label tensor, selected along dimension 0 with the same indices
    :return: list of ``[features_batch, labels_batch]`` pairs, one per slice;
             the last pair is smaller when the row count is not a multiple
             of ``batch_size``
    """
    total = len(features)
    order = list(range(total))
    random.shuffle(order)

    batches = []
    for start in range(0, total, batch_size):
        # List slicing clamps at the end, so the final batch is simply shorter.
        picked = torch.tensor(order[start:start + batch_size])
        feature_batch = torch.index_select(features, 0, picked)
        label_batch = torch.index_select(labels, 0, picked)
        batches.append([feature_batch, label_batch])
    return batches