其他分享
首页 > 其他分享> > 【深度学习】DNN房价预测

【深度学习】DNN房价预测

作者:互联网

前言

我们使用深度学习网络实现波士顿房价预测,深度学习的目的就是寻找一个合适的函数输出我们想要的结果。深度学习实际上是机器学习领域中一个研究方向,深度学习的目标是让机器能够像人一样具有分析学习的能力,能够识别文字、图像、声音等数据。我认为深度学习与机器学习最主要的区别就是神经元。

深度学习中重要内容

建立模型——神经元

建立模型——激活函数

image

建立模型——前馈神经网络

image

建立模型——深度神经网络

image

image

损失函数

实践——波士顿房价预测

数据集

使用paddle飞桨波士顿数据集

https://www.paddlepaddle.org.cn/documentation/docs/zh/api/paddle/text/UCIHousing_cn.html

绘图

## 绘图

Batch = 0
Batchs = []
all_train_accs = []
def draw_train_acc(Batchs,train_accs):
    title = "training accs"
    plt.title(title)
    plt.xlabel("batch")
    plt.ylabel("acc")
    plt.plot(Batchs, train_accs, color = 'green', label = 'training accs')
    plt.legend()
    plt.grid()
    plt.show()


all_train_loss = []
def draw_train_loss(Batchs,train_loss):
    title = "training loss"
    plt.title(title)
    plt.xlabel("batch")
    plt.ylabel("loss")
    plt.plot(Batchs, train_loss, color = 'red', label = 'training loss')
    plt.legend()
    plt.grid()
    plt.show()

## 绘制真实值与预测值的对比图
def draw_infer_result(groud_truths, infer_results):
    title = 'Boston'
    plt.title(title)
    x = np.arange(1,20)
    y = x
    plt.plot(x,y);
    plt.xlabel("ground truth")
    plt.ylabel("infer result")
    plt.scatter(groud_truths,infer_results,color='green',label='training cost')
    plt.grid()
    plt.show()

网络搭建


'''
核心

网络搭建
'''

class MyDNN(paddle.nn.Layer):
    def __init__(self):
        super(MyDNN, self).__init__()

        #self.linear1 = paddle.nn.Linear(13,1,None) #全连接层,paddle.nn.Linear(in_features,out_features,weight)

        self.linear1 = paddle.nn.Linear(13, 32, None)

        self.linear2 = paddle.nn.Linear(32, 64, None)

        self.linear3 = paddle.nn.Linear(64, 32, None)

        self.linear4 = paddle.nn.Linear(32, 1, None)
    def forward(self, inputs): ## 传播函数
        x = self.linear1(inputs)
        x = self.linear2(x)
        x = self.linear3(x)
        x = self.linear4(x)
        return x

模型训练与测试


'''
网络训练与测试
'''


## 实例化
model = MyDNN()
model.train()
mse_loss = paddle.nn.MSELoss()
opt = paddle.optimizer.SGD(learning_rate=0.001, parameters=model.parameters())
epochs_num = 100


for epochs in range(epochs_num):
    for batch_id,data in enumerate(train_loader()):
        feature = data[0]
        label = data[1]
        predict = model(feature)
        loss = mse_loss(predict, label)
        loss.backward()
        opt.step()
        opt.clear_grad()
        if batch_id!=0 and batch_id%10 == 0:
            Batch = Batch+10
            Batchs.append(Batch)
            all_train_loss.append(loss.numpy()[0])
            print("epoch{},step:{},train_loss:{}".format(epochs,batch_id,loss.numpy()[0]))

paddle.save(model.state_dict(),"UCIHousingDNN")
draw_train_loss(Batchs,all_train_loss)



para_state = paddle.load("UCIHousingDNN")
model = MyDNN()
model.eval()
model.set_state_dict(para_state)
losses = []


for batch_id,data in enumerate(eval_loader()):
    feature = data[0]
    label = data[1]
    predict = model(feature)
    loss = mse_loss(predict,label)
    losses.append(loss.numpy()[0])
avg_loss = np.mean(losses)

print(avg_loss)


draw_infer_result(label,predict)

代码

## 深度学习框架
import paddle

import numpy as np
import os
import matplotlib.pyplot as plt



## 绘图

Batch = 0
Batchs = []
all_train_accs = []
def draw_train_acc(Batchs,train_accs):
    title = "training accs"
    plt.title(title)
    plt.xlabel("batch")
    plt.ylabel("acc")
    plt.plot(Batchs, train_accs, color = 'green', label = 'training accs')
    plt.legend()
    plt.grid()
    plt.show()


all_train_loss = []
def draw_train_loss(Batchs,train_loss):
    title = "training loss"
    plt.title(title)
    plt.xlabel("batch")
    plt.ylabel("loss")
    plt.plot(Batchs, train_loss, color = 'red', label = 'training loss')
    plt.legend()
    plt.grid()
    plt.show()

## 绘制真实值与预测值的对比图
def draw_infer_result(groud_truths, infer_results):
    title = 'Boston'
    plt.title(title)
    x = np.arange(1,20)
    y = x
    plt.plot(x,y);
    plt.xlabel("ground truth")
    plt.ylabel("infer result")
    plt.scatter(groud_truths,infer_results,color='green',label='training cost')
    plt.grid()
    plt.show()


'''
数据集加载
'''

train_dataset = paddle.text.datasets.UCIHousing(mode="train")
eval_dataset = paddle.text.datasets.UCIHousing(mode="test")

train_loader = paddle.io.DataLoader(train_dataset,batch_size=32, shuffle=True)
eval_loader = paddle.io.DataLoader(eval_dataset,batch_size=8,shuffle=False)

print(train_dataset[1])


'''
核心

网络搭建
'''

class MyDNN(paddle.nn.Layer):
    def __init__(self):
        super(MyDNN, self).__init__()

        #self.linear1 = paddle.nn.Linear(13,1,None) #全连接层,paddle.nn.Linear(in_features,out_features,weight)

        self.linear1 = paddle.nn.Linear(13, 32, None)

        self.linear2 = paddle.nn.Linear(32, 64, None)

        self.linear3 = paddle.nn.Linear(64, 32, None)

        self.linear4 = paddle.nn.Linear(32, 1, None)
    def forward(self, inputs): ## 传播函数
        x = self.linear1(inputs)
        x = self.linear2(x)
        x = self.linear3(x)
        x = self.linear4(x)
        return x


'''
网络训练与测试
'''


## 实例化
model = MyDNN()
model.train()
mse_loss = paddle.nn.MSELoss()
opt = paddle.optimizer.SGD(learning_rate=0.001, parameters=model.parameters())
epochs_num = 100


for epochs in range(epochs_num):
    for batch_id,data in enumerate(train_loader()):
        feature = data[0]
        label = data[1]
        predict = model(feature)
        loss = mse_loss(predict, label)
        loss.backward()
        opt.step()
        opt.clear_grad()
        if batch_id!=0 and batch_id%10 == 0:
            Batch = Batch+10
            Batchs.append(Batch)
            all_train_loss.append(loss.numpy()[0])
            print("epoch{},step:{},train_loss:{}".format(epochs,batch_id,loss.numpy()[0]))

paddle.save(model.state_dict(),"UCIHousingDNN")
draw_train_loss(Batchs,all_train_loss)



para_state = paddle.load("UCIHousingDNN")
model = MyDNN()
model.eval()
model.set_state_dict(para_state)
losses = []


for batch_id,data in enumerate(eval_loader()):
    feature = data[0]
    label = data[1]
    predict = model(feature)
    loss = mse_loss(predict,label)
    losses.append(loss.numpy()[0])
avg_loss = np.mean(losses)

print(avg_loss)


draw_infer_result(label,predict)

结果展示

image

image

标签:loss,plt,title,房价,self,DNN,paddle,train,深度
来源: https://www.cnblogs.com/hjk-airl/p/16620993.html