代码
加载数据
import tensorflow as tf
from tensorflow import keras
# load_data() returns a (train, test) pair, each of which is itself an
# (images, labels) pair; unpack it in two steps for readability.
fashion_mnist = keras.datasets.fashion_mnist
train_split, test_split = fashion_mnist.load_data()
X_train_full, y_train_full = train_split
X_test, y_test = test_split
创建验证集
并且将像素强度缩放到0-1范围（除以255）
# Hold out the first 5,000 training samples as a validation set and keep the
# remainder for training. Dividing by 255. rescales the pixel intensities
# to floats in the 0-1 range.
X_valid, X_train = X_train_full[:5000] / 255., X_train_full[5000:] / 255.
y_valid, y_train = y_train_full[:5000], y_train_full[5000:]
# The test images must be scaled exactly like the training images; otherwise
# model.evaluate() / model.predict() further down would receive raw pixel
# values that the network never saw during training.
# NOTE: this rebinds X_test, so run this cell only once per load_data() call.
X_test = X_test / 255.
简单查看数据
import matplotlib.pyplot as plt
# Draw the first training image with the "binary" colormap and hide the axes.
sample_image = X_train[0]
plt.imshow(sample_image, cmap="binary")
plt.axis("off")
plt.show()
![在这里插入图片描述](s3://crabby-images/58de4/58de4dbd9c7c4d3e3b8e36161b29f9bb008b81c6)
# Display the dimensions of the full (unsplit) training image array.
X_train_full.shape
![在这里插入图片描述](s3://crabby-images/d431c/d431ca0887d56620934ee017c298199f58737a49)
# Display the training labels (the part of y_train_full after the first 5,000).
y_train
![在这里插入图片描述](s3://crabby-images/94751/9475115599e672b755a1676cb9b65c1edb464723)
使用类名列表将标签编号转换为对应的类别名称
# Human-readable names, ordered so that the list index is the label value.
class_names = [
    "T-shirt/top",
    "Trouser",
    "Pullover",
    "Dress",
    "Coat",
    "Sandal",
    "Shirt",
    "Sneaker",
    "Bag",
    "Ankle boot",
]
# Look up the name of the first training sample's label.
first_label = y_train[0]
class_names[first_label]
![在这里插入图片描述](s3://crabby-images/36aae/36aae97394bb4345bdc30c1c5f0ce24960a21e83)
训练数据
定义神经网络
# Build the classifier layer by layer: flatten each 28x28 image, pass it
# through two ReLU hidden layers (300 and 100 units), and finish with a
# 10-unit softmax output layer.
model = keras.models.Sequential()
model.add(keras.layers.Flatten(input_shape=[28, 28]))
model.add(keras.layers.Dense(300, activation="relu"))
model.add(keras.layers.Dense(100, activation="relu"))
model.add(keras.layers.Dense(10, activation="softmax"))
显示模型的所有层
# Print a per-layer overview of the model.
model.summary()
![在这里插入图片描述](s3://crabby-images/d5169/d5169f2c829d2a8456f587af2c4f614bea6aed89)
访问某一层的所有参数
# model.layers[1] is the second entry of the Sequential model, i.e. the first
# Dense layer (index 0 is the Flatten layer).
hidden1 = model.layers[1]
# get_weights() yields two values here, unpacked as the layer's weights and
# its biases.
weights, biases = hidden1.get_weights()
![在这里插入图片描述](s3://crabby-images/c2439/c2439061ec1bffc6d9f0d9806c3d753d1fdb8a7c) ![在这里插入图片描述](s3://crabby-images/4bd9c/4bd9cedb9788caf39ddb554520ae17211a83a690)
指定损失函数等参数
# Training configuration: the "sparse" cross-entropy loss is used with the
# integer class labels in y_train, plain SGD is the optimizer, and accuracy
# is tracked as a metric.
compile_options = {
    "loss": "sparse_categorical_crossentropy",
    "optimizer": "sgd",
    "metrics": ["accuracy"],
}
model.compile(**compile_options)
训练模型
# Train for 30 epochs, passing the held-out validation split as
# validation_data; the returned History object is kept for plotting later.
validation_pair = (X_valid, y_valid)
history = model.fit(
    x=X_train,
    y=y_train,
    epochs=30,
    validation_data=validation_pair,
)
如果想查看每个轮次结束时测得的平均训练/验证损失和准确率，可以将 history.history 转换为 DataFrame 并绘制学习曲线
import pandas as pd
# Plot every series recorded in history.history on one 8x5 figure.
history_frame = pd.DataFrame(history.history)
history_frame.plot(figsize=(8, 5))
plt.grid(True)
# Clamp the vertical axis to [0, 1].
current_axes = plt.gca()
current_axes.set_ylim(0, 1)
plt.show()
![在这里插入图片描述](s3://crabby-images/00e29/00e29fb5009db259ba2b5c8f9ef7c366953835b6)
在测试集上评估
# Evaluate the trained model on the test set.
# NOTE(review): X_test must be scaled the same way as the training inputs
# (divided by 255) for this score to be meaningful - confirm before running.
model.evaluate(X_test, y_test)
![在这里插入图片描述](s3://crabby-images/ac291/ac29191876acbbef35dbed89aad2bb16de21ea49)
预测
# Use the first three test images as stand-ins for "new" samples.
X_new = X_test[:3]
# One row per sample from the 10-unit softmax output layer.
y_proba = model.predict(X_new)
# Round to two decimals purely for display.
y_proba.round(2)
输出各个类的概率：
![在这里插入图片描述](s3://crabby-images/42eac/42eace2cbcc6e85016506f69220b2fbed407554e)
# Sequential.predict_classes() was removed in TensorFlow 2.6; the documented
# replacement is to take the argmax over the class axis of the softmax
# probabilities returned by predict().
import numpy as np

y_pred = np.argmax(model.predict(X_new), axis=-1)
y_pred
![在这里插入图片描述](s3://crabby-images/a74a5/a74a587e8b403e0642137707f249f38567a0b7f8)
|