深度学习基础与图像识别系统开发

深度学习基础与图像识别系统开发 | 极客日志

pip install tensorflow

import tensorflow as tf

# Build the model: 784 inputs -> Dense(10, ReLU) -> Dense(10, softmax).
model = tf.keras.Sequential([
    # An explicit Input object is the documented way to declare the input
    # shape of a Sequential model (instead of input_shape= on the first layer).
    tf.keras.Input(shape=(784,)),
    tf.keras.layers.Dense(10, activation="relu"),
    tf.keras.layers.Dense(10, activation="softmax"),
])

# Compile the model: Adam optimizer, sparse categorical cross-entropy loss,
# and accuracy as the reported metric.
model.compile(optimizer="adam", loss="sparse_categorical_crossentropy", metrics=["accuracy"])

# Load the MNIST train/test splits.
(x_train, y_train), (x_test, y_test) = tf.keras.datasets.mnist.load_data()

# Preprocess: flatten every image to 784 values and divide by 255.0.
# -1 lets NumPy infer the number of samples instead of hard-coding it.
x_train = x_train.reshape((-1, 784)) / 255.0
x_test = x_test.reshape((-1, 784)) / 255.0

# Train the model.
model.fit(x_train, y_train, epochs=5, batch_size=32)

# Evaluate the model on the test split.
test_loss, test_acc = model.evaluate(x_test, y_test)
print(f"Test Loss: {test_loss:.4f}")
print(f"Test Accuracy: {test_acc:.4f}")

pip install torch torchvision

import torch
import torch.nn as nn
import torch.optim as optim
import torchvision
import torchvision.transforms as transforms

# Preprocessing pipeline: convert each image to a tensor, then normalize it
# with mean 0.5 and standard deviation 0.5.
_normalize = transforms.Normalize(mean=(0.5,), std=(0.5,))
transform = transforms.Compose([transforms.ToTensor(), _normalize])

# Arguments shared by the training and test MNIST datasets.
_mnist_args = {"root": "./data", "download": True, "transform": transform}
trainset = torchvision.datasets.MNIST(train=True, **_mnist_args)
testset = torchvision.datasets.MNIST(train=False, **_mnist_args)

# Batches of 32; only the training loader shuffles.
trainloader = torch.utils.data.DataLoader(trainset, batch_size=32, shuffle=True)
testloader = torch.utils.data.DataLoader(testset, batch_size=32, shuffle=False)

# Build the model
class Net(nn.Module):
    """Two-layer fully connected classifier: 784 -> 10 (ReLU) -> 10 logits."""

    def __init__(self):
        super().__init__()
        self.fc1 = nn.Linear(784, 10)
        self.fc2 = nn.Linear(10, 10)

    def forward(self, x):
        """Return unnormalized class scores (logits), one row of 10 per sample.

        The input is flattened to rows of 784 values before the first layer.
        """
        x = x.view(-1, 784)
        x = torch.relu(self.fc1(x))
        # No softmax here: nn.CrossEntropyLoss applies log-softmax itself, so
        # feeding it probabilities would normalize twice and weaken gradients.
        # The argmax of the logits equals the argmax of their softmax, so
        # class predictions are unaffected.
        return self.fc2(x)

# Instantiate the network
model = Net()

# Define the loss function and the optimizer (PyTorch has no separate "compile" step).
# NOTE(review): nn.CrossEntropyLoss applies log-softmax internally, so it
# expects unnormalized logits from the model — confirm the model's output.
criterion = nn.CrossEntropyLoss()
optimizer = optim.Adam(model.parameters(), lr=0.001)

# Train the model for 5 epochs, reporting the mean loss every 100 batches.
for epoch in range(5):
    running_loss = 0.0
    for i, (inputs, labels) in enumerate(trainloader):
        optimizer.zero_grad()
        outputs = model(inputs)
        loss = criterion(outputs, labels)
        loss.backward()
        optimizer.step()
        running_loss += loss.item()
        if i % 100 == 99:
            print(f"[Epoch {epoch + 1}, Batch {i + 1}] Loss: {running_loss / 100:.4f}")
            # Reset after every report so each printed value is the mean of
            # the last 100 batches only, not of everything since epoch start.
            running_loss = 0.0

# Evaluate the model: count correct predictions over the whole test loader.
# Switch to evaluation mode first; this network has no dropout or batch-norm
# layers, so the call is harmless here and keeps the script correct if such
# layers are added later.
model.eval()
correct = 0
total = 0
with torch.no_grad():
    for inputs, labels in testloader:
        outputs = model(inputs)
        # The index of the largest score in each row is the predicted class.
        # Gradients are already disabled, so the legacy `.data` access is not needed.
        _, predicted = torch.max(outputs, 1)
        total += labels.size(0)
        correct += (predicted == labels).sum().item()

print(f"Test Accuracy: {correct / total:.4f}")

# 安装 TensorFlow
pip install tensorflow
# 安装 PyTorch
pip install torch torchvision
# 安装 Flask
pip install flask

import cv2
import numpy as np

def preprocess_image(image_path):
    """Load an image file and turn it into a single-image batch.

    Steps: read the file with OpenCV, resize to 224x224, convert BGR to RGB,
    scale pixel values by 1/255 and prepend a batch axis.

    Args:
        image_path: Path of the image file to read.

    Returns:
        A float32 array with a leading batch axis of size 1, or None when
        any step fails (the error is printed).
    """
    try:
        # Load the image
        image = cv2.imread(image_path)
        if image is None:
            # cv2.imread reports an unreadable or missing file by returning
            # None instead of raising, so fail explicitly here.
            raise ValueError(f"无法读取图像文件：{image_path}")
        # Resize the image
        image = cv2.resize(image, (224, 224))
        # Convert BGR to RGB before scaling: dividing first would produce a
        # float64 array, a depth that cv2.cvtColor does not accept.
        image = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
        # Scale pixel values by 1/255
        # NOTE(review): Keras MobileNetV2 documents inputs scaled to [-1, 1]
        # (mobilenet_v2.preprocess_input) — confirm which range the consumer
        # of this array expects.
        image = image.astype(np.float32) / 255.0
        # Add the batch dimension
        image = np.expand_dims(image, axis=0)
        return image
    except Exception as e:
        # Broad catch kept on purpose: callers rely on None to signal failure.
        print(f"图像预处理失败：{e}")
        return None

import tensorflow as tf
import numpy as np

# Load MobileNetV2 with ImageNet weights once, at import time.
model = tf.keras.applications.MobileNetV2(weights="imagenet")

def recognize_image(image):
    """Classify *image* and return the five best ImageNet predictions.

    Returns:
        A list of dicts with keys "id" (1-based rank), "label" and "score"
        (a Python float), or None when prediction fails (the error is printed).
    """
    try:
        scores = model.predict(image)
        # decode_predictions returns one list per input sample; take the first.
        top_five = tf.keras.applications.mobilenet_v2.decode_predictions(scores, top=5)[0]
        return [
            {"id": rank, "label": label, "score": float(score)}
            for rank, (_, label, score) in enumerate(top_five, start=1)
        ]
    except Exception as e:
        print(f"图像识别失败：{e}")
        return None

from flask import Flask, render_template, request, redirect, url_for
import os
import uuid
from image_preprocessor import preprocess_image
from image_recognizer import recognize_image

# Create the Flask application.
app = Flask(__name__)
# Directory where uploaded images are saved and served from.
app.config["UPLOAD_FOLDER"] = "uploads"
# Lower-case file extensions accepted for upload.
app.config["ALLOWED_EXTENSIONS"] = {"png", "jpg", "jpeg"}

def allowed_file(filename):
    """Return True when *filename* ends in an allowed extension (case-insensitive)."""
    _, dot, extension = filename.rpartition(".")
    if not dot:
        # No "." anywhere in the name, so there is no extension to check.
        return False
    return extension.lower() in app.config["ALLOWED_EXTENSIONS"]

@app.route("/")
def index():
    """Render the index.html template for the site root."""
    page = render_template("index.html")
    return page

@app.route("/upload", methods=["POST"])
def upload():
    """Handle an image upload: save it, preprocess it, classify it, render the result.

    Requests without a usable file (missing field, empty filename, or a
    disallowed extension) are redirected to the index page. Preprocessing or
    recognition failures render result.html with an error message.
    """
    # This route only accepts POST, so redirecting to request.url would issue
    # a GET to /upload and end in 405 Method Not Allowed. Send the user back
    # to the index page instead.
    home = url_for("index")

    file = request.files.get("file")
    if file is None or file.filename == "":
        return redirect(home)
    if not allowed_file(file.filename):
        return redirect(home)

    # Store the file under a random name; only the validated extension is
    # taken from the client-supplied filename.
    extension = file.filename.rsplit(".", 1)[1].lower()
    filename = f"{uuid.uuid4()}.{extension}"
    # Create the upload folder on demand: the __main__ guard is not executed
    # when the app is started through another entry point.
    os.makedirs(app.config["UPLOAD_FOLDER"], exist_ok=True)
    image_path = os.path.join(app.config["UPLOAD_FOLDER"], filename)
    file.save(image_path)

    image = preprocess_image(image_path)
    if image is None:
        return render_template("result.html", error="图像预处理失败")
    result = recognize_image(image)
    if result is None:
        return render_template("result.html", error="图像识别失败")
    return render_template("result.html", filename=filename, result=result)

@app.route("/uploads/<filename>")
def uploaded_file(filename):
    """Send the file named *filename* from the configured upload folder."""
    from flask import send_from_directory

    upload_dir = app.config["UPLOAD_FOLDER"]
    return send_from_directory(upload_dir, filename)

if __name__ == "__main__":
    # exist_ok=True creates the upload folder only when it is missing, without
    # a separate existence check that could race with another process.
    os.makedirs(app.config["UPLOAD_FOLDER"], exist_ok=True)
    # NOTE(review): debug=True enables Flask's interactive debugger and
    # reloader; it is meant for local development only and must not be used
    # on a publicly reachable server.
    app.run(debug=True)

<!DOCTYPE html>
<html lang="zh-CN">
<head>
    <meta charset="UTF-8">
    <meta name="viewport" content="width=device-width, initial-scale=1.0">
    <title>图像识别系统</title>
    <style>
        body {
            font-family: Arial, sans-serif;
            margin: 0;
            padding: 0;
            background-color: #f5f5f5;
        }
        .container {
            max-width: 800px;
            margin: 0 auto;
            padding: 20px;
            background-color: #fff;
            border-radius: 5px;
            box-shadow: 0 0 10px rgba(0, 0, 0, 0.1);
            margin-top: 50px;
        }
        h1 {
            text-align: center;
            margin-bottom: 20px;
            color: #333;
        }
        .upload-form {
            text-align: center;
            margin-bottom: 20px;
        }
        .upload-form input[type="file"] {
            margin-bottom: 10px;
        }
        .upload-form input[type="submit"] {
            padding: 10px 20px;
            background-color: #4CAF50;
            color: #fff;
            border: none;
            border-radius: 5px;
            cursor: pointer;
        }
        .upload-form input[type="submit"]:hover {
            background-color: #45a049;
        }
        .result {
            text-align: center;
            margin-top: 20px;
        }
        .result img {
            max-width: 100%;
            height: auto;
            margin-bottom: 20px;
        }
        .result table {
            width: 100%;
            border-collapse: collapse;
            margin-bottom: 20px;
        }
        .result th, .result td {
            padding: 10px;
            border: 1px solid #ddd;
        }
        .result th {
            background-color: #f2f2f2;
            text-align: left;
        }
        .error {
            color: red;
            text-align: center;
            margin-top: 20px;
        }
    </style>
</head>
<body>
    <div class="container">
        <h1>图像识别系统</h1>
        <form class="upload-form" method="POST" enctype="multipart/form-data" action="/upload">
            <input type="file" name="file" accept="image/*"><br>
            <input type="submit" value="上传图像">
        </form>
        {% if error %} 
        <div class="error">{{ error }}</div> 
        {% endif %} 
        {% if filename %} 
        <div class="result">
            <img src="{{ url_for('uploaded_file', filename=filename) }}" alt="上传的图像">
            <table>
                <tr>
                    <th>ID</th>
                    <th>标签</th>
                    <th>置信度</th>
                </tr>
                {% for item in result %} 
                <tr>
                    <td>{{ item.id }}</td>
                    <td>{{ item.label }}</td>
                    <td>{{ item.score }}</td>
                </tr> 
                {% endfor %} 
            </table>
        </div> 
        {% endif %} 
    </div>
</body>
</html>

深度学习基础与图像识别系统开发

第四篇：深度学习基础与图像识别系统开发

学习目标

重点内容

一、深度学习基础

1.1 深度学习的基本概念

1.1.1 深度学习的重要性

1.1.2 深度学习的应用场景

1.2 深度学习的基本架构

1.2.1 神经元的基本结构

1.2.2 神经网络的基本结构

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具

1.2.3 深度学习的训练过程

二、深度学习框架介绍

2.1 TensorFlow 介绍

2.1.1 TensorFlow 的安装

2.1.2 TensorFlow 的基本使用

2.2 PyTorch 介绍

2.2.1 PyTorch 的安装

2.2.2 PyTorch 的基本使用

三、卷积神经网络（CNN）基础

3.1 卷积神经网络的基本概念

3.1.1 卷积层

3.1.2 池化层

3.1.3 全连接层

3.2 卷积神经网络的基本架构

3.2.1 LeNet-5

3.2.2 AlexNet

3.2.3 VGG

3.2.4 GoogLeNet

3.2.5 ResNet

四、图像识别模型的构建与训练

4.1 数据预处理

4.2 模型构建

4.3 模型训练

4.4 模型评估

五、实战项目：图像识别系统开发

5.1 项目需求分析

5.1.1 应用目标

5.1.2 用户需求

5.1.3 功能范围

5.2 系统架构设计

5.2.1 应用架构

5.2.2 数据存储方案

5.3 系统实现

5.3.1 开发环境搭建

5.3.2 图像预处理

5.3.3 图像识别

5.3.4 用户界面

5.3.5 前端界面

5.4 系统运行与测试

5.4.1 系统运行

六、总结

微信扫一扫，关注极客日志

更多推荐文章

相关免费在线工具