import numpy as np
import matplotlib.pyplot as plt
import h5py
from lr_utils import load_dataset

# Load the raw image arrays, their label arrays and the class-name table.
train_set_x_orig, train_set_y, test_set_x_orig, test_set_y, classes = load_dataset()

# Sample counts are read from the second axis of the label arrays;
# num_px is read from the second axis of the raw training images.
m_train = train_set_y.shape[1]
m_test = test_set_y.shape[1]
num_px = train_set_x_orig.shape[1]

print("训练集的数量: m_train = " + str(m_train))
print("测试集的数量 : m_test = " + str(m_test))
print("每张图片的宽/高 : num_px = " + str(num_px))
print("每张图片的大小 : (" + str(num_px) + ", " + str(num_px) + ", 3)")
print("训练集_图片的维数 : " + str(train_set_x_orig.shape))
print("训练集_标签的维数 : " + str(train_set_y.shape))
print("测试集_图片的维数: " + str(test_set_x_orig.shape))
print("测试集_标签的维数: " + str(test_set_y.shape))

# Flatten every training image into one row, then transpose so that each
# column holds one example.
train_set_x_flatten = train_set_x_orig.reshape(train_set_x_orig.shape[0], -1).T
# Flatten and transpose the test images the same way.
test_set_x_flatten = test_set_x_orig.reshape(test_set_x_orig.shape[0], -1).T

print("训练集降维最后的维度： " + str(train_set_x_flatten.shape))
print("训练集_标签的维数 : " + str(train_set_y.shape))
print("测试集降维之后的维度: " + str(test_set_x_flatten.shape))
print("测试集_标签的维数 : " + str(test_set_y.shape))

# Preview one training image and print its label together with the class name.
index = 11
plt.imshow(train_set_x_orig[index])
print("y = " + str(train_set_y[:, index]) + ", it's a '" + classes[np.squeeze(train_set_y[:, index])].decode(
    "utf-8") + "' picture.")

# Scale the flattened data by 255.
# NOTE(review): presumably the pixels are 8-bit values, so this maps them to
# [0, 1] — confirm against load_dataset.
train_set_x = train_set_x_flatten / 255
test_set_x = test_set_x_flatten / 255

def sigmoid(z):
    """Return the logistic function ``1 / (1 + exp(-z))`` of ``z``.

    ``z`` may be a scalar or a NumPy array; ``np.exp`` is applied
    element-wise, so the result has the same shape as the input.
    """
    denominator = 1 + np.exp(-z)
    return 1 / denominator

def initialize_with_zeros(dim):
    """Create zero-valued starting parameters.

    Args:
        dim: number of rows of the weight column vector.

    Returns:
        A tuple ``(w, b)`` where ``w`` is a ``(dim, 1)`` array of zeros and
        ``b`` is the integer ``0``.
    """
    weights = np.zeros((dim, 1))
    bias = 0

    # Sanity checks on the freshly created parameters.
    assert weights.shape == (dim, 1)  # w must be a (dim, 1) column vector
    assert isinstance(bias, (float, int))  # b must be a float or an int

    return weights, bias

def propagate(w, b, X, Y):
    """Run one forward and backward pass of logistic regression.

    Args:
        w: weight array; ``w.T`` is multiplied with ``X`` and the returned
            ``dw`` is asserted to have the same shape as ``w``.
        b: bias added to ``np.dot(w.T, X)``.
        X: input data; ``X.shape[1]`` is used as the number of examples.
        Y: labels, combined element-wise with the activations.

    Returns:
        A tuple ``(grads, cost)`` where ``grads`` is a dict with the keys
        ``"dw"`` and ``"db"`` and ``cost`` is the cross-entropy cost as a
        0-d value.
    """
    m = X.shape[1]

    # Forward pass.
    A = sigmoid(np.dot(w.T, X) + b)
    # When the sigmoid saturates to exactly 0 or 1, np.log would yield -inf
    # and the cost would become nan/inf. Clip the activations for the cost
    # computation only; the gradients below still use the raw activations.
    eps = 1e-15
    A_safe = np.clip(A, eps, 1 - eps)
    cost = (-1 / m) * np.sum(Y * np.log(A_safe) + (1 - Y) * np.log(1 - A_safe))

    # Backward pass.
    dw = (1 / m) * np.dot(X, (A - Y).T)
    db = (1 / m) * np.sum(A - Y)

    # Sanity checks on the computed values.
    assert dw.shape == w.shape
    assert db.dtype == float
    cost = np.squeeze(cost)
    assert cost.shape == ()

    # Bundle the gradients in a dictionary.
    grads = {
        "dw": dw,
        "db": db,
    }
    return grads, cost

def optimize(w, b, X, Y, num_iterations, learning_rate, print_cost=False):
    """Fit ``w`` and ``b`` with plain gradient descent.

    Args:
        w: initial weights, passed to ``propagate``.
        b: initial bias, passed to ``propagate``.
        X: input data, passed to ``propagate``.
        Y: labels, passed to ``propagate``.
        num_iterations: number of gradient-descent steps to run.
        learning_rate: step size multiplied with each gradient.
        print_cost: when true, print the cost every 100 iterations.

    Returns:
        A tuple ``(params, grads, costs)``:
        ``params`` is a dict with the final ``"w"`` and ``"b"``;
        ``grads`` is a dict with the last computed ``"dw"`` and ``"db"``
        (both ``None`` when ``num_iterations`` is 0);
        ``costs`` is the list of costs recorded every 100 iterations.
    """
    costs = []
    # Bind the gradients up front so the return value can be built even when
    # the loop body never runs (num_iterations == 0).
    dw, db = None, None

    for i in range(num_iterations):
        grads, cost = propagate(w, b, X, Y)

        dw = grads["dw"]
        db = grads["db"]

        # Gradient-descent update.
        w = w - learning_rate * dw
        b = b - learning_rate * db

        if i % 100 == 0:
            # Record the cost, and optionally report it.
            costs.append(cost)
            if print_cost:
                print("迭代的次数: %i ， 误差值： %f" % (i, cost))

    params = {
        "w": w,
        "b": b,
    }
    grads = {
        "dw": dw,
        "db": db,
    }
    return params, grads, costs

def predict(w, b, X):
    """Predict binary labels (0.0 or 1.0) with learned parameters.

    Args:
        w: weights; reshaped to ``(X.shape[0], 1)`` before use.
        b: bias added to ``np.dot(w.T, X)``.
        X: input data; ``X.shape[1]`` is the number of examples.

    Returns:
        A ``(1, m)`` float array holding 1.0 where the sigmoid activation is
        strictly greater than 0.5 and 0.0 elsewhere.
    """
    m = X.shape[1]  # number of examples
    w = w.reshape(X.shape[0], 1)

    # Activation for every example, shape (1, m).
    A = sigmoid(np.dot(w.T, X) + b)

    # Threshold all activations at once instead of looping element by element.
    Y_prediction = (A > 0.5).astype(float)

    assert Y_prediction.shape == (1, m)

    return Y_prediction

def model(X_train, Y_train, X_test, Y_test, num_iterations=2000, learning_rate=0.5, print_cost=False):
    """Train a logistic-regression classifier and report its accuracy.

    Args:
        X_train: training inputs; ``X_train.shape[0]`` sets the weight size.
        Y_train: training labels.
        X_test: test inputs.
        Y_test: test labels.
        num_iterations: number of gradient-descent steps.
        learning_rate: gradient-descent step size.
        print_cost: forwarded to ``optimize`` to print the cost periodically.

    Returns:
        A dict with the keys ``"costs"``, ``"Y_prediction_test"``,
        ``"Y_prediction_train"``, ``"w"``, ``"b"``, ``"learning_rate"`` and
        ``"num_iterations"``. The misspelled key ``"Y_prediciton_train"`` is
        also present as an alias, for callers written against the old name.
    """
    w, b = initialize_with_zeros(X_train.shape[0])

    parameters, grads, costs = optimize(w, b, X_train, Y_train, num_iterations, learning_rate, print_cost)

    # Retrieve the learned parameters.
    w, b = parameters["w"], parameters["b"]

    # Predict on the test and training sets.
    Y_prediction_test = predict(w, b, X_test)
    Y_prediction_train = predict(w, b, X_train)

    # Report accuracy as 100 minus the mean absolute prediction error (in %).
    print("训练集准确性：", format(100 - np.mean(np.abs(Y_prediction_train - Y_train)) * 100), "%")
    print("测试集准确性：", format(100 - np.mean(np.abs(Y_prediction_test - Y_test)) * 100), "%")

    d = {
        "costs": costs,
        "Y_prediction_test": Y_prediction_test,
        "Y_prediction_train": Y_prediction_train,
        # Historical misspelling kept so existing lookups keep working.
        "Y_prediciton_train": Y_prediction_train,
        "w": w,
        "b": b,
        "learning_rate": learning_rate,
        "num_iterations": num_iterations,
    }
    return d

# Train once with a fixed learning rate, printing the cost as training runs.
d = model(train_set_x, train_set_y, test_set_x, test_set_y, num_iterations=2000, learning_rate=0.005, print_cost=True)

# Plot the recorded costs of that run.
costs = np.squeeze(d['costs'])
plt.plot(costs)
plt.ylabel('cost')
plt.xlabel('iterations (per hundreds)')
plt.title("Learning rate =" + str(d["learning_rate"]))
plt.show()

# Train one model per learning rate, keyed by the rate's string form.
learning_rates = [1, 0.01, 0.006, 0.0003, 0.001, 0.0006]
models = {}
for i in learning_rates:
    print("learning rate is: " + str(i))
    models[str(i)] = model(train_set_x, train_set_y, test_set_x, test_set_y, num_iterations=1500, learning_rate=i,
                           print_cost=False)
    print('\n' + "-------------------------------------------------------" + '\n')

# Draw every model's cost curve on the same axes for comparison.
for i in learning_rates:
    plt.plot(np.squeeze(models[str(i)]["costs"]), label=str(models[str(i)]["learning_rate"]))

plt.ylabel('cost')
plt.xlabel('iterations')

legend = plt.legend(loc='upper center', shadow=True)
frame = legend.get_frame()
frame.set_facecolor('0.90')
plt.show()

【文档要求】

1.尝试不同的学习率（至少三种），观察不同学习率下随着迭代次数的增加损失值的变化

请粘贴不同学习率下损失的变化曲线图像:

这里我首先打印了一下训练集的内容：

接着对模型进行训练，并打印不同学习率下损失的变化曲线图像：

在这里我分析了五种学习率，分别是0.01、0.006、0.0003、0.001、0.0006。可以看到，学习率过低或者过高都会对模型的拟合效果产生一定的影响：学习率过大会导致模型不收敛，过小则会导致模型收敛特别慢甚至无法学习。
2.分析不同的学习率对模型准确率的影响及原因，如何选择合适的学习率。

一般在选取最优学习率时，可以先在一个较粗略的范围内选取多个学习率进行尝试，把它们的损失曲线画在同一张图上，观察哪个区间内的学习率效果最好，然后在这个区间内进行较精确的调参，再观察其效果，这是一个不断缩小范围的过程。并且所处位置不同，对应的合适步长也不同，具体可以使用余弦退火的方式改变学习率的大小；或者以非常低的学习率开始训练，并在每次迭代中线性增加它，当损失函数开始急剧增加时停止训练，记录每次迭代的学习率和损失，最后找到一个合理的学习率。

初学人工智能导论，可能存在错误之处，还请各位不吝赐教。

限于篇幅，本文相关实验工程无法在文中展示出来，现已将资源上传，可自行下载。

山东大学人工智能导论实验3工程文件-Logistic回归分类器识别猫-机器学习文档类资源-CSDN下载山东大学人工智能导论实验3工程文件-Logistic回归分类器识别猫详解博客地址：https://更多下载资源、学习资料请访问CSDN下载频道. 山东大学人工智能导论实验三 Logistic回归分类器识别猫 https://download.csdn.net/download/m0_52316372/85913095 ;

Original: https://blog.csdn.net/m0_52316372/article/details/125626670
Author: timerring
Title: 山东大学人工智能导论实验三 Logistic回归分类器识别猫

原创文章受到原创版权保护。转载请注明出处：https://www.johngo689.com/626681/

转载文章受原作者版权保护。转载请注明原作者出处！

人工智能

【自取】最近整理的，有需要可以领取学习：

Linux核心资料大放送~

全栈面试题汇总（持续更新&可下载）

一个提高学习100%效率的工具！

【超详细】深度学习面试题目！

LeetCode Python刷题答案下载！

LeetCode Java版刷题答案下载！

LeetCode C++ 版本，抓紧保存！

LeetCode GO语言刷题答案下载！

语义分割之FCN网络详解全卷积网络

1. FCN网络结构图原论文链接：https://paperswithcode.com/paper/fully-convolutional-networks-for-semant…

人工智能 2023年7月13日
0048
【数据挖掘】任务2：医学数据库MIMIC-III数据处理

要求本次任务的目的是处理PO2，PCO2两个指标。这两个指标均为病人的血气指标，以一定的时间间隔采集。一个病人一次住院期间可能收集一次或者多次。要求，按照采集时间的前后顺序，汇总…

人工智能 2023年7月7日
0066
简单记一次pip install opencv-python报错

这里写自定义目录标题 pip install opencv-python * 使用命令前提命令出现问题问题解决 pip install opencv-python 因为下载的…

人工智能 2023年6月19日
0079
NV12等常用YUV数据格式

NV12等常用YUV数据格式 1. YUV 采样表示法 2. YUV 格式 3. 数据格式 * 3.1 4:4:4 格式 3.2 4:2:2 格式 3.3 4:2:0 格式 4. …

人工智能 2023年7月27日
00120
计算机工程投稿到录用

计算机核心期刊投稿经验前期准备 * 检查自己的稿件计算机工程期刊为例前期准备本人是个学术垃圾，研一下学期才找到自己的研究方向，在写好了论文后，经历了多次期刊拒稿。在多次拒稿…

人工智能 2023年6月25日
00100
Python员工离职数据分析

Python员工离职数据分析 import pandas as pd import seaborn as sns import matplotlib.pyplot as plt i…

人工智能 2023年7月9日
0056
外卖项目01—软件开发整体介绍

目录一、软件开发整体介绍 03 1.1软件开发流程 03 1.2角色分工 1.3软件环境二、外卖项目介绍 04 2.1项目介绍 2.2产品原型展示 2.3技术选型 2.4功能架…

人工智能 2023年6月29日
0053
2022-2028中国Tableau咨询服务市场现状研究分析与发展前景预测报告

【报告篇幅】：95【报告图表数】：137【报告出版时间】：2022年2月报告摘要本文研究中国市场Tableau咨询服务现状及未来发展趋势，侧重分析在中国市场扮演重要角色的企业，…

人工智能 2023年7月18日
0044
python导入Graphviz库-画决策树图

学习决策树时，发现如果要用python画决策树，python需要导入Graphviz库，看了几篇csdn，发现个别文章不是很全，会出错误，这里简单记录下完整过程。文章目录 0.下…

人工智能 2023年6月15日
0088
时序分析28 – 时序预测格兰杰因果关系(中) python实践1

时序分析28 – 时序预测 – 格兰杰因果关系(中) Python 实践 1 上一篇文章我们介绍了格兰杰因果关系的基本概念、背景以及相关统计检验法。本篇文章…

人工智能 2023年7月7日
0074
小波时频图和CNN(卷积神经网络的）脑电分类技术研究

在这里我们可以用matlab进行时频图的绘制得到了时频图后，可以输入到卷积神经网络进行训练和技术研究小波基和尺度后，就可以用cwt求小波系数coefs（系数是复数时要取模），然…

人工智能 2023年6月30日
0096
在AI算法中，如何评估和优化模型的性能

问题：如何评估和优化AI模型的性能？介绍在AI领域中，评估和优化模型的性能是非常关键的步骤。通过评估模型的性能，我们可以了解其在现实场景中的表现如何，并且根据评估结果对模型进行…

人工智能 2024年1月3日
0042
Two-pass连通域标记方法与opencv代码实现

连通域是指图像中具有相同像素值且位置相邻的前景像素点组成的图像区域，一般使用二值图像表示。连通标记是指将图像中的各个连通区域找出并标记为相应的标号。 Two-Pass（两遍扫描法） …

人工智能 2023年7月20日
0051
Anacoda + pytorch 环境下安装 DGL_GPU

首先假设您已安装了 pytorch 虚拟环境在 cmd 中输入命令查看 cuda 版本 nvcc –version 打开 https://www.dgl.ai/pages/st…

人工智能 2023年7月22日
00383
TextBrewer之文本情感分类代码

文章目录 * – + 题目 + 前言 + TextBrewer + * Main Features * Architecture And Design * FAQ * …

人工智能 2023年5月27日
0078
OpenCV中使用类VideoCapture加载视频和打开摄像头

OpenCV用类VideoCapture实现视频读取的相关操作。 VideoCapture类的构造函数有三种原型，分别如下：C++原型如下： cv::VideoCapture::V…

人工智能 2023年6月20日
0084

2024 年 5 月
一	二	三	四	五	六	日
		1	2	3	4	5
6	7	8	9	10	11	12
13	14	15	16	17	18	19
20	21	22	23	24	25	26
27	28	29	30	31

山东大学人工智能导论实验三 Logistic回归分类器识别猫

1.datasets/train_catvnoncat.h5

2.datasets/ test_catvnoncat.h5

3.lr_utils.py中有加载数据集的函数

大家都在看