分析下列代码：import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel("E:\\爬取\\爬取.xls") year_count = data.groupby(by="年份")["年份"].count() data['年份'] = pd.to_numeric(data['年份'], errors='coerce') plt.rcParams["font.sans-serif"] = ["SimHei"] plt.rcParams['axes.unicode_minus'] = False plt.plot(year_count.index, year_count.values) plt.title("电影年份发展折线图") plt.xlabel("年份") plt.ylabel("数量") plt.show() import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel("E:\\爬取\\爬取.xls") plt.rcParams["font.sans-serif"] = ["SimHei"] plt.rcParams['axes.unicode_minus'] = False year_count = data['国家'].value_counts() plt.bar(year_count.index, year_count.values) plt.title("各个国家电影数量") plt.xlabel("国家") plt.ylabel("电影数量") plt.show() import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel("E:\\爬取\\爬取.xls") plt.rcParams["font.sans-serif"] = ["SimHei"] plt.rcParams['axes.unicode_minus'] = False type_count = data["类型"].value_counts() plt.pie(type_count,labels=type_count.index,pctdistance=0.8,autopct='%1.1f%%',explode=[0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.1,0.01]) plt.figure(figsize=(20,6.5)) plt.title("电影主要类型分布图") plt.show() import pandas as pd import matplotlib.pyplot as plt data = pd.read_excel("E:\\爬取\\爬取.xls") scores = data["排名"].values votes = data["评价人数"].values plt.rcParams["font.sans-serif"] = ["SimHei"] plt.scatter(scores, votes) plt.title("排名与评价人数散点图") plt.xlabel("排名") plt.ylabel("评价人数") plt.show()

时间: 2024-04-28 14:27:09 浏览: 148

这段代码主要是用来对爬取到的电影数据进行数据可视化的处理。在代码中使用了 pandas 库对 Excel 数据进行读取和处理，使用了 matplotlib 库来绘制各种图表。第一个代码块绘制了电影年份的发展折线图，其中先对年份进行了分组统计，然后使用 plot 函数将结果绘制出来。第二个代码块绘制了各个国家电影数量的柱状图，其中使用了 value_counts 函数对国家进行统计，然后使用 bar 函数将结果绘制出来。第三个代码块绘制了电影主要类型分布的饼图，其中使用了 value_counts 函数对电影类型进行统计，然后使用 pie 函数将结果绘制出来。第四个代码块绘制了排名与评价人数的散点图，其中使用了 scatter 函数将排名和评价人数进行散点绘制。

import tkinter as tk import pandas as pd import matplotlib.pyplot as plt from matplotlib.backends.backend_tkagg import FigureCanvasTkAgg import os class ExcelPlotter(tk.Frame): def init(self, master=None): super().init(master) self.master = master self.master.title("图方便") self.file_label = tk.Label(master=self, text="Excel File Path:") self.file_label.grid(row=0, column=0, sticky="w") self.file_entry = tk.Entry(master=self) self.file_entry.grid(row=0, column=1, columnspan=2, sticky="we") self.file_button = tk.Button(master=self, text="Open", command=self.open_file) self.file_button.grid(row=0, column=3, sticky="e") self.plot_button = tk.Button(master=self, text="Plot", command=self.plot_data) self.plot_button.grid(row=1, column=2, sticky="we") self.name_label = tk.Label(master=self, text="Out Image Name:") self.name_label.grid(row=2, column=0, sticky="w") self.name_entry = tk.Entry(master=self) self.name_entry.grid(row=2, column=1, columnspan=2, sticky="we") self.save_button = tk.Button(master=self, text="Save", command=self.save_image) self.save_button.grid(row=2, column=3, sticky="e") self.figure = plt.figure(figsize=(5, 4), dpi=150) self.canvas = FigureCanvasTkAgg(self.figure, master=self) self.canvas.get_tk_widget().grid(row=4, column=0, columnspan=4, sticky="we") self.pack() def open_file(self): file_path = tk.filedialog.askopenfilename(filetypes=[("Excel Files", "*.xls")]) self.file_entry.delete(0, tk.END) self.file_entry.insert(tk.END, file_path) def plot_data(self): file_path = self.file_entry.get() if os.path.exists(file_path): data = pd.read_excel(file_path) plt.plot(data['波长(nm)'], data['吸光度'], 'k') plt.xlim(300, 1000) plt.xlabel('Wavelength(nm)', fontsize=16) plt.ylabel('Abs.', fontsize=16) plt.gcf().subplots_adjust(left=0.13, top=0.91, bottom=0.16) plt.savefig('Last Fig', dpi=1000) plt.show() def save_image(self): if self.figure: file_path = tk.filedialog.asksaveasfilename(defaultextension=".png") if file_path: self.figure.savefig(file_path) root = tk.Tk() app = ExcelPlotter(master=root) app.mainloop()帮我增加一个删除当前图像的功能

好的，您可以在 `ExcelPlotter` 类中添加一个名为 `delete_image` 的方法，实现删除当前图像的功能。可以在该方法中调用 `self.figure.clf()` 清空当前图像，然后在界面上更新显示。下面是修改后的代码： ```python import tkinter as tk import pandas as pd import matplotlib.pyplot as plt from matplotlib.backends.backend_tkagg import FigureCanvasTkAgg import os class ExcelPlotter(tk.Frame): def __init__(self, master=None): super().__init__(master) self.master = master self.master.title("图方便") self.file_label = tk.Label(master=self, text="Excel File Path:") self.file_label.grid(row=0, column=0, sticky="w") self.file_entry = tk.Entry(master=self) self.file_entry.grid(row=0, column=1, columnspan=2, sticky="we") self.file_button = tk.Button(master=self, text="Open", command=self.open_file) self.file_button.grid(row=0, column=3, sticky="e") self.plot_button = tk.Button(master=self, text="Plot", command=self.plot_data) self.plot_button.grid(row=1, column=2, sticky="we") self.delete_button = tk.Button(master=self, text="Delete", command=self.delete_image) self.delete_button.grid(row=1, column=3, sticky="e") self.name_label = tk.Label(master=self, text="Out Image Name:") self.name_label.grid(row=2, column=0, sticky="w") self.name_entry = tk.Entry(master=self) self.name_entry.grid(row=2, column=1, columnspan=2, sticky="we") self.save_button = tk.Button(master=self, text="Save", command=self.save_image) self.save_button.grid(row=2, column=3, sticky="e") self.figure = plt.figure(figsize=(5, 4), dpi=150) self.canvas = FigureCanvasTkAgg(self.figure, master=self) self.canvas.get_tk_widget().grid(row=4, column=0, columnspan=4, sticky="we") self.pack() def open_file(self): file_path = tk.filedialog.askopenfilename(filetypes=[("Excel Files", "*.xls")]) self.file_entry.delete(0, tk.END) self.file_entry.insert(tk.END, file_path) def plot_data(self): file_path = self.file_entry.get() if os.path.exists(file_path): data = pd.read_excel(file_path) plt.plot(data['波长(nm)'], data['吸光度'], 'k') plt.xlim(300, 1000) plt.xlabel('Wavelength(nm)', fontsize=16) plt.ylabel('Abs.', fontsize=16) plt.gcf().subplots_adjust(left=0.13, top=0.91, bottom=0.16) plt.show() def delete_image(self): if self.figure: self.figure.clf() self.canvas.draw() def save_image(self): if self.figure: file_path = tk.filedialog.asksaveasfilename(defaultextension=".png") if file_path: self.figure.savefig(file_path) root = tk.Tk() app = ExcelPlotter(master=root) app.mainloop() ``` 在界面上添加了一个名为 `Delete` 的按钮，点击该按钮会调用 `delete_image` 方法。该方法会清空当前图像并在界面上更新显示。

import numpy as np import pandas as pd import matplotlib.pyplot as plt from sklearn import linear_model, metrics plt.rcParams['font.sans-serif'] = 'SimHei' sheet = pd.read_excel(".//人均消费金额与人均国民收入.xls", 'sheet1') print(sheet.values) x_data = sheet.values[:, 1] y_data = sheet.values[:, 2] X_data = x_data[:, np.newaxis] Y_data = y_data[:, np.newaxis] LR = linear_model.LinearRegression() LR.fit(X_data, Y_data) # 进行训练 w = LR.coef_ # 获得回归系数权重向量 b = LR.intercept_ # 获得截距 y_fit = np.dot(X_data, w) + b # 数据拟合:等同LR.predict(x_data) MSE = metrics.mean_squared_error(Y_data, y_fit) # ------（3）评估指标：均方误差 ------------------- R2 = metrics.r2_score(Y_data, y_fit) # 评估指标：R2（决定系数分数） plt.figure(figsize=(8, 5)) plt.title('人均国民收入与人均消费金额 (R2=' + str(round(R2, 4)) + ")") plt.xlabel('人均国民收入 x (元)', fontsize=15) plt.ylabel('人均消费金额 y (元)', fontsize=15) plt.scatter(x_data, y_data, color='r', marker='o') plt.scatter(x_data, y_fit, color='b', marker='s') plt.plot(x_data, y_fit, color='g', linestyle='-') d = '回归方程 = ' + str(round(w[0, 0], 4)) + ' * x + ' + str(round(b[0], 2)) plt.legend([d, '红色：散点图', '蓝色：拟合点']) plt.show()

这段代码实现了利用线性回归模型拟合“人均国民收入”与“人均消费金额”之间的关系，并进行可视化展示。具体来说，代码的执行过程如下： 1. 读取名为“人均消费金额与人均国民收入.xls”、工作表名为“sheet1”的 Excel 文件，并将其转换成 Pandas DataFrame 格式的数据。 2. 从 DataFrame 中提取出“人均国民收入”和“人均消费金额”两列数据，并将其分别存储在 x_data 和 y_data 数组中。 3. 将 x_data 和 y_data 数组转换为二维数组 X_data 和 Y_data，其中 X_data 和 Y_data 分别对应于自变量和因变量。 4. 创建 LinearRegression 类的实例 LR，并使用 fit() 方法对 X_data 和 Y_data 进行线性回归模型的训练。 5. 获取回归系数权重向量 w 和截距 b。 6. 通过 np.dot() 函数将 X_data 和 w 相乘，并加上 b，得到拟合后的 y 值 y_fit。 7. 使用 mean_squared_error() 函数计算均方误差 MSE，并使用 r2_score() 函数计算决定系数分数 R2。 8. 使用 matplotlib 库创建画布，并添加标题、横坐标、纵坐标等信息。同时，使用 scatter() 函数绘制散点图，并使用 plot() 函数绘制拟合曲线。 9. 使用 legend() 函数添加图例，其中包括回归方程、散点图和拟合点。 10. 使用 show() 函数展示可视化结果。

阅读全文

相关推荐

用户用电量数据data.rar

Pandas+Matplotlib 箱式图异常值分析示例

解决Python pandas df 写入excel 出现的问题

对文件profit.xls中的盈利数据做出 帕累托图（帕累托图的定义可百度），用matplotlib.pyplot作图，写出代码。

用python matplotlib读取E:\爬取\爬取.xls文件，画售价分布的密度图，不要负数坐标

用python matplotlib读取E:\\爬取\\爬取.xls文件，画文件前五条数据的标题预售价(标题去掉括号)的雷达图

代码编写：使用Python matplotlib读取"E:\爬取\电影数据.xls"文件画关于电影类型的饼图

大家在看

使用Arduino监控ECG和呼吸-项目开发

航空发动机缺陷检测数据集VOC+YOLO格式291张4类别.7z

python基础教程：pandas DataFrame 行列索引及值的获取的方法

【微电网优化】基于粒子群优化IEEE经典微电网结构附matlab代码.zip

三层神经网络模型matlab版

最新推荐

基于Andorid的音乐播放器项目改进版本设计.zip

uniapp-machine-learning-from-scratch-05.rar

Cyclone IV硬件配置详细文档解析

【WinCC与Excel集成秘籍】：轻松搭建数据交互桥梁（必读指南）

华为模拟互联地址配置

Java游戏开发简易实现与地图控制教程

【超市销售数据深度分析】：从数据库挖掘商业价值的必经之路

在ubuntu中安装ros时出现updating datebase of manual pages...怎么解决

Laravel Monobullet Monolog处理与Pushbullet API通知集成

【超市库存管理优化手册】：数据库层面的解决方案

对文件profit.xls中的盈利数据做出帕累托图（帕累托图的定义可百度），用matplotlib.pyplot作图，写出代码。