import pandas as pd
import pymysql
# Connect to the MySQL database.
# NOTE(review): the credentials are hard-coded here; consider loading them
# from the environment or a config file rather than keeping them in source.
connection = pymysql.connect(host='localhost',
                             user='root',
                             password='password',
                             database='ecommerce')
try:
    # Load every row of the `orders` table into a DataFrame.
    # NOTE(review): pandas documents SQLAlchemy connectables (and sqlite3
    # connections) for `con`; a raw pymysql connection may emit a UserWarning.
    query = "SELECT * FROM orders"
    orders_df = pd.read_sql(query, connection)
finally:
    # Always release the connection, even if the query raises; the data is
    # already in memory once read_sql returns.
    connection.close()
# Show the first few rows.
print(orders_df.head())
# --- end of data-loading snippet (stray "]]>" CDATA terminator removed) ---
# Fill missing values in the `amount` column with the column mean.
# The result is assigned back to the column instead of calling
# `fillna(..., inplace=True)` on the selected column: that chained in-place
# form operates on an intermediate object and does not update `orders_df`
# when pandas Copy-on-Write is enabled.
orders_df['amount'] = orders_df['amount'].fillna(orders_df['amount'].mean())
# Print the number of missing values remaining in each column.
print(orders_df.isnull().sum())
# --- end of missing-value snippet (stray "]]>" CDATA terminator removed) ---
# Total sales per product category: group the order rows by
# `product_category`, then sum the `amount` column within each group.
_amount_by_category = orders_df.groupby('product_category')['amount']
product_sales = _amount_by_category.sum()
# Print the per-category totals.
print(product_sales)
# --- end of aggregation snippet (stray "]]>" CDATA terminator removed) ---