459 lines
52 KiB
Plaintext
459 lines
52 KiB
Plaintext
{
|
|
"cells": [
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 13,
|
|
"id": "9daadf20-caa6-4b25-901c-6cc3ef563f58",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
"(255, 28)\n",
|
|
"(78, 4)\n",
|
|
"(255, 31)\n",
|
|
" ds NHITS Informer LSTM iTransformer TSMixer \\\n",
|
|
"0 2024-10-08 79.76823 80.197660 79.802414 78.391460 80.200510 \n",
|
|
"1 2024-10-09 78.75903 80.235740 79.844154 78.888565 79.861180 \n",
|
|
"2 2024-10-10 79.43970 80.186230 79.885100 79.488700 79.483086 \n",
|
|
"3 2024-10-11 79.62268 80.502975 79.878560 79.406670 79.313965 \n",
|
|
"4 2024-10-14 79.91698 80.931946 79.936270 79.758575 79.197430 \n",
|
|
"\n",
|
|
" TSMixerx PatchTST RNN GRU ... y \\\n",
|
|
"0 79.243256 80.883450 80.836105 81.276060 ... 77.180000 \n",
|
|
"1 78.068150 80.950096 80.917860 81.303505 ... 76.580002 \n",
|
|
"2 77.189064 80.347400 80.866040 81.798050 ... 79.400002 \n",
|
|
"3 77.840096 80.545296 81.167710 81.552810 ... 79.040001 \n",
|
|
"4 77.904300 81.432976 81.144210 81.483215 ... 77.459999 \n",
|
|
"\n",
|
|
" min_within_quantile max_within_quantile id CREAT_DATE min_price \\\n",
|
|
"0 80.200510 81.163630 51 2024-10-07 79.848624 \n",
|
|
"1 79.861180 81.757850 52 2024-10-07 79.981211 \n",
|
|
"2 79.483086 81.190400 53 2024-10-07 79.398409 \n",
|
|
"3 79.313965 81.371100 54 2024-10-07 79.394607 \n",
|
|
"4 79.197430 81.432976 55 2024-10-07 79.351007 \n",
|
|
"\n",
|
|
" max_price 序号 LOW_PRICE HIGH_PRICE \n",
|
|
"0 81.848624 52.0 76.36 81.14 \n",
|
|
"1 81.981211 51.0 75.15 78.02 \n",
|
|
"2 81.398409 50.0 76.72 79.72 \n",
|
|
"3 81.394607 49.0 78.04 79.50 \n",
|
|
"4 81.351007 48.0 74.86 78.55 \n",
|
|
"\n",
|
|
"[5 rows x 31 columns]\n",
|
|
" ds NHITS Informer LSTM iTransformer TSMixer \\\n",
|
|
"250 2024-12-16 74.268654 73.333750 73.090164 74.007034 74.36094 \n",
|
|
"251 2024-12-17 74.724630 73.373810 73.242540 74.285530 74.24597 \n",
|
|
"252 2024-12-18 74.948860 73.505330 73.400400 74.260290 74.06419 \n",
|
|
"253 2024-12-19 74.396740 73.934380 73.764320 74.429800 74.18059 \n",
|
|
"254 2024-12-20 73.882930 73.700935 73.769050 73.977585 73.97370 \n",
|
|
"\n",
|
|
" TSMixerx PatchTST RNN GRU ... y min_within_quantile \\\n",
|
|
"250 74.67781 74.475680 75.63023 74.853800 ... NaN 74.157196 \n",
|
|
"251 74.46460 74.628000 75.22519 74.957530 ... NaN 73.711680 \n",
|
|
"252 74.32628 74.656815 75.49716 74.890236 ... NaN 74.064190 \n",
|
|
"253 74.41026 74.698875 75.87007 75.118866 ... NaN 74.148070 \n",
|
|
"254 74.49235 74.345410 75.88466 75.186325 ... NaN 73.816990 \n",
|
|
"\n",
|
|
" max_within_quantile id CREAT_DATE min_price max_price 序号 \\\n",
|
|
"250 74.576454 301 2024-12-16 73.416857 75.416857 3.0 \n",
|
|
"251 74.948060 302 2024-12-16 73.434301 75.434301 2.0 \n",
|
|
"252 75.200980 303 2024-12-16 73.707471 75.707471 1.0 \n",
|
|
"253 75.395440 304 2024-12-16 73.639791 75.639791 NaN \n",
|
|
"254 74.345410 305 2024-12-16 73.067399 75.067399 NaN \n",
|
|
"\n",
|
|
" LOW_PRICE HIGH_PRICE \n",
|
|
"250 72.53 73.28 \n",
|
|
"251 72.48 74.18 \n",
|
|
"252 72.80 74.20 \n",
|
|
"253 NaN NaN \n",
|
|
"254 NaN NaN \n",
|
|
"\n",
|
|
"[5 rows x 31 columns]\n"
|
|
]
|
|
}
|
|
],
|
|
"source": [
|
|
"import sqlite3\n",
|
|
"import os\n",
|
|
"import pandas as pd\n",
|
|
"\n",
|
"# Folder (relative to the working directory) that holds the inputs and receives the exports.\n",
"dataset = r'yuanyoudataset'\n",
"# dataset = r'C:\\Users\\Administrator\\Desktop'\n",
"\n",
"# Disabled alternative source for the forecast prices: the `accuracy` table of a SQLite database.\n",
"# dbfilename = os.path.join(r'D:\\code\\PriceForecast\\yuanyoudataset','jbsh_yuanyou.db')\n",
"# conn = sqlite3.connect(dbfilename)\n",
"# query = 'SELECT * FROM accuracy'\n",
"# df1 = pd.read_sql_query(query, conn)\n",
"# df1['ds'] = df1['PREDICT_DATE']\n",
"# conn.close()\n",
"# print(df1.shape)\n",
"\n",
"# Forecast price data.\n",
"dfcsvfilename = os.path.join(dataset,'accuracy_five_mean.csv')\n",
"df1 = pd.read_csv(dfcsvfilename)\n",
"print(df1.shape)\n",
"\n",
"# Actual high / low prices. The first five rows of the sheet are skipped and the\n",
"# Chinese column headers are renamed to the names used in the rest of the notebook.\n",
"xlsfilename = os.path.join(dataset,'数据项下载.xls')\n",
"df2 = pd.read_excel(xlsfilename)[5:].rename(\n",
"    columns={'数据项名称':'ds','布伦特最低价':'LOW_PRICE','布伦特最高价':'HIGH_PRICE'}\n",
")\n",
"print(df2.shape)\n",
"\n",
"# Left-join the actual prices onto the forecasts by `ds`, then parse `ds` as datetime.\n",
"# df['PREDICT_DATE'] = pd.to_datetime(df['PREDICT_DATE'])\n",
"df = (\n",
"    df1.merge(df2, on=['ds'], how='left')\n",
"    .assign(ds=lambda merged: pd.to_datetime(merged['ds']))\n",
"    .reindex()\n",
")\n",
"print(df.shape)\n",
"\n",
"# Export a snapshot of the merged frame; the file name carries the current Unix timestamp.\n",
"# from datetime import datetime\n",
"import time\n",
"df.to_csv(os.path.join(dataset,f'预测数据-{time.time()}.csv'))\n",
"# df = df[['ds','min_within_quantile','max_within_quantile']]\n",
"\n",
"# Print the first and last rows of the merged frame.\n",
"print(df.head())\n",
"print(df.tail())\n"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 14,
|
|
"id": "0d77ab7d",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": [
|
"# Forecast band from the mean of the top-five evaluated models: the columns at positions 1-5\n",
"# are averaged row-wise (presumably the five best models -- confirm against the column order\n",
"# of the input CSV), then widened by 1.5 on each side.\n",
"top5_mean = df.iloc[:,1:6].mean(axis=1)\n",
"df['min_price'] = top5_mean - 1.5\n",
"df['max_price'] = top5_mean + 1.5"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 15,
|
|
"id": "e51c3fd0-6bff-45de-b8b6-971e7986c7a7",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-09-27 2024-10-04 0\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-09-27 2024-10-04 0\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-09-27 2024-10-04 0\n"
|
|
]
|
|
},
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-09-27 2024-10-04 0\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-09-27 2024-10-04 0\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-04 2024-10-11 0.433988\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-04 2024-10-11 0.433988\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-04 2024-10-11 0.433988\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-04 2024-10-11 0.433988\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-04 2024-10-11 0.433988\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-11 2024-10-18 0.367557\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-11 2024-10-18 0.367557\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-11 2024-10-18 0.367557\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-11 2024-10-18 0.367557\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-11 2024-10-18 0.367557\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-18 2024-10-25 0.342808\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-18 2024-10-25 0.342808\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-18 2024-10-25 0.342808\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-18 2024-10-25 0.342808\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-18 2024-10-25 0.342808\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-25 2024-11-01 0.397058\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-25 2024-11-01 0.397058\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-25 2024-11-01 0.397058\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-25 2024-11-01 0.397058\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-10-25 2024-11-01 0.397058\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-01 2024-11-08 0.666605\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-01 2024-11-08 0.666605\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-01 2024-11-08 0.666605\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-01 2024-11-08 0.666605\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-01 2024-11-08 0.666605\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-08 2024-11-15 0.805488\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-08 2024-11-15 0.805488\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-08 2024-11-15 0.805488\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-08 2024-11-15 0.805488\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-08 2024-11-15 0.805488\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-15 2024-11-22 0.744558\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-15 2024-11-22 0.744558\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-15 2024-11-22 0.744558\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-15 2024-11-22 0.744558\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-15 2024-11-22 0.744558\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-22 2024-11-29 0.351228\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-22 2024-11-29 0.351228\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-22 2024-11-29 0.351228\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-22 2024-11-29 0.351228\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-22 2024-11-29 0.351228\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-29 2024-12-06 0.727334\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-29 2024-12-06 0.727334\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-29 2024-12-06 0.727334\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-29 2024-12-06 0.727334\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-11-29 2024-12-06 0.727334\n",
|
|
" 开始日期 结束日期 准确率\n",
|
|
"0 2024-12-06 2024-12-13 0.835391\n"
|
|
]
|
|
}
|
|
],
|
|
"source": [
|
"# Score one forecast row by comparing the predicted [min_price, max_price] band\n",
"# with the actual [LOW_PRICE, HIGH_PRICE] range.\n",
"def calculate_accuracy(row):\n",
"    '''Return the accuracy score of a single row.\n",
"\n",
"    The score is 1 when one interval fully contains the other, 0 when the predicted\n",
"    band lies entirely below or above the actual range, and otherwise the distance\n",
"    between the two middle values of the four sorted prices (the overlap length when\n",
"    both intervals are well-formed) divided by HIGH_PRICE - LOW_PRICE.\n",
"\n",
"    Args:\n",
"        row: Mapping-like object with 'min_price', 'max_price', 'LOW_PRICE' and 'HIGH_PRICE'.\n",
"\n",
"    Returns:\n",
"        1, 0, or the overlap ratio as a float.\n",
"    '''\n",
"    pred_low, pred_high = row['min_price'], row['max_price']\n",
"    real_low, real_high = row['LOW_PRICE'], row['HIGH_PRICE']\n",
"\n",
"    # Full containment, in either direction.\n",
"    prediction_covers_actual = pred_high >= real_high and pred_low <= real_low\n",
"    actual_covers_prediction = pred_high <= real_high and pred_low >= real_low\n",
"    if prediction_covers_actual or actual_covers_prediction:\n",
"        return 1\n",
"\n",
"    # No intersection at all.\n",
"    if pred_high < real_low or pred_low > real_high:\n",
"        return 0\n",
"\n",
"    # Partial intersection: the two inner values of the sorted prices bound the overlap.\n",
"    ordered = sorted([real_low, pred_low, pred_high, real_high])\n",
"    return (ordered[2] - ordered[1]) / (real_high - real_low)\n",
|
|
"import datetime\n",
|
"# Weights consumed by `_get_accuracy_rate`, which indexes this list with\n",
"# (number of rows for a forecast date - 1).\n",
"weight_dict = [0.4,0.15,0.1,0.1,0.25]\n",
"\n",
"# Cast the four price columns to float, then score every row with `calculate_accuracy`.\n",
"columns = ['HIGH_PRICE','LOW_PRICE','min_price','max_price']\n",
"df[columns] = df[columns].astype('float64')\n",
"df['ACCURACY'] = df.apply(calculate_accuracy, axis='columns')\n",
"# df['ACCURACY'] = df.apply(is_within_range, axis=1)\n",
|
"# Dates of the scoring window that precedes the week of `end_time`.\n",
"def get_week_date(end_time):\n",
"    '''Return eight consecutive dates ending on the Friday before the week of `end_time`.\n",
"\n",
"    The window starts on the Friday of the week two weeks before the week that\n",
"    contains `end_time` and ends on the Friday of the week immediately before it.\n",
"\n",
"    Args:\n",
"        end_time: Date string in '%Y-%m-%d' format.\n",
"\n",
"    Returns:\n",
"        list[str]: Eight '%Y-%m-%d' date strings in ascending order.\n",
"    '''\n",
"    anchor = datetime.datetime.strptime(end_time, '%Y-%m-%d')\n",
"    # Monday of the week two weeks before the week containing `end_time`.\n",
"    base_monday = anchor - datetime.timedelta(days=anchor.weekday() + 14)\n",
"    # Offsets 4..11 run from that week's Friday through the following week's Friday.\n",
"    return [\n",
"        (base_monday + datetime.timedelta(days=offset)).strftime('%Y-%m-%d')\n",
"        for offset in range(4, 12)\n",
"    ]\n",
|
|
"\n",
|
"# Compute the weighted accuracy for one date window and save the results.\n",
"def _get_accuracy_rate(df,up_week_dates,endtime):\n",
"    '''Score the rows created and due inside `up_week_dates`, then export and print the score.\n",
"\n",
"    Rows are kept when both `CREAT_DATE` and `ds` are found in `up_week_dates`. For each\n",
"    remaining `ds`, the sum of `ACCURACY` divided by the row count is multiplied by\n",
"    `weight_dict[row count - 1]`; the products are added up into the final score.\n",
"\n",
"    Side effects: writes `accuracy_{endtime}.csv` (the selected rows) and\n",
"    `accuracy_rote_{endtime}.csv` (one summary row) into `dataset`, and prints the summary.\n",
"\n",
"    Args:\n",
"        df: Frame with `CREAT_DATE`, `ds` and `ACCURACY` columns.\n",
"        up_week_dates: Sequence of dates; its first and last items are reported as the window bounds.\n",
"        endtime: Value embedded in the two output file names.\n",
"    '''\n",
"    created_in_window = df['CREAT_DATE'].isin(up_week_dates)\n",
"    due_in_window = df['ds'].isin(up_week_dates)\n",
"    df3 = df[created_in_window & due_in_window]\n",
"\n",
"    # Accumulate from the integer 0 so that an empty window still reports 0.\n",
"    accuracy_rote = sum(\n",
"        (\n",
"            (rows['ACCURACY'].sum()/len(rows))*weight_dict[len(rows)-1]\n",
"            for _, rows in df3.groupby('ds')\n",
"        ),\n",
"        0,\n",
"    )\n",
"\n",
"    df3.to_csv(os.path.join(dataset,f'accuracy_{endtime}.csv'),index=False)\n",
"    # One-row summary: start date, end date, accuracy.\n",
"    df4 = pd.DataFrame(columns=['开始日期','结束日期','准确率'])\n",
"    df4.loc[len(df4)] = {'开始日期':up_week_dates[0],'结束日期':up_week_dates[-1],'准确率':accuracy_rote}\n",
"    df4.to_csv(os.path.join(dataset,f'accuracy_rote_{endtime}.csv'),index=False)\n",
"    print(df4)\n",
"    # df4.to_sql('accuracy_rote', con=sqlitedb.connection, if_exists='append', index=False)\n",
|
|
"\n",
|
|
"\n",
|
"# Score the preceding window once for every distinct forecast creation date.\n",
"end_times = pd.unique(df['CREAT_DATE'])\n",
"for endtime in end_times:\n",
"    up_week_dates = get_week_date(endtime)\n",
"    _get_accuracy_rate(df, up_week_dates, endtime)\n",
|
|
"\n",
|
|
"# 打印结果\n",
|
|
"\n"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 31,
|
|
"id": "0f942c69",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
"(255, 6)\n",
|
|
" ds min_price max_price LOW_PRICE LOW_PRICE CREAT_DATE\n",
|
|
"0 2024-10-08 78.172055 81.172055 76.36 76.36 2024-10-07\n",
|
|
"1 2024-10-09 78.017734 81.017734 75.15 75.15 2024-10-07\n",
|
|
"2 2024-10-10 78.196563 81.196563 76.72 76.72 2024-10-07\n",
|
|
"3 2024-10-11 78.244970 81.244970 78.04 78.04 2024-10-07\n",
|
|
"4 2024-10-14 78.448240 81.448240 74.86 74.86 2024-10-07\n",
|
|
"5 2024-10-09 75.442758 78.442758 75.15 75.15 2024-10-08\n",
|
|
"6 2024-10-10 75.684414 78.684414 76.72 76.72 2024-10-08\n",
|
|
"7 2024-10-11 75.675482 78.675482 78.04 78.04 2024-10-08\n",
|
|
"8 2024-10-14 75.819379 78.819379 74.86 74.86 2024-10-08\n",
|
|
"9 2024-10-15 75.830953 78.830953 73.34 73.34 2024-10-08\n",
|
|
"['2024-10-07', '2024-10-08', '2024-10-09', '2024-10-10', '2024-10-11', '2024-10-12', '2024-10-13']\n",
|
|
"(10, 6)\n",
|
|
" ds min_price max_price LOW_PRICE LOW_PRICE CREAT_DATE\n",
|
|
"0 2024-10-08 78.172055 81.172055 76.36 76.36 2024-10-07\n",
|
|
"1 2024-10-09 78.017734 81.017734 75.15 75.15 2024-10-07\n",
|
|
"2 2024-10-10 78.196563 81.196563 76.72 76.72 2024-10-07\n",
|
|
"3 2024-10-11 78.244970 81.244970 78.04 78.04 2024-10-07\n",
|
|
"5 2024-10-09 75.442758 78.442758 75.15 75.15 2024-10-08\n",
|
|
"6 2024-10-10 75.684414 78.684414 76.72 76.72 2024-10-08\n",
|
|
"7 2024-10-11 75.675482 78.675482 78.04 78.04 2024-10-08\n",
|
|
"10 2024-10-10 75.439643 78.439643 76.72 76.72 2024-10-09\n",
|
|
"11 2024-10-11 75.214194 78.214194 78.04 78.04 2024-10-09\n",
|
|
"15 2024-10-11 77.558740 80.558740 78.04 78.04 2024-10-10\n"
|
|
]
|
|
},
|
|
{
|
|
"ename": "ValueError",
|
|
"evalue": "Per-column arrays must each be 1-dimensional",
|
|
"output_type": "error",
|
|
"traceback": [
|
|
"\u001b[1;31m---------------------------------------------------------------------------\u001b[0m",
|
|
"\u001b[1;31mValueError\u001b[0m Traceback (most recent call last)",
|
|
"Cell \u001b[1;32mIn[31], line 33\u001b[0m\n\u001b[0;32m 31\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmin_price\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[0;32m 32\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmax_price\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[1;32m---> 33\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mLOW_PRICE\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[0;32m 34\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mHIGH_PRICE\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\relational.py:742\u001b[0m, in \u001b[0;36mscatterplot\u001b[1;34m(data, x, y, hue, size, style, palette, hue_order, hue_norm, sizes, size_order, size_norm, markers, style_order, legend, ax, **kwargs)\u001b[0m\n\u001b[0;32m 732\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mscatterplot\u001b[39m(\n\u001b[0;32m 733\u001b[0m data\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, \u001b[38;5;241m*\u001b[39m,\n\u001b[0;32m 734\u001b[0m x\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, y\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, hue\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, size\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, style\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m (...)\u001b[0m\n\u001b[0;32m 738\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs\n\u001b[0;32m 739\u001b[0m ):\n\u001b[0;32m 741\u001b[0m variables \u001b[38;5;241m=\u001b[39m _ScatterPlotter\u001b[38;5;241m.\u001b[39mget_semantics(\u001b[38;5;28mlocals\u001b[39m())\n\u001b[1;32m--> 742\u001b[0m p \u001b[38;5;241m=\u001b[39m _ScatterPlotter(data\u001b[38;5;241m=\u001b[39mdata, variables\u001b[38;5;241m=\u001b[39mvariables, legend\u001b[38;5;241m=\u001b[39mlegend)\n\u001b[0;32m 744\u001b[0m p\u001b[38;5;241m.\u001b[39mmap_hue(palette\u001b[38;5;241m=\u001b[39mpalette, order\u001b[38;5;241m=\u001b[39mhue_order, norm\u001b[38;5;241m=\u001b[39mhue_norm)\n\u001b[0;32m 745\u001b[0m p\u001b[38;5;241m.\u001b[39mmap_size(sizes\u001b[38;5;241m=\u001b[39msizes, order\u001b[38;5;241m=\u001b[39msize_order, norm\u001b[38;5;241m=\u001b[39msize_norm)\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\relational.py:538\u001b[0m, in \u001b[0;36m_ScatterPlotter.__init__\u001b[1;34m(self, data, variables, legend)\u001b[0m\n\u001b[0;32m 529\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m__init__\u001b[39m(\u001b[38;5;28mself\u001b[39m, \u001b[38;5;241m*\u001b[39m, data\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, variables\u001b[38;5;241m=\u001b[39m{}, legend\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m):\n\u001b[0;32m 530\u001b[0m \n\u001b[0;32m 531\u001b[0m \u001b[38;5;66;03m# TODO this is messy, we want the mapping to be agnostic about\u001b[39;00m\n\u001b[0;32m 532\u001b[0m \u001b[38;5;66;03m# the kind of plot to draw, but for the time being we need to set\u001b[39;00m\n\u001b[0;32m 533\u001b[0m \u001b[38;5;66;03m# this information so the SizeMapping can use it\u001b[39;00m\n\u001b[0;32m 534\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_default_size_range \u001b[38;5;241m=\u001b[39m (\n\u001b[0;32m 535\u001b[0m np\u001b[38;5;241m.\u001b[39mr_[\u001b[38;5;241m.5\u001b[39m, \u001b[38;5;241m2\u001b[39m] \u001b[38;5;241m*\u001b[39m np\u001b[38;5;241m.\u001b[39msquare(mpl\u001b[38;5;241m.\u001b[39mrcParams[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlines.markersize\u001b[39m\u001b[38;5;124m\"\u001b[39m])\n\u001b[0;32m 536\u001b[0m )\n\u001b[1;32m--> 538\u001b[0m \u001b[38;5;28msuper\u001b[39m()\u001b[38;5;241m.\u001b[39m\u001b[38;5;21m__init__\u001b[39m(data\u001b[38;5;241m=\u001b[39mdata, variables\u001b[38;5;241m=\u001b[39mvariables)\n\u001b[0;32m 540\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlegend \u001b[38;5;241m=\u001b[39m legend\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:640\u001b[0m, in \u001b[0;36mVectorPlotter.__init__\u001b[1;34m(self, data, variables)\u001b[0m\n\u001b[0;32m 635\u001b[0m \u001b[38;5;66;03m# var_ordered is relevant only for categorical axis variables, and may\u001b[39;00m\n\u001b[0;32m 636\u001b[0m \u001b[38;5;66;03m# be better handled by an internal axis information object that tracks\u001b[39;00m\n\u001b[0;32m 637\u001b[0m \u001b[38;5;66;03m# such information and is set up by the scale_* methods. The analogous\u001b[39;00m\n\u001b[0;32m 638\u001b[0m \u001b[38;5;66;03m# information for numeric axes would be information about log scales.\u001b[39;00m\n\u001b[0;32m 639\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_var_ordered \u001b[38;5;241m=\u001b[39m {\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mx\u001b[39m\u001b[38;5;124m\"\u001b[39m: \u001b[38;5;28;01mFalse\u001b[39;00m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124my\u001b[39m\u001b[38;5;124m\"\u001b[39m: \u001b[38;5;28;01mFalse\u001b[39;00m} \u001b[38;5;66;03m# alt., used DefaultDict\u001b[39;00m\n\u001b[1;32m--> 640\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39massign_variables(data, variables)\n\u001b[0;32m 642\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m var, \u001b[38;5;28mcls\u001b[39m \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_semantic_mappings\u001b[38;5;241m.\u001b[39mitems():\n\u001b[0;32m 643\u001b[0m \n\u001b[0;32m 644\u001b[0m \u001b[38;5;66;03m# Create the mapping function\u001b[39;00m\n\u001b[0;32m 645\u001b[0m map_func \u001b[38;5;241m=\u001b[39m partial(\u001b[38;5;28mcls\u001b[39m\u001b[38;5;241m.\u001b[39mmap, plotter\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m)\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:701\u001b[0m, in \u001b[0;36mVectorPlotter.assign_variables\u001b[1;34m(self, data, variables)\u001b[0m\n\u001b[0;32m 699\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 700\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39minput_format \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlong\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[1;32m--> 701\u001b[0m plot_data, variables \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_assign_variables_longform(\n\u001b[0;32m 702\u001b[0m data, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mvariables,\n\u001b[0;32m 703\u001b[0m )\n\u001b[0;32m 705\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mplot_data \u001b[38;5;241m=\u001b[39m plot_data\n\u001b[0;32m 706\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mvariables \u001b[38;5;241m=\u001b[39m variables\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:962\u001b[0m, in \u001b[0;36mVectorPlotter._assign_variables_longform\u001b[1;34m(self, data, **kwargs)\u001b[0m\n\u001b[0;32m 958\u001b[0m variables[key] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mgetattr\u001b[39m(val, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mname\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;28;01mNone\u001b[39;00m)\n\u001b[0;32m 960\u001b[0m \u001b[38;5;66;03m# Construct a tidy plot DataFrame. This will convert a number of\u001b[39;00m\n\u001b[0;32m 961\u001b[0m \u001b[38;5;66;03m# types automatically, aligning on index in case of pandas objects\u001b[39;00m\n\u001b[1;32m--> 962\u001b[0m plot_data \u001b[38;5;241m=\u001b[39m pd\u001b[38;5;241m.\u001b[39mDataFrame(plot_data)\n\u001b[0;32m 964\u001b[0m \u001b[38;5;66;03m# Reduce the variables dictionary to fields with valid data\u001b[39;00m\n\u001b[0;32m 965\u001b[0m variables \u001b[38;5;241m=\u001b[39m {\n\u001b[0;32m 966\u001b[0m var: name\n\u001b[0;32m 967\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m var, name \u001b[38;5;129;01min\u001b[39;00m variables\u001b[38;5;241m.\u001b[39mitems()\n\u001b[0;32m 968\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m plot_data[var]\u001b[38;5;241m.\u001b[39mnotnull()\u001b[38;5;241m.\u001b[39many()\n\u001b[0;32m 969\u001b[0m }\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\frame.py:733\u001b[0m, in \u001b[0;36mDataFrame.__init__\u001b[1;34m(self, data, index, columns, dtype, copy)\u001b[0m\n\u001b[0;32m 727\u001b[0m mgr \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_mgr(\n\u001b[0;32m 728\u001b[0m data, axes\u001b[38;5;241m=\u001b[39m{\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mindex\u001b[39m\u001b[38;5;124m\"\u001b[39m: index, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mcolumns\u001b[39m\u001b[38;5;124m\"\u001b[39m: columns}, dtype\u001b[38;5;241m=\u001b[39mdtype, copy\u001b[38;5;241m=\u001b[39mcopy\n\u001b[0;32m 729\u001b[0m )\n\u001b[0;32m 731\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(data, \u001b[38;5;28mdict\u001b[39m):\n\u001b[0;32m 732\u001b[0m \u001b[38;5;66;03m# GH#38939 de facto copy defaults to False only in non-dict cases\u001b[39;00m\n\u001b[1;32m--> 733\u001b[0m mgr \u001b[38;5;241m=\u001b[39m dict_to_mgr(data, index, columns, dtype\u001b[38;5;241m=\u001b[39mdtype, copy\u001b[38;5;241m=\u001b[39mcopy, typ\u001b[38;5;241m=\u001b[39mmanager)\n\u001b[0;32m 734\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(data, ma\u001b[38;5;241m.\u001b[39mMaskedArray):\n\u001b[0;32m 735\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mma\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m mrecords\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:503\u001b[0m, in \u001b[0;36mdict_to_mgr\u001b[1;34m(data, index, columns, dtype, typ, copy)\u001b[0m\n\u001b[0;32m 499\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 500\u001b[0m \u001b[38;5;66;03m# dtype check to exclude e.g. range objects, scalars\u001b[39;00m\n\u001b[0;32m 501\u001b[0m arrays \u001b[38;5;241m=\u001b[39m [x\u001b[38;5;241m.\u001b[39mcopy() \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mhasattr\u001b[39m(x, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdtype\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;28;01melse\u001b[39;00m x \u001b[38;5;28;01mfor\u001b[39;00m x \u001b[38;5;129;01min\u001b[39;00m arrays]\n\u001b[1;32m--> 503\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m arrays_to_mgr(arrays, columns, index, dtype\u001b[38;5;241m=\u001b[39mdtype, typ\u001b[38;5;241m=\u001b[39mtyp, consolidate\u001b[38;5;241m=\u001b[39mcopy)\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:114\u001b[0m, in \u001b[0;36marrays_to_mgr\u001b[1;34m(arrays, columns, index, dtype, verify_integrity, typ, consolidate)\u001b[0m\n\u001b[0;32m 111\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m verify_integrity:\n\u001b[0;32m 112\u001b[0m \u001b[38;5;66;03m# figure out the index, if necessary\u001b[39;00m\n\u001b[0;32m 113\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m index \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m--> 114\u001b[0m index \u001b[38;5;241m=\u001b[39m _extract_index(arrays)\n\u001b[0;32m 115\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 116\u001b[0m index \u001b[38;5;241m=\u001b[39m ensure_index(index)\n",
|
|
"File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:664\u001b[0m, in \u001b[0;36m_extract_index\u001b[1;34m(data)\u001b[0m\n\u001b[0;32m 662\u001b[0m raw_lengths\u001b[38;5;241m.\u001b[39mappend(\u001b[38;5;28mlen\u001b[39m(val))\n\u001b[0;32m 663\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(val, np\u001b[38;5;241m.\u001b[39mndarray) \u001b[38;5;129;01mand\u001b[39;00m val\u001b[38;5;241m.\u001b[39mndim \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m:\n\u001b[1;32m--> 664\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mPer-column arrays must each be 1-dimensional\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[0;32m 666\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m indexes \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m raw_lengths:\n\u001b[0;32m 667\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mIf using all scalar values, you must pass an index\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n",
|
|
"\u001b[1;31mValueError\u001b[0m: Per-column arrays must each be 1-dimensional"
|
|
]
|
|
},
|
|
{
|
|
"data": {
|
|
"image/png": "",
|
|
"text/plain": [
|
|
"<Figure size 1600x1000 with 1 Axes>"
|
|
]
|
|
},
|
|
"metadata": {},
|
|
"output_type": "display_data"
|
|
}
|
|
],
|
|
"source": [
|
|
"# 画图\n",
|
|
"import matplotlib.pyplot as plt\n",
|
|
"import seaborn as sns\n",
|
|
"\n",
|
"# Columns needed for the plot: forecast band (min/max), actual low/high, and both date columns.\n",
"# Each label must appear exactly once: selecting 'LOW_PRICE' twice makes df['LOW_PRICE']\n",
"# return a two-column frame (scatterplot then fails with 'Per-column arrays must each be\n",
"# 1-dimensional'), and leaving out 'HIGH_PRICE' makes the later lookup raise KeyError.\n",
"df5 = df[['ds','min_price','max_price','LOW_PRICE','HIGH_PRICE','CREAT_DATE']].copy()\n",
"\n",
"print(df5.shape)\n",
"print(df5.head(10))\n",
"# Figure setup\n",
"plt.figure(figsize=(16,10))\n",
|
|
"\n",
|
"def get_this_week_date(end_time):\n",
"    '''Return the dates of the Monday-to-Sunday week that contains `end_time`.\n",
"\n",
"    Args:\n",
"        end_time: Anything `pd.Timestamp` accepts: a Timestamp, a datetime,\n",
"            a numpy.datetime64 or a date string.\n",
"\n",
"    Returns:\n",
"        list[str]: Seven '%Y-%m-%d' date strings, Monday first.\n",
"    '''\n",
"    # Normalise first: values taken from Series.unique() may be numpy.datetime64,\n",
"    # which has no weekday() method. Using pandas types also removes the reliance on\n",
"    # `datetime` having been imported by an earlier cell.\n",
"    day = pd.Timestamp(end_time)\n",
"    monday = day - pd.Timedelta(days=day.weekday())\n",
"    return [(monday + pd.Timedelta(days=offset)).strftime('%Y-%m-%d') for offset in range(7)]\n",
|
|
"\n",
|
"# Plot each calendar week once. Several `ds` values fall into the same week, so weeks are\n",
"# de-duplicated by their Monday instead of being redrawn for every single date.\n",
"series_colors = {\n",
"    'min_price': 'tab:blue',\n",
"    'max_price': 'tab:orange',\n",
"    'LOW_PRICE': 'tab:green',\n",
"    'HIGH_PRICE': 'tab:red',\n",
"}\n",
"ax = plt.gca()\n",
"plotted_weeks = set()\n",
"\n",
"# Group by `ds`\n",
"end_times = df['ds'].unique()\n",
"for endtime in end_times:\n",
"    # pd.Timestamp() keeps this working whether unique() yields Timestamps or numpy.datetime64.\n",
"    up_week_dates = get_this_week_date(pd.Timestamp(endtime))\n",
"    if up_week_dates[0] in plotted_weeks:\n",
"        continue\n",
"    print(up_week_dates)\n",
"    df6 = df5[df5['ds'].isin(up_week_dates)]\n",
"    print(df6.shape)\n",
"    print(df6.head(10))\n",
"    # One scatter layer per price series (each drawn exactly once). A fixed colour per\n",
"    # series keeps the weeks comparable; the legend label is attached only for the first\n",
"    # week so the legend does not repeat entries.\n",
"    for column, color in series_colors.items():\n",
"        legend_kwargs = {} if plotted_weeks else {'label': column}\n",
"        sns.scatterplot(x=df6.index, y=df6[column].values, color=color, ax=ax, **legend_kwargs)\n",
"    plotted_weeks.add(up_week_dates[0])\n",
"\n",
"ax.set_xlabel('row index')\n",
"ax.set_ylabel('price')"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": null,
|
|
"id": "336fa6ed",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": []
|
|
}
|
|
],
|
|
"metadata": {
|
|
"kernelspec": {
|
|
"display_name": "base",
|
|
"language": "python",
|
|
"name": "python3"
|
|
},
|
|
"language_info": {
|
|
"codemirror_mode": {
|
|
"name": "ipython",
|
|
"version": 3
|
|
},
|
|
"file_extension": ".py",
|
|
"mimetype": "text/x-python",
|
|
"name": "python",
|
|
"nbconvert_exporter": "python",
|
|
"pygments_lexer": "ipython3",
|
|
"version": "3.11.7"
|
|
}
|
|
},
|
|
"nbformat": 4,
|
|
"nbformat_minor": 5
|
|
}
|