{ "cells": [ { "cell_type": "code", "execution_count": 13, "id": "9daadf20-caa6-4b25-901c-6cc3ef563f58", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(255, 28)\n", "(78, 4)\n", "(255, 31)\n", " ds NHITS Informer LSTM iTransformer TSMixer \\\n", "0 2024-10-08 79.76823 80.197660 79.802414 78.391460 80.200510 \n", "1 2024-10-09 78.75903 80.235740 79.844154 78.888565 79.861180 \n", "2 2024-10-10 79.43970 80.186230 79.885100 79.488700 79.483086 \n", "3 2024-10-11 79.62268 80.502975 79.878560 79.406670 79.313965 \n", "4 2024-10-14 79.91698 80.931946 79.936270 79.758575 79.197430 \n", "\n", " TSMixerx PatchTST RNN GRU ... y \\\n", "0 79.243256 80.883450 80.836105 81.276060 ... 77.180000 \n", "1 78.068150 80.950096 80.917860 81.303505 ... 76.580002 \n", "2 77.189064 80.347400 80.866040 81.798050 ... 79.400002 \n", "3 77.840096 80.545296 81.167710 81.552810 ... 79.040001 \n", "4 77.904300 81.432976 81.144210 81.483215 ... 77.459999 \n", "\n", " min_within_quantile max_within_quantile id CREAT_DATE min_price \\\n", "0 80.200510 81.163630 51 2024-10-07 79.848624 \n", "1 79.861180 81.757850 52 2024-10-07 79.981211 \n", "2 79.483086 81.190400 53 2024-10-07 79.398409 \n", "3 79.313965 81.371100 54 2024-10-07 79.394607 \n", "4 79.197430 81.432976 55 2024-10-07 79.351007 \n", "\n", " max_price 序号 LOW_PRICE HIGH_PRICE \n", "0 81.848624 52.0 76.36 81.14 \n", "1 81.981211 51.0 75.15 78.02 \n", "2 81.398409 50.0 76.72 79.72 \n", "3 81.394607 49.0 78.04 79.50 \n", "4 81.351007 48.0 74.86 78.55 \n", "\n", "[5 rows x 31 columns]\n", " ds NHITS Informer LSTM iTransformer TSMixer \\\n", "250 2024-12-16 74.268654 73.333750 73.090164 74.007034 74.36094 \n", "251 2024-12-17 74.724630 73.373810 73.242540 74.285530 74.24597 \n", "252 2024-12-18 74.948860 73.505330 73.400400 74.260290 74.06419 \n", "253 2024-12-19 74.396740 73.934380 73.764320 74.429800 74.18059 \n", "254 2024-12-20 73.882930 73.700935 73.769050 73.977585 73.97370 \n", "\n", " TSMixerx PatchTST RNN GRU ... y min_within_quantile \\\n", "250 74.67781 74.475680 75.63023 74.853800 ... NaN 74.157196 \n", "251 74.46460 74.628000 75.22519 74.957530 ... NaN 73.711680 \n", "252 74.32628 74.656815 75.49716 74.890236 ... NaN 74.064190 \n", "253 74.41026 74.698875 75.87007 75.118866 ... NaN 74.148070 \n", "254 74.49235 74.345410 75.88466 75.186325 ... NaN 73.816990 \n", "\n", " max_within_quantile id CREAT_DATE min_price max_price 序号 \\\n", "250 74.576454 301 2024-12-16 73.416857 75.416857 3.0 \n", "251 74.948060 302 2024-12-16 73.434301 75.434301 2.0 \n", "252 75.200980 303 2024-12-16 73.707471 75.707471 1.0 \n", "253 75.395440 304 2024-12-16 73.639791 75.639791 NaN \n", "254 74.345410 305 2024-12-16 73.067399 75.067399 NaN \n", "\n", " LOW_PRICE HIGH_PRICE \n", "250 72.53 73.28 \n", "251 72.48 74.18 \n", "252 72.80 74.20 \n", "253 NaN NaN \n", "254 NaN NaN \n", "\n", "[5 rows x 31 columns]\n" ] } ], "source": [ "import sqlite3\n", "import os\n", "import pandas as pd\n", "\n", "dataset = r'yuanyoudataset'\n", "\n", "# dataset = r'C:\\Users\\Administrator\\Desktop' \n", "\n", "# 预测价格数据\n", "# dbfilename = os.path.join(r'D:\\code\\PriceForecast\\yuanyoudataset','jbsh_yuanyou.db')\n", "# conn = sqlite3.connect(dbfilename)\n", "# query = 'SELECT * FROM accuracy'\n", "# df1 = pd.read_sql_query(query, conn)\n", "# df1['ds'] = df1['PREDICT_DATE']\n", "# conn.close()\n", "# print(df1.shape)\n", "\n", "# 预测价格数据\n", "dfcsvfilename = os.path.join(dataset,'accuracy_five_mean.csv')\n", "df1 = pd.read_csv(dfcsvfilename)\n", "print(df1.shape)\n", "\n", "# 最高最低价\n", "xlsfilename = os.path.join(dataset,'数据项下载.xls')\n", "df2 = pd.read_excel(xlsfilename)[5:]\n", "df2 = df2.rename(columns = {'数据项名称':'ds','布伦特最低价':'LOW_PRICE','布伦特最高价':'HIGH_PRICE'})\n", "print(df2.shape)\n", "\n", "\n", "\n", "df = pd.merge(df1,df2,on=['ds'],how='left')\n", "\n", "df['ds'] = pd.to_datetime(df['ds'])\n", "# df['PREDICT_DATE'] = pd.to_datetime(df['PREDICT_DATE'])\n", "df = df.reindex()\n", "\n", "print(df.shape)\n", "# from datetime import datetime\n", "import time\n", "df.to_csv(os.path.join(dataset,f'预测数据-{time.time()}.csv'))\n", "# df = df[['ds','min_within_quantile','max_within_quantile']]\n", "\n", "\n", "\n", "# 打印数据框的前几行\n", "print(df.head())\n", "print(df.tail())\n" ] }, { "cell_type": "code", "execution_count": 14, "id": "0d77ab7d", "metadata": {}, "outputs": [], "source": [ "# 模型评估前五均值 \n", "df['min_price'] = df.iloc[:,1:6].mean(axis=1) -1.5\n", "df['max_price'] = df.iloc[:,1:6].mean(axis=1) +1.5" ] }, { "cell_type": "code", "execution_count": 15, "id": "e51c3fd0-6bff-45de-b8b6-971e7986c7a7", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ " 开始日期 结束日期 准确率\n", "0 2024-09-27 2024-10-04 0\n", " 开始日期 结束日期 准确率\n", "0 2024-09-27 2024-10-04 0\n", " 开始日期 结束日期 准确率\n", "0 2024-09-27 2024-10-04 0\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ " 开始日期 结束日期 准确率\n", "0 2024-09-27 2024-10-04 0\n", " 开始日期 结束日期 准确率\n", "0 2024-09-27 2024-10-04 0\n", " 开始日期 结束日期 准确率\n", "0 2024-10-04 2024-10-11 0.433988\n", " 开始日期 结束日期 准确率\n", "0 2024-10-04 2024-10-11 0.433988\n", " 开始日期 结束日期 准确率\n", "0 2024-10-04 2024-10-11 0.433988\n", " 开始日期 结束日期 准确率\n", "0 2024-10-04 2024-10-11 0.433988\n", " 开始日期 结束日期 准确率\n", "0 2024-10-04 2024-10-11 0.433988\n", " 开始日期 结束日期 准确率\n", "0 2024-10-11 2024-10-18 0.367557\n", " 开始日期 结束日期 准确率\n", "0 2024-10-11 2024-10-18 0.367557\n", " 开始日期 结束日期 准确率\n", "0 2024-10-11 2024-10-18 0.367557\n", " 开始日期 结束日期 准确率\n", "0 2024-10-11 2024-10-18 0.367557\n", " 开始日期 结束日期 准确率\n", "0 2024-10-11 2024-10-18 0.367557\n", " 开始日期 结束日期 准确率\n", "0 2024-10-18 2024-10-25 0.342808\n", " 开始日期 结束日期 准确率\n", "0 2024-10-18 2024-10-25 0.342808\n", " 开始日期 结束日期 准确率\n", "0 2024-10-18 2024-10-25 0.342808\n", " 开始日期 结束日期 准确率\n", "0 2024-10-18 2024-10-25 0.342808\n", " 开始日期 结束日期 准确率\n", "0 2024-10-18 2024-10-25 0.342808\n", " 开始日期 结束日期 准确率\n", "0 2024-10-25 2024-11-01 0.397058\n", " 开始日期 结束日期 准确率\n", "0 2024-10-25 2024-11-01 0.397058\n", " 开始日期 结束日期 准确率\n", "0 2024-10-25 2024-11-01 0.397058\n", " 开始日期 结束日期 准确率\n", "0 2024-10-25 2024-11-01 0.397058\n", " 开始日期 结束日期 准确率\n", "0 2024-10-25 2024-11-01 0.397058\n", " 开始日期 结束日期 准确率\n", "0 2024-11-01 2024-11-08 0.666605\n", " 开始日期 结束日期 准确率\n", "0 2024-11-01 2024-11-08 0.666605\n", " 开始日期 结束日期 准确率\n", "0 2024-11-01 2024-11-08 0.666605\n", " 开始日期 结束日期 准确率\n", "0 2024-11-01 2024-11-08 0.666605\n", " 开始日期 结束日期 准确率\n", "0 2024-11-01 2024-11-08 0.666605\n", " 开始日期 结束日期 准确率\n", "0 2024-11-08 2024-11-15 0.805488\n", " 开始日期 结束日期 准确率\n", "0 2024-11-08 2024-11-15 0.805488\n", " 开始日期 结束日期 准确率\n", "0 2024-11-08 2024-11-15 0.805488\n", " 开始日期 结束日期 准确率\n", "0 2024-11-08 2024-11-15 0.805488\n", " 开始日期 结束日期 准确率\n", "0 2024-11-08 2024-11-15 0.805488\n", " 开始日期 结束日期 准确率\n", "0 2024-11-15 2024-11-22 0.744558\n", " 开始日期 结束日期 准确率\n", "0 2024-11-15 2024-11-22 0.744558\n", " 开始日期 结束日期 准确率\n", "0 2024-11-15 2024-11-22 0.744558\n", " 开始日期 结束日期 准确率\n", "0 2024-11-15 2024-11-22 0.744558\n", " 开始日期 结束日期 准确率\n", "0 2024-11-15 2024-11-22 0.744558\n", " 开始日期 结束日期 准确率\n", "0 2024-11-22 2024-11-29 0.351228\n", " 开始日期 结束日期 准确率\n", "0 2024-11-22 2024-11-29 0.351228\n", " 开始日期 结束日期 准确率\n", "0 2024-11-22 2024-11-29 0.351228\n", " 开始日期 结束日期 准确率\n", "0 2024-11-22 2024-11-29 0.351228\n", " 开始日期 结束日期 准确率\n", "0 2024-11-22 2024-11-29 0.351228\n", " 开始日期 结束日期 准确率\n", "0 2024-11-29 2024-12-06 0.727334\n", " 开始日期 结束日期 准确率\n", "0 2024-11-29 2024-12-06 0.727334\n", " 开始日期 结束日期 准确率\n", "0 2024-11-29 2024-12-06 0.727334\n", " 开始日期 结束日期 准确率\n", "0 2024-11-29 2024-12-06 0.727334\n", " 开始日期 结束日期 准确率\n", "0 2024-11-29 2024-12-06 0.727334\n", " 开始日期 结束日期 准确率\n", "0 2024-12-06 2024-12-13 0.835391\n" ] } ], "source": [ "# 定义一个函数来计算准确率\n", "# 比较真实最高最低,和预测最高最低 计算准确率\n", "def calculate_accuracy(row):\n", " # 全子集情况:\n", " if (row['max_price'] >= row['HIGH_PRICE'] and row['min_price'] <= row['LOW_PRICE']) or \\\n", " (row['max_price'] <= row['HIGH_PRICE'] and row['min_price'] >= row['LOW_PRICE']):\n", " return 1 \n", " # 无交集情况:\n", " if row['max_price'] < row['LOW_PRICE'] or \\\n", " row['min_price'] > row['HIGH_PRICE']:\n", " return 0\n", " # 有交集情况:\n", " else:\n", " sorted_prices = sorted([row['LOW_PRICE'], row['min_price'], row['max_price'], row['HIGH_PRICE']])\n", " middle_diff = sorted_prices[2] - sorted_prices[1]\n", " price_range = row['HIGH_PRICE'] - row['LOW_PRICE']\n", " accuracy = middle_diff / price_range\n", " return accuracy\n", "import datetime\n", "weight_dict = [0.4,0.15,0.1,0.1,0.25] # 权重\n", "\n", "columns = ['HIGH_PRICE','LOW_PRICE','min_price','max_price']\n", "df[columns] = df[columns].astype(float)\n", "df['ACCURACY'] = df.apply(calculate_accuracy, axis=1)\n", "# df['ACCURACY'] = df.apply(is_within_range, axis=1)\n", "# 取结束日期上一周的日期\n", "def get_week_date(end_time):\n", " endtime = end_time\n", " endtimeweek = datetime.datetime.strptime(endtime, '%Y-%m-%d')\n", " up_week = endtimeweek - datetime.timedelta(days=endtimeweek.weekday() + 14)\n", " up_week_dates = [up_week + datetime.timedelta(days=i) for i in range(14)][4:-2]\n", " up_week_dates = [date.strftime('%Y-%m-%d') for date in up_week_dates]\n", " return up_week_dates\n", "\n", "# 计算准确率并保存结果\n", "def _get_accuracy_rate(df,up_week_dates,endtime):\n", " df3 = df.copy()\n", " df3 = df3[df3['CREAT_DATE'].isin(up_week_dates)]\n", " df3 = df3[df3['ds'].isin(up_week_dates)]\n", " accuracy_rote = 0\n", " for i,group in df3.groupby('ds'):\n", " # print('权重:',weight_dict[len(group)-1])\n", " # print('准确率:',(group['ACCURACY'].sum()/len(group))*weight_dict[len(group)-1])\n", " accuracy_rote += (group['ACCURACY'].sum()/len(group))*weight_dict[len(group)-1]\n", " df3.to_csv(os.path.join(dataset,f'accuracy_{endtime}.csv'),index=False)\n", " df4 = pd.DataFrame(columns=['开始日期','结束日期','准确率'])\n", " df4.loc[len(df4)] = {'开始日期':up_week_dates[0],'结束日期':up_week_dates[-1],'准确率':accuracy_rote}\n", " df4.to_csv(os.path.join(dataset,f'accuracy_rote_{endtime}.csv'),index=False)\n", " print(df4)\n", " # df4.to_sql(\"accuracy_rote\", con=sqlitedb.connection, if_exists='append', index=False)\n", "\n", "\n", "end_times = df['CREAT_DATE'].unique()\n", "for endtime in end_times:\n", " up_week_dates = get_week_date(endtime)\n", " _get_accuracy_rate(df,up_week_dates,endtime)\n", "\n", "# 打印结果\n", "\n" ] }, { "cell_type": "code", "execution_count": 31, "id": "0f942c69", "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "(255, 6)\n", " ds min_price max_price LOW_PRICE LOW_PRICE CREAT_DATE\n", "0 2024-10-08 78.172055 81.172055 76.36 76.36 2024-10-07\n", "1 2024-10-09 78.017734 81.017734 75.15 75.15 2024-10-07\n", "2 2024-10-10 78.196563 81.196563 76.72 76.72 2024-10-07\n", "3 2024-10-11 78.244970 81.244970 78.04 78.04 2024-10-07\n", "4 2024-10-14 78.448240 81.448240 74.86 74.86 2024-10-07\n", "5 2024-10-09 75.442758 78.442758 75.15 75.15 2024-10-08\n", "6 2024-10-10 75.684414 78.684414 76.72 76.72 2024-10-08\n", "7 2024-10-11 75.675482 78.675482 78.04 78.04 2024-10-08\n", "8 2024-10-14 75.819379 78.819379 74.86 74.86 2024-10-08\n", "9 2024-10-15 75.830953 78.830953 73.34 73.34 2024-10-08\n", "['2024-10-07', '2024-10-08', '2024-10-09', '2024-10-10', '2024-10-11', '2024-10-12', '2024-10-13']\n", "(10, 6)\n", " ds min_price max_price LOW_PRICE LOW_PRICE CREAT_DATE\n", "0 2024-10-08 78.172055 81.172055 76.36 76.36 2024-10-07\n", "1 2024-10-09 78.017734 81.017734 75.15 75.15 2024-10-07\n", "2 2024-10-10 78.196563 81.196563 76.72 76.72 2024-10-07\n", "3 2024-10-11 78.244970 81.244970 78.04 78.04 2024-10-07\n", "5 2024-10-09 75.442758 78.442758 75.15 75.15 2024-10-08\n", "6 2024-10-10 75.684414 78.684414 76.72 76.72 2024-10-08\n", "7 2024-10-11 75.675482 78.675482 78.04 78.04 2024-10-08\n", "10 2024-10-10 75.439643 78.439643 76.72 76.72 2024-10-09\n", "11 2024-10-11 75.214194 78.214194 78.04 78.04 2024-10-09\n", "15 2024-10-11 77.558740 80.558740 78.04 78.04 2024-10-10\n" ] }, { "ename": "ValueError", "evalue": "Per-column arrays must each be 1-dimensional", "output_type": "error", "traceback": [ "\u001b[1;31m---------------------------------------------------------------------------\u001b[0m", "\u001b[1;31mValueError\u001b[0m Traceback (most recent call last)", "Cell \u001b[1;32mIn[31], line 33\u001b[0m\n\u001b[0;32m 31\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmin_price\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[0;32m 32\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mmax_price\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[1;32m---> 33\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mLOW_PRICE\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n\u001b[0;32m 34\u001b[0m sns\u001b[38;5;241m.\u001b[39mscatterplot(x\u001b[38;5;241m=\u001b[39mdf6\u001b[38;5;241m.\u001b[39mindex,y\u001b[38;5;241m=\u001b[39mdf6[\u001b[38;5;124m'\u001b[39m\u001b[38;5;124mHIGH_PRICE\u001b[39m\u001b[38;5;124m'\u001b[39m]\u001b[38;5;241m.\u001b[39mvalues,data\u001b[38;5;241m=\u001b[39mdf6)\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\relational.py:742\u001b[0m, in \u001b[0;36mscatterplot\u001b[1;34m(data, x, y, hue, size, style, palette, hue_order, hue_norm, sizes, size_order, size_norm, markers, style_order, legend, ax, **kwargs)\u001b[0m\n\u001b[0;32m 732\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21mscatterplot\u001b[39m(\n\u001b[0;32m 733\u001b[0m data\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, \u001b[38;5;241m*\u001b[39m,\n\u001b[0;32m 734\u001b[0m x\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, y\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, hue\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, size\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, style\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m,\n\u001b[1;32m (...)\u001b[0m\n\u001b[0;32m 738\u001b[0m \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mkwargs\n\u001b[0;32m 739\u001b[0m ):\n\u001b[0;32m 741\u001b[0m variables \u001b[38;5;241m=\u001b[39m _ScatterPlotter\u001b[38;5;241m.\u001b[39mget_semantics(\u001b[38;5;28mlocals\u001b[39m())\n\u001b[1;32m--> 742\u001b[0m p \u001b[38;5;241m=\u001b[39m _ScatterPlotter(data\u001b[38;5;241m=\u001b[39mdata, variables\u001b[38;5;241m=\u001b[39mvariables, legend\u001b[38;5;241m=\u001b[39mlegend)\n\u001b[0;32m 744\u001b[0m p\u001b[38;5;241m.\u001b[39mmap_hue(palette\u001b[38;5;241m=\u001b[39mpalette, order\u001b[38;5;241m=\u001b[39mhue_order, norm\u001b[38;5;241m=\u001b[39mhue_norm)\n\u001b[0;32m 745\u001b[0m p\u001b[38;5;241m.\u001b[39mmap_size(sizes\u001b[38;5;241m=\u001b[39msizes, order\u001b[38;5;241m=\u001b[39msize_order, norm\u001b[38;5;241m=\u001b[39msize_norm)\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\relational.py:538\u001b[0m, in \u001b[0;36m_ScatterPlotter.__init__\u001b[1;34m(self, data, variables, legend)\u001b[0m\n\u001b[0;32m 529\u001b[0m \u001b[38;5;28;01mdef\u001b[39;00m \u001b[38;5;21m__init__\u001b[39m(\u001b[38;5;28mself\u001b[39m, \u001b[38;5;241m*\u001b[39m, data\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m, variables\u001b[38;5;241m=\u001b[39m{}, legend\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mNone\u001b[39;00m):\n\u001b[0;32m 530\u001b[0m \n\u001b[0;32m 531\u001b[0m \u001b[38;5;66;03m# TODO this is messy, we want the mapping to be agnostic about\u001b[39;00m\n\u001b[0;32m 532\u001b[0m \u001b[38;5;66;03m# the kind of plot to draw, but for the time being we need to set\u001b[39;00m\n\u001b[0;32m 533\u001b[0m \u001b[38;5;66;03m# this information so the SizeMapping can use it\u001b[39;00m\n\u001b[0;32m 534\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_default_size_range \u001b[38;5;241m=\u001b[39m (\n\u001b[0;32m 535\u001b[0m np\u001b[38;5;241m.\u001b[39mr_[\u001b[38;5;241m.5\u001b[39m, \u001b[38;5;241m2\u001b[39m] \u001b[38;5;241m*\u001b[39m np\u001b[38;5;241m.\u001b[39msquare(mpl\u001b[38;5;241m.\u001b[39mrcParams[\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlines.markersize\u001b[39m\u001b[38;5;124m\"\u001b[39m])\n\u001b[0;32m 536\u001b[0m )\n\u001b[1;32m--> 538\u001b[0m \u001b[38;5;28msuper\u001b[39m()\u001b[38;5;241m.\u001b[39m\u001b[38;5;21m__init__\u001b[39m(data\u001b[38;5;241m=\u001b[39mdata, variables\u001b[38;5;241m=\u001b[39mvariables)\n\u001b[0;32m 540\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mlegend \u001b[38;5;241m=\u001b[39m legend\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:640\u001b[0m, in \u001b[0;36mVectorPlotter.__init__\u001b[1;34m(self, data, variables)\u001b[0m\n\u001b[0;32m 635\u001b[0m \u001b[38;5;66;03m# var_ordered is relevant only for categorical axis variables, and may\u001b[39;00m\n\u001b[0;32m 636\u001b[0m \u001b[38;5;66;03m# be better handled by an internal axis information object that tracks\u001b[39;00m\n\u001b[0;32m 637\u001b[0m \u001b[38;5;66;03m# such information and is set up by the scale_* methods. The analogous\u001b[39;00m\n\u001b[0;32m 638\u001b[0m \u001b[38;5;66;03m# information for numeric axes would be information about log scales.\u001b[39;00m\n\u001b[0;32m 639\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_var_ordered \u001b[38;5;241m=\u001b[39m {\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mx\u001b[39m\u001b[38;5;124m\"\u001b[39m: \u001b[38;5;28;01mFalse\u001b[39;00m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124my\u001b[39m\u001b[38;5;124m\"\u001b[39m: \u001b[38;5;28;01mFalse\u001b[39;00m} \u001b[38;5;66;03m# alt., used DefaultDict\u001b[39;00m\n\u001b[1;32m--> 640\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39massign_variables(data, variables)\n\u001b[0;32m 642\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m var, \u001b[38;5;28mcls\u001b[39m \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_semantic_mappings\u001b[38;5;241m.\u001b[39mitems():\n\u001b[0;32m 643\u001b[0m \n\u001b[0;32m 644\u001b[0m \u001b[38;5;66;03m# Create the mapping function\u001b[39;00m\n\u001b[0;32m 645\u001b[0m map_func \u001b[38;5;241m=\u001b[39m partial(\u001b[38;5;28mcls\u001b[39m\u001b[38;5;241m.\u001b[39mmap, plotter\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mself\u001b[39m)\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:701\u001b[0m, in \u001b[0;36mVectorPlotter.assign_variables\u001b[1;34m(self, data, variables)\u001b[0m\n\u001b[0;32m 699\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 700\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39minput_format \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mlong\u001b[39m\u001b[38;5;124m\"\u001b[39m\n\u001b[1;32m--> 701\u001b[0m plot_data, variables \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_assign_variables_longform(\n\u001b[0;32m 702\u001b[0m data, \u001b[38;5;241m*\u001b[39m\u001b[38;5;241m*\u001b[39mvariables,\n\u001b[0;32m 703\u001b[0m )\n\u001b[0;32m 705\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mplot_data \u001b[38;5;241m=\u001b[39m plot_data\n\u001b[0;32m 706\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mvariables \u001b[38;5;241m=\u001b[39m variables\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\seaborn\\_oldcore.py:962\u001b[0m, in \u001b[0;36mVectorPlotter._assign_variables_longform\u001b[1;34m(self, data, **kwargs)\u001b[0m\n\u001b[0;32m 958\u001b[0m variables[key] \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mgetattr\u001b[39m(val, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mname\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;28;01mNone\u001b[39;00m)\n\u001b[0;32m 960\u001b[0m \u001b[38;5;66;03m# Construct a tidy plot DataFrame. This will convert a number of\u001b[39;00m\n\u001b[0;32m 961\u001b[0m \u001b[38;5;66;03m# types automatically, aligning on index in case of pandas objects\u001b[39;00m\n\u001b[1;32m--> 962\u001b[0m plot_data \u001b[38;5;241m=\u001b[39m pd\u001b[38;5;241m.\u001b[39mDataFrame(plot_data)\n\u001b[0;32m 964\u001b[0m \u001b[38;5;66;03m# Reduce the variables dictionary to fields with valid data\u001b[39;00m\n\u001b[0;32m 965\u001b[0m variables \u001b[38;5;241m=\u001b[39m {\n\u001b[0;32m 966\u001b[0m var: name\n\u001b[0;32m 967\u001b[0m \u001b[38;5;28;01mfor\u001b[39;00m var, name \u001b[38;5;129;01min\u001b[39;00m variables\u001b[38;5;241m.\u001b[39mitems()\n\u001b[0;32m 968\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m plot_data[var]\u001b[38;5;241m.\u001b[39mnotnull()\u001b[38;5;241m.\u001b[39many()\n\u001b[0;32m 969\u001b[0m }\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\frame.py:733\u001b[0m, in \u001b[0;36mDataFrame.__init__\u001b[1;34m(self, data, index, columns, dtype, copy)\u001b[0m\n\u001b[0;32m 727\u001b[0m mgr \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_init_mgr(\n\u001b[0;32m 728\u001b[0m data, axes\u001b[38;5;241m=\u001b[39m{\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mindex\u001b[39m\u001b[38;5;124m\"\u001b[39m: index, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mcolumns\u001b[39m\u001b[38;5;124m\"\u001b[39m: columns}, dtype\u001b[38;5;241m=\u001b[39mdtype, copy\u001b[38;5;241m=\u001b[39mcopy\n\u001b[0;32m 729\u001b[0m )\n\u001b[0;32m 731\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(data, \u001b[38;5;28mdict\u001b[39m):\n\u001b[0;32m 732\u001b[0m \u001b[38;5;66;03m# GH#38939 de facto copy defaults to False only in non-dict cases\u001b[39;00m\n\u001b[1;32m--> 733\u001b[0m mgr \u001b[38;5;241m=\u001b[39m dict_to_mgr(data, index, columns, dtype\u001b[38;5;241m=\u001b[39mdtype, copy\u001b[38;5;241m=\u001b[39mcopy, typ\u001b[38;5;241m=\u001b[39mmanager)\n\u001b[0;32m 734\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(data, ma\u001b[38;5;241m.\u001b[39mMaskedArray):\n\u001b[0;32m 735\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01mnumpy\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01mma\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m mrecords\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:503\u001b[0m, in \u001b[0;36mdict_to_mgr\u001b[1;34m(data, index, columns, dtype, typ, copy)\u001b[0m\n\u001b[0;32m 499\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 500\u001b[0m \u001b[38;5;66;03m# dtype check to exclude e.g. range objects, scalars\u001b[39;00m\n\u001b[0;32m 501\u001b[0m arrays \u001b[38;5;241m=\u001b[39m [x\u001b[38;5;241m.\u001b[39mcopy() \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mhasattr\u001b[39m(x, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdtype\u001b[39m\u001b[38;5;124m\"\u001b[39m) \u001b[38;5;28;01melse\u001b[39;00m x \u001b[38;5;28;01mfor\u001b[39;00m x \u001b[38;5;129;01min\u001b[39;00m arrays]\n\u001b[1;32m--> 503\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m arrays_to_mgr(arrays, columns, index, dtype\u001b[38;5;241m=\u001b[39mdtype, typ\u001b[38;5;241m=\u001b[39mtyp, consolidate\u001b[38;5;241m=\u001b[39mcopy)\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:114\u001b[0m, in \u001b[0;36marrays_to_mgr\u001b[1;34m(arrays, columns, index, dtype, verify_integrity, typ, consolidate)\u001b[0m\n\u001b[0;32m 111\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m verify_integrity:\n\u001b[0;32m 112\u001b[0m \u001b[38;5;66;03m# figure out the index, if necessary\u001b[39;00m\n\u001b[0;32m 113\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m index \u001b[38;5;129;01mis\u001b[39;00m \u001b[38;5;28;01mNone\u001b[39;00m:\n\u001b[1;32m--> 114\u001b[0m index \u001b[38;5;241m=\u001b[39m _extract_index(arrays)\n\u001b[0;32m 115\u001b[0m \u001b[38;5;28;01melse\u001b[39;00m:\n\u001b[0;32m 116\u001b[0m index \u001b[38;5;241m=\u001b[39m ensure_index(index)\n", "File \u001b[1;32md:\\ProgramData\\anaconda3\\Lib\\site-packages\\pandas\\core\\internals\\construction.py:664\u001b[0m, in \u001b[0;36m_extract_index\u001b[1;34m(data)\u001b[0m\n\u001b[0;32m 662\u001b[0m raw_lengths\u001b[38;5;241m.\u001b[39mappend(\u001b[38;5;28mlen\u001b[39m(val))\n\u001b[0;32m 663\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m \u001b[38;5;28misinstance\u001b[39m(val, np\u001b[38;5;241m.\u001b[39mndarray) \u001b[38;5;129;01mand\u001b[39;00m val\u001b[38;5;241m.\u001b[39mndim \u001b[38;5;241m>\u001b[39m \u001b[38;5;241m1\u001b[39m:\n\u001b[1;32m--> 664\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mPer-column arrays must each be 1-dimensional\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[0;32m 666\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m indexes \u001b[38;5;129;01mand\u001b[39;00m \u001b[38;5;129;01mnot\u001b[39;00m raw_lengths:\n\u001b[0;32m 667\u001b[0m \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mIf using all scalar values, you must pass an index\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n", "\u001b[1;31mValueError\u001b[0m: Per-column arrays must each be 1-dimensional" ] }, { "data": { "image/png": "", "text/plain": [ "
" ] }, "metadata": {}, "output_type": "display_data" } ], "source": [ "# 画图\n", "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "\n", "df5 = df.copy()\n", "df5 = df5[['ds','min_price','max_price','LOW_PRICE','LOW_PRICE','CREAT_DATE']]\n", "\n", "print(df5.shape)\n", "print(df5.head(10))\n", "# 画图配置\n", "plt.figure(figsize=(16,10))\n", "\n", "def get_this_week_date(end_time):\n", " endtime = end_time\n", " # endtimeweek = datetime.datetime.strptime(endtime, '%Y-%m-%d')\n", " endtimeweek = endtime\n", " up_week = endtimeweek - datetime.timedelta(days=endtimeweek.weekday() )\n", " up_week_dates = [up_week + datetime.timedelta(days=i) for i in range(7)]\n", " up_week_dates = [date.strftime('%Y-%m-%d') for date in up_week_dates]\n", " return up_week_dates\n", "\n", "# ds分组\n", "end_times = df['ds'].unique()\n", "for endtime in end_times:\n", " up_week_dates = get_this_week_date(endtime)\n", " print(up_week_dates)\n", " df6 = df5[df5['ds'].isin(up_week_dates)]\n", " print(df6.shape)\n", " print(df6.head(10))\n", " # sns画散点图\n", " sns.scatterplot(x=df6.index,y=df6['min_price'].values,data=df6)\n", " sns.scatterplot(x=df6.index,y=df6['max_price'].values,data=df6)\n", " sns.scatterplot(x=df6.index,y=df6['LOW_PRICE'].values,data=df6)\n", " sns.scatterplot(x=df6.index,y=df6['HIGH_PRICE'].values,data=df6)\n", " sns.scatterplot(x=df6.index,y=df6['HIGH_PRICE'].values,data=df6)" ] }, { "cell_type": "code", "execution_count": null, "id": "336fa6ed", "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "base", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.11.7" } }, "nbformat": 4, "nbformat_minor": 5 }