983 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
			
		
		
	
	
			983 lines
		
	
	
		
			39 KiB
		
	
	
	
		
			Plaintext
		
	
	
	
	
	
| {
 | ||
|  "cells": [
 | ||
|   {
 | ||
|    "cell_type": "code",
 | ||
|    "execution_count": null,
 | ||
|    "metadata": {
 | ||
|     "scrolled": true
 | ||
|    },
 | ||
|    "outputs": [
 | ||
|     {
 | ||
|      "data": {
 | ||
|       "text/html": [
 | ||
|        "        <script type=\"text/javascript\">\n",
 | ||
|        "        window.PlotlyConfig = {MathJaxConfig: 'local'};\n",
 | ||
|        "        if (window.MathJax && window.MathJax.Hub && window.MathJax.Hub.Config) {window.MathJax.Hub.Config({SVG: {font: \"STIX-Web\"}});}\n",
 | ||
|        "        </script>\n",
 | ||
|        "        <script type=\"module\">import \"https://cdn.plot.ly/plotly-3.0.0.min\"</script>\n",
 | ||
|        "        "
 | ||
|       ]
 | ||
|      },
 | ||
|      "metadata": {},
 | ||
|      "output_type": "display_data"
 | ||
|     }
 | ||
|    ],
 | ||
|    "source": [
 | ||
|     "import requests\n",
 | ||
|     "import json\n",
 | ||
|     "import xlrd\n",
 | ||
|     "import xlwt\n",
 | ||
|     "from datetime import datetime,timedelta\n",
 | ||
|     "import time\n",
 | ||
|     "# 变量定义\n",
 | ||
|     "login_url = \"http://10.200.32.39/jingbo-api/api/server/login\"\n",
 | ||
|     "search_url = \"http://10.200.32.39/jingbo-api/api/warehouse/dwDataItem/queryByItemNos\"\n",
 | ||
|     "\n",
 | ||
|     "login_push_url = \"http://10.200.32.39/jingbo-api/api/server/login\"\n",
 | ||
|     "upload_url = \"http://10.200.32.39/jingbo-api/api/dw/dataValue/pushDataValueList\"\n",
 | ||
|     "queryDataListItemNos_url = \"http://10.200.32.39/jingbo-api//api/warehouse/dwDataItem/queryDataListItemNos\"\n",
 | ||
|     "\n",
 | ||
|     "login_data = {\n",
 | ||
|     "    \"data\": {\n",
 | ||
|     "        \"account\": \"api_dev\",\n",
 | ||
|     "        \"password\": \"ZTEwYWRjMzk0OWJhNTlhYmJlNTZlMDU3ZjIwZjg4M2U=\",\n",
 | ||
|     "        \"tenantHashCode\": \"8a4577dbd919675758d57999a1e891fe\",\n",
 | ||
|     "        \"terminal\": \"API\"\n",
 | ||
|     "    },\n",
 | ||
|     "    \"funcModule\": \"API\",\n",
 | ||
|     "    \"funcOperation\": \"获取token\"\n",
 | ||
|     "}\n",
 | ||
|     "\n",
 | ||
|     "login_push_data = {\n",
 | ||
|     "    \"data\": {\n",
 | ||
|     "        \"account\": \"api_dev\",\n",
 | ||
|     "        \"password\": \"ZTEwYWRjMzk0OWJhNTlhYmJlNTZlMDU3ZjIwZjg4M2U=\",\n",
 | ||
|     "        \"tenantHashCode\": \"8a4577dbd919675758d57999a1e891fe\",\n",
 | ||
|     "        \"terminal\": \"API\"\n",
 | ||
|     "    },\n",
 | ||
|     "    \"funcModule\": \"API\",\n",
 | ||
|     "    \"funcOperation\": \"获取token\"\n",
 | ||
|     "}\n",
 | ||
|     "\n",
 | ||
|     "read_file_path_name = \"纯苯数据项.xls\"\n",
 | ||
|     "one_cols = []\n",
 | ||
|     "two_cols = []\n",
 | ||
|     "\n",
 | ||
|     "import pandas as pd\n",
 | ||
|     "import numpy as np\n",
 | ||
|     "import matplotlib.pyplot as plt\n",
 | ||
|     "import seaborn as sn\n",
 | ||
|     "import random\n",
 | ||
|     "import time\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "from plotly import __version__\n",
 | ||
|     "from plotly.offline import download_plotlyjs, init_notebook_mode, plot, iplot\n",
 | ||
|     "\n",
 | ||
|     "from sklearn import preprocessing\n",
 | ||
|     "\n",
 | ||
|     "from pandas import Series,DataFrame\n",
 | ||
|     "\n",
 | ||
|     "import matplotlib.pyplot as plt\n",
 | ||
|     "\n",
 | ||
|     "import sklearn.datasets as datasets\n",
 | ||
|     "\n",
 | ||
|     "#导入机器学习算法模型\n",
 | ||
|     "from sklearn.linear_model import Lasso\n",
 | ||
|     "from xgboost import XGBRegressor\n",
 | ||
|     "\n",
 | ||
|     "import statsmodels.api as sm\n",
 | ||
|     "try:\n",
 | ||
|     "    from keras.preprocessing.sequence import TimeseriesGenerator\n",
 | ||
|     "except:\n",
 | ||
|     "    from tensorflow.keras.preprocessing.sequence import TimeseriesGenerator\n",
 | ||
|     "\n",
 | ||
|     "import plotly.express as px\n",
 | ||
|     "import plotly.graph_objects as go\n",
 | ||
|     "\n",
 | ||
|     "import xgboost as xgb\n",
 | ||
|     "from xgboost import plot_importance, plot_tree\n",
 | ||
|     "from sklearn.metrics import mean_absolute_error\n",
 | ||
|     "from statsmodels.tools.eval_measures import mse,rmse\n",
 | ||
|     "from sklearn.model_selection import GridSearchCV\n",
 | ||
|     "from xgboost import XGBRegressor\n",
 | ||
|     "import warnings\n",
 | ||
|     "import pickle\n",
 | ||
|     "\n",
 | ||
|     "from sklearn.metrics import mean_squared_error\n",
 | ||
|     "\n",
 | ||
|     "#切割训练数据和样本数据\n",
 | ||
|     "from sklearn.model_selection import train_test_split\n",
 | ||
|     "\n",
 | ||
|     "#用于模型评分\n",
 | ||
|     "from sklearn.metrics import r2_score\n",
 | ||
|     "\n",
 | ||
|     "le = preprocessing.LabelEncoder()\n",
 | ||
|     "\n",
 | ||
|     "# print(__version__) # requires version >= 1.9.0\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "import cufflinks as cf\n",
 | ||
|     "cf.go_offline()\n",
 | ||
|     "\n",
 | ||
|     "random.seed(100)\n",
 | ||
|     "\n",
 | ||
|     "%matplotlib inline\n",
 | ||
|     "\n",
 | ||
|     "# 数据获取\n",
 | ||
|     "\n",
 | ||
|     "def get_head_auth():\n",
 | ||
|     "    login_res = requests.post(url=login_url, json=login_data, timeout=(3, 5))\n",
 | ||
|     "    text = json.loads(login_res.text)\n",
 | ||
|     "    if text[\"status\"]:\n",
 | ||
|     "        token = text[\"data\"][\"accessToken\"]\n",
 | ||
|     "        return token\n",
 | ||
|     "    else:\n",
 | ||
|     "        print(\"获取认证失败\")\n",
 | ||
|     "        return None\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def get_data_value(token, dataItemNoList,date):\n",
 | ||
|     "    search_data = {\n",
 | ||
|     "        \"data\": {\n",
 | ||
|     "            \"date\": getNow(date)[0],\n",
 | ||
|     "            \"dataItemNoList\": dataItemNoList\n",
 | ||
|     "        },\n",
 | ||
|     "        \"funcModule\": \"数据项\",\n",
 | ||
|     "        \"funcOperation\": \"查询\"\n",
 | ||
|     "    }\n",
 | ||
|     "    headers = {\"Authorization\": token}\n",
 | ||
|     "    search_res = requests.post(url=search_url, headers=headers, json=search_data, timeout=(3, 5))\n",
 | ||
|     "    search_value = json.loads(search_res.text)[\"data\"]\n",
 | ||
|     "    if search_value:\n",
 | ||
|     "        return search_value\n",
 | ||
|     "    else:\n",
 | ||
|     "        print(\"今天没有新数据\")\n",
 | ||
|     "        return search_value\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "# xls文件处理\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def write_xls(data,date):\n",
 | ||
|     "    # 创建一个Workbook对象\n",
 | ||
|     "    workbook = xlwt.Workbook()\n",
 | ||
|     "\n",
 | ||
|     "    # 创建一个Sheet对象,可指定名称\n",
 | ||
|     "    sheet = workbook.load('Sheet1')\n",
 | ||
|     "\n",
 | ||
|     "    # 写入数据行\n",
 | ||
|     "    for row_index, row_data in enumerate(data):\n",
 | ||
|     "        for col_index, cell_data in enumerate(row_data):\n",
 | ||
|     "            sheet.write(row_index, col_index, cell_data)\n",
 | ||
|     "\n",
 | ||
|     "    # 保存Workbook到文件\n",
 | ||
|     "    workbook.save(get_cur_time(date)[0] + '.xls')\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def getNow(date='', offset=0):\n",
 | ||
|     "    \"\"\"生成指定日期的两种格式字符串\n",
 | ||
|     "    Args:\n",
 | ||
|     "        date: 支持多种输入类型:\n",
 | ||
|     "            - datetime对象\n",
 | ||
|     "            - 字符串格式(支持'%Y-%m-%d'和'%Y%m%d')\n",
 | ||
|     "            - 空字符串表示当前日期\n",
 | ||
|     "        offset: 日期偏移天数\n",
 | ||
|     "    Returns:\n",
 | ||
|     "        tuple: (紧凑日期字符串, 标准日期字符串)\n",
 | ||
|     "    \"\"\"\n",
 | ||
|     "    # 日期解析逻辑\n",
 | ||
|     "    from datetime import datetime,timedelta\n",
 | ||
|     "    if isinstance(date, datetime):\n",
 | ||
|     "        now = date\n",
 | ||
|     "    else:\n",
 | ||
|     "        now = datetime.now()\n",
 | ||
|     "        if date:\n",
 | ||
|     "            # 尝试多种日期格式解析\n",
 | ||
|     "            for fmt in ('%Y-%m-%d', '%Y%m%d', '%Y/%m/%d'):\n",
 | ||
|     "                try:\n",
 | ||
|     "                    now = datetime.strptime(str(date), fmt)\n",
 | ||
|     "                    break\n",
 | ||
|     "                except ValueError:\n",
 | ||
|     "                    continue\n",
 | ||
|     "            else:\n",
 | ||
|     "                raise ValueError(f\"无法解析的日期格式: {date}\")\n",
 | ||
|     "\n",
 | ||
|     "    # 应用日期偏移\n",
 | ||
|     "    now = now - timedelta(days=offset)\n",
 | ||
|     "    \n",
 | ||
|     "    # 统一格式化输出\n",
 | ||
|     "    date_str = now.strftime(\"%Y-%m-%d\")\n",
 | ||
|     "    compact_date = date_str.replace(\"-\", \"\")\n",
 | ||
|     "    return compact_date, date_str\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def get_cur_time(date=''):\n",
 | ||
|     "    if date == '':\n",
 | ||
|     "        now = datetime.now()\n",
 | ||
|     "    # 如果是字符串,尝试解析日期\n",
 | ||
|     "    elif isinstance(date, str):\n",
 | ||
|     "        now = datetime.strptime(date, '%Y-%m-%d')\n",
 | ||
|     "    else:\n",
 | ||
|     "        now = date\n",
 | ||
|     "    year = now.year\n",
 | ||
|     "    month = now.month\n",
 | ||
|     "    day = now.day\n",
 | ||
|     "\n",
 | ||
|     "    if month < 10:\n",
 | ||
|     "        month = \"0\" + str(month)\n",
 | ||
|     "    if day < 10:\n",
 | ||
|     "        day = \"0\" + str(day)\n",
 | ||
|     "    cur_time = str(year) + str(month) + str(day)\n",
 | ||
|     "    cur_time2 = str(year) + \"-\" + str(month) + \"-\" + str(day)\n",
 | ||
|     "    return cur_time, cur_time2\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def get_head_push_auth():\n",
 | ||
|     "    login_res = requests.post(url=login_push_url, json=login_push_data, timeout=(3, 5))\n",
 | ||
|     "    text = json.loads(login_res.text)\n",
 | ||
|     "    if text[\"status\"]:\n",
 | ||
|     "        token = text[\"data\"][\"accessToken\"]\n",
 | ||
|     "        return token\n",
 | ||
|     "    else:\n",
 | ||
|     "        print(\"获取认证失败\")\n",
 | ||
|     "        return None\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def upload_data_to_system(token_push,date):\n",
 | ||
|     "    datavalue = forecast_price()\n",
 | ||
|     "    data = {\n",
 | ||
|     "        \"funcModule\": \"数据表信息列表\",\n",
 | ||
|     "        \"funcOperation\": \"新增\",\n",
 | ||
|     "        \"data\": [\n",
 | ||
|     "            {\"dataItemNo\": \"C01100047|FORECAST_PRICE\",\n",
 | ||
|     "             \"dataDate\": getNow(date)[0],\n",
 | ||
|     "             \"dataStatus\": \"add\",\n",
 | ||
|     "             \"dataValue\": datavalue\n",
 | ||
|     "             }\n",
 | ||
|     "\n",
 | ||
|     "        ]\n",
 | ||
|     "    }\n",
 | ||
|     "    print(data)\n",
 | ||
|     "    headers = {\"Authorization\": token_push}\n",
 | ||
|     "    res = requests.post(url=upload_url, headers=headers, json=data, timeout=(3, 5))\n",
 | ||
|     "    print(res.text)\n",
 | ||
|     "\n",
 | ||
|     "   \n",
 | ||
|     "    \n",
 | ||
|     "def forecast_price():\n",
 | ||
|     "    # df_test = pd.read_csv('定价模型数据收集0212.csv')\n",
 | ||
|     "    df_test = pd.read_excel('纯苯数据项.xls',sheet_name='Sheet1')\n",
 | ||
|     "    df_test.drop([0],inplace=True)\n",
 | ||
|     "    # df_test['Date']=pd.to_datetime(df_test['Date'],  format='%m/%d/%Y',infer_datetime_format=True)\n",
 | ||
|     "    df_test['Date']=pd.to_datetime(df_test['Date'],  format=r'%Y-%m-%d',infer_datetime_format=True)\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "    df_test_1 = df_test\n",
 | ||
|     "    df_test_1=df_test_1.fillna(df_test.ffill())\n",
 | ||
|     "    df_test_1=df_test_1.fillna(df_test_1.bfill())\n",
 | ||
|     "\n",
 | ||
|     "    # 选择用于模型训练的列名称\n",
 | ||
|     "    col_for_training = df_test_1.columns\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "    import joblib\n",
 | ||
|     "    Best_model_DalyLGPrice = joblib.load(\"日度价格预测_最佳模型.pkl\")\n",
 | ||
|     "    # 最新的一天为最后一行的数据\n",
 | ||
|     "   \n",
 | ||
|     "    df_test_1_Day = df_test_1.tail(1)\n",
 | ||
|     "    # 移除不需要的列\n",
 | ||
|     "    df_test_1_Day.index = df_test_1_Day[\"Date\"]\n",
 | ||
|     "    df_test_1_Day = df_test_1_Day.drop([\"Date\"], axis= 1)\n",
 | ||
|     "    df_test_1_Day=df_test_1_Day.drop('Price',axis=1)\n",
 | ||
|     "    df_test_1_Day=df_test_1_Day.dropna()\n",
 | ||
|     "\n",
 | ||
|     "    for col in df_test_1_Day.columns:\n",
 | ||
|     "        df_test_1_Day[col] = pd.to_numeric(df_test_1_Day[col],errors='coerce')\n",
 | ||
|     "    #预测今日价格,显示至小数点后两位\n",
 | ||
|     "    Ypredict_Today=Best_model_DalyLGPrice.predict(df_test_1_Day)\n",
 | ||
|     "\n",
 | ||
|     "    df_test_1_Day['日度预测价格']=Ypredict_Today\n",
 | ||
|     "    print(df_test_1_Day['日度预测价格'])\n",
 | ||
|     "    a = df_test_1_Day['日度预测价格']\n",
 | ||
|     "    a = a[0]\n",
 | ||
|     "    a = float(a)\n",
 | ||
|     "    a = round(a,2)\n",
 | ||
|     "    return a\n",
 | ||
|     "def optimize_Model():\n",
 | ||
|     "    from sklearn.model_selection import train_test_split\n",
 | ||
|     "    from sklearn.impute  import SimpleImputer\n",
 | ||
|     "    from sklearn.preprocessing import OrdinalEncoder\n",
 | ||
|     "    from sklearn.feature_selection import SelectFromModel\n",
 | ||
|     "    from sklearn.metrics import mean_squared_error, r2_score\n",
 | ||
|     "    import pandas as pd\n",
 | ||
|     "\n",
 | ||
|     "    pd.set_option('display.max_rows',40)  \n",
 | ||
|     "    pd.set_option('display.max_columns',40)  \n",
 | ||
|     "    df_test = pd.read_excel('纯苯数据项.xls')\n",
 | ||
|     "    df_test.drop([0],inplace=True)\n",
 | ||
|     "    # df_test['Date']=pd.to_datetime(df_test['Date'],  format='%m/%d/%Y',infer_datetime_format=True)\n",
 | ||
|     "    df_test['Date']=pd.to_datetime(df_test['Date'],  format='%Y-%m-%d',infer_datetime_format=True)\n",
 | ||
|     "\n",
 | ||
|     "    \n",
 | ||
|     "    #将缺失值补为前一个或者后一个数值\n",
 | ||
|     "    df_test_1 = df_test\n",
 | ||
|     "    df_test_1=df_test_1.fillna(df_test.ffill())\n",
 | ||
|     "    df_test_1=df_test_1.fillna(df_test_1.bfill())\n",
 | ||
|     "    df_test_1[\"Date\"] = pd.to_datetime(df_test_1[\"Date\"])\n",
 | ||
|     "    df_test_1.index = df_test_1[\"Date\"]\n",
 | ||
|     "    df_test_1 = df_test_1.drop([\"Date\"], axis= 1)\n",
 | ||
|     "    df_test_1 = df_test_1.astype('float')\n",
 | ||
|     "    \n",
 | ||
|     "    \n",
 | ||
|     "    import numpy as np\n",
 | ||
|     "    import pandas as pd\n",
 | ||
|     "    from pandas import Series,DataFrame\n",
 | ||
|     "\n",
 | ||
|     "    import matplotlib.pyplot as plt\n",
 | ||
|     "\n",
 | ||
|     "    import sklearn.datasets as datasets\n",
 | ||
|     "\n",
 | ||
|     "    #导入机器学习算法模型\n",
 | ||
|     "    from sklearn.linear_model import Lasso\n",
 | ||
|     "    from xgboost import XGBRegressor\n",
 | ||
|     "\n",
 | ||
|     "    import statsmodels.api as sm\n",
 | ||
|     "    try:\n",
 | ||
|     "        from keras.preprocessing.sequence import TimeseriesGenerator\n",
 | ||
|     "    except:\n",
 | ||
|     "        from tensorflow.keras.preprocessing.sequence import TimeseriesGenerator\n",
 | ||
|     "\n",
 | ||
|     "    import plotly.express as px\n",
 | ||
|     "    import plotly.graph_objects as go\n",
 | ||
|     "\n",
 | ||
|     "    import xgboost as xgb\n",
 | ||
|     "    from xgboost import plot_importance, plot_tree\n",
 | ||
|     "    from sklearn.metrics import mean_absolute_error\n",
 | ||
|     "    from statsmodels.tools.eval_measures import mse,rmse\n",
 | ||
|     "    from sklearn.model_selection import GridSearchCV\n",
 | ||
|     "    from xgboost import XGBRegressor\n",
 | ||
|     "    import warnings\n",
 | ||
|     "    import pickle\n",
 | ||
|     "\n",
 | ||
|     "    from sklearn.metrics import mean_squared_error\n",
 | ||
|     "\n",
 | ||
|     "    #切割训练数据和样本数据\n",
 | ||
|     "    from sklearn.model_selection import train_test_split\n",
 | ||
|     "\n",
 | ||
|     "    #用于模型评分\n",
 | ||
|     "    from sklearn.metrics import r2_score\n",
 | ||
|     "\n",
 | ||
|     "    dataset1=df_test_1.drop('Price',axis=1)#.astype(float)\n",
 | ||
|     "\n",
 | ||
|     "    y=df_test_1['Price']\n",
 | ||
|     "\n",
 | ||
|     "    x=dataset1 \n",
 | ||
|     "\n",
 | ||
|     "    train = x\n",
 | ||
|     "    target = y\n",
 | ||
|     "\n",
 | ||
|     "    #切割数据样本集合测试集\n",
 | ||
|     "    X_train,x_test,y_train,y_true = train_test_split(train,target,test_size=0.2,random_state=0)\n",
 | ||
|     "\n",
 | ||
|     "    #模型缩写\n",
 | ||
|     "    Lasso =  Lasso(random_state=0)\n",
 | ||
|     "    XGBR = XGBRegressor(random_state=0)\n",
 | ||
|     "    #训练模型\n",
 | ||
|     "    Lasso.fit(X_train,y_train)\n",
 | ||
|     "    XGBR.fit(X_train,y_train)\n",
 | ||
|     "    #模型拟合\n",
 | ||
|     "    y_pre_Lasso = Lasso.predict(x_test)\n",
 | ||
|     "    y_pre_XGBR = XGBR.predict(x_test)\n",
 | ||
|     "\n",
 | ||
|     "    #计算Lasso、XGBR、RandomForestR、AdaBoostR、GradientBoostingR、BaggingRegressor各模型的R²\n",
 | ||
|     "    Lasso_score = r2_score(y_true,y_pre_Lasso)\n",
 | ||
|     "    XGBR_score=r2_score(y_true,y_pre_XGBR)\n",
 | ||
|     "\n",
 | ||
|     "    #计算Lasso、XGBR的MSE和RMSE\n",
 | ||
|     "    Lasso_MSE=mean_squared_error(y_true, y_pre_Lasso)\n",
 | ||
|     "    XGBR_MSE=mean_squared_error(y_true, y_pre_XGBR)\n",
 | ||
|     "\n",
 | ||
|     "    Lasso_RMSE=np.sqrt(Lasso_MSE)\n",
 | ||
|     "    XGBR_RMSE=np.sqrt(XGBR_MSE)\n",
 | ||
|     "    # 将不同模型的不同误差值整合成一个表格\n",
 | ||
|     "    model_results = pd.DataFrame([['Lasso', Lasso_RMSE, Lasso_score],\n",
 | ||
|     "                                 ['XgBoost', XGBR_RMSE, XGBR_score]],\n",
 | ||
|     "                   columns = ['模型(Model)','均方根误差(RMSE)', 'R^2 score'])\n",
 | ||
|     "    #将模型名称(Model)列设置为索引\n",
 | ||
|     "    model_results1=model_results.set_index('模型(Model)')\n",
 | ||
|     "\n",
 | ||
|     "    model_results1\n",
 | ||
|     "    #定义plot_feature_importance函数,该函数用于计算特征重要性。此部分代码无需调整\n",
 | ||
|     "    def plot_feature_importance(importance,names,model_type):\n",
 | ||
|     "        feature_importance = np.array(importance)\n",
 | ||
|     "        feature_names = np.array(names)\n",
 | ||
|     "\n",
 | ||
|     "        data={'feature_names':feature_names,'feature_importance':feature_importance}\n",
 | ||
|     "        fi_df = pd.DataFrame(data)\n",
 | ||
|     "\n",
 | ||
|     "        fi_df.sort_values(by=['feature_importance'], ascending=False,inplace=True)\n",
 | ||
|     "\n",
 | ||
|     "        plt.figure(figsize=(10,8))\n",
 | ||
|     "        sn.barplot(x=fi_df['feature_importance'], y=fi_df['feature_names'])\n",
 | ||
|     "\n",
 | ||
|     "        plt.title(model_type + \" \"+'FEATURE IMPORTANCE')\n",
 | ||
|     "        plt.xlabel('FEATURE IMPORTANCE')\n",
 | ||
|     "        plt.ylabel('FEATURE NAMES')\n",
 | ||
|     "        from pylab import mpl\n",
 | ||
|     "    %pylab\n",
 | ||
|     "    mpl.rcParams['font.sans-serif'] = ['SimHei']\n",
 | ||
|     "    ## Xgboost 模型参数优化-初步\n",
 | ||
|     "    #参考: https://juejin.im/post/6844903661013827598 \n",
 | ||
|     "    #每次调参时,备选参数数值以同数量级的1、3、10设置即可(比如设置1、3、10,或0.1、0.3、1.0,或0.01,0.03,0.10即可)\n",
 | ||
|     "\n",
 | ||
|     "    from xgboost import XGBRegressor\n",
 | ||
|     "    from sklearn.model_selection import GridSearchCV\n",
 | ||
|     "\n",
 | ||
|     "    estimator = XGBRegressor(random_state=0,\n",
 | ||
|     "        nthread=4,\n",
 | ||
|     "        seed=0\n",
 | ||
|     "    )\n",
 | ||
|     "    parameters = {\n",
 | ||
|     "        'max_depth': range (2, 11, 2),     # 树的最大深度\n",
 | ||
|     "        'n_estimators': range (50, 101, 10),  # 迭代次数\n",
 | ||
|     "        'learning_rate': [0.01, 0.03, 0.1, 0.3, 0.5, 1]\n",
 | ||
|     "    }\n",
 | ||
|     "\n",
 | ||
|     "    grid_search_XGB = GridSearchCV(\n",
 | ||
|     "        estimator=estimator,\n",
 | ||
|     "        param_grid=parameters,\n",
 | ||
|     "    #     n_jobs = 10,\n",
 | ||
|     "        cv = 3,\n",
 | ||
|     "        verbose=True\n",
 | ||
|     "    )\n",
 | ||
|     "\n",
 | ||
|     "    grid_search_XGB.fit(X_train, y_train)\n",
 | ||
|     "    #如果电脑在此步骤报错,可能是因为计算量太大,超过硬件可支持程度,可注释掉“n_jobs=10”一行\n",
 | ||
|     "\n",
 | ||
|     "    best_parameters = grid_search_XGB.best_estimator_.get_params()\n",
 | ||
|     "    y_pred = grid_search_XGB.predict(x_test)\n",
 | ||
|     "\n",
 | ||
|     "    op_XGBR_score = r2_score(y_true,y_pred)\n",
 | ||
|     "    op_XGBR_MSE= mean_squared_error(y_true, y_pred)\n",
 | ||
|     "    op_XGBR_RMSE= np.sqrt(op_XGBR_MSE)\n",
 | ||
|     "\n",
 | ||
|     "    model_results2 = pd.DataFrame([['Optimized_Xgboost', op_XGBR_RMSE, op_XGBR_score]],\n",
 | ||
|     "                   columns = ['模型(Model)', '均方根误差(RMSE)', 'R^2 score'])\n",
 | ||
|     "    model_results2=model_results2.set_index('模型(Model)')\n",
 | ||
|     "\n",
 | ||
|     "    # results = model_results1.append(model_results2, ignore_index = False)\n",
 | ||
|     "    results = pd.concat([model_results1,model_results2],ignore_index=True)\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "    import pickle\n",
 | ||
|     "\n",
 | ||
|     "    Pkl_Filename = \"日度价格预测_最佳模型.pkl\"  \n",
 | ||
|     "\n",
 | ||
|     "    with open(Pkl_Filename, 'wb') as file:  \n",
 | ||
|     "       pickle.dump(grid_search_XGB, file)\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "   \n",
 | ||
|     "\n",
 | ||
|     "def read_xls_data():\n",
 | ||
|     "    global one_cols, two_cols\n",
 | ||
|     "    # 打开 XLS 文件\n",
 | ||
|     "    workbook = xlrd.open_workbook(read_file_path_name)\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有表格名称\n",
 | ||
|     "    # sheet_names = workbook.sheet_names()\n",
 | ||
|     "\n",
 | ||
|     "    # 选择第一个表格\n",
 | ||
|     "    sheet = workbook.sheet_by_index(0)\n",
 | ||
|     "\n",
 | ||
|     "    # 获取行数和列数\n",
 | ||
|     "    num_rows = sheet.nrows\n",
 | ||
|     "    # num_cols = sheet.ncols\n",
 | ||
|     "\n",
 | ||
|     "    # 遍历每一行,获取单元格数据\n",
 | ||
|     "    # for i in range(num_rows):\n",
 | ||
|     "    #     row_data = sheet.row_values(i)\n",
 | ||
|     "    #     one_cols.append(row_data)\n",
 | ||
|     "    #     two_cols.append(row_data[1])\n",
 | ||
|     "\n",
 | ||
|     "    row_data = sheet.row_values(1)\n",
 | ||
|     "    print(f'获取到的数据项ID{row_data}')\n",
 | ||
|     "    one_cols = row_data[1:]\n",
 | ||
|     "    print(f'获取到的数据项ID{one_cols}')\n",
 | ||
|     "\n",
 | ||
|     "    # 关闭 XLS 文件\n",
 | ||
|     "    # workbook.close()\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def start(date=None,token=None,token_push=None):\n",
 | ||
|     "    read_xls_data()\n",
 | ||
|     "    if date == None:\n",
 | ||
|     "        date = getNow()[0]\n",
 | ||
|     "    if token == None:\n",
 | ||
|     "        token = get_head_auth()\n",
 | ||
|     "        token_push = get_head_push_auth()\n",
 | ||
|     "\n",
 | ||
|     "    datas = get_data_value(token, one_cols,date)\n",
 | ||
|     "    if not datas:\n",
 | ||
|     "        print(\"今天没有新数据\")\n",
 | ||
|     "        return\n",
 | ||
|     "\n",
 | ||
|     "    # data_list = [two_cols, one_cols]\n",
 | ||
|     "    append_rows = [getNow(date)[1]]\n",
 | ||
|     "#     append_rows = [getNow()[1]]\n",
 | ||
|     "    dataItemNo_dataValue = {}\n",
 | ||
|     "    for data_value in datas:\n",
 | ||
|     "        if \"dataValue\" not in data_value:\n",
 | ||
|     "            print(data_value)\n",
 | ||
|     "            dataItemNo_dataValue[data_value[\"dataItemNo\"]] = \"\"\n",
 | ||
|     "        else:\n",
 | ||
|     "            dataItemNo_dataValue[data_value[\"dataItemNo\"]] = data_value[\"dataValue\"]\n",
 | ||
|     "       \n",
 | ||
|     "    for value in one_cols:\n",
 | ||
|     "        if value in dataItemNo_dataValue:\n",
 | ||
|     "            append_rows.append(dataItemNo_dataValue[value])\n",
 | ||
|     "        else:\n",
 | ||
|     "            append_rows.append(\"\")\n",
 | ||
|     "    save_xls(append_rows)\n",
 | ||
|     "    \n",
 | ||
|     "    # 获取当月的数据写入到指定文件,如果是补充数据,不需要执行\n",
 | ||
|     "    queryDataListItemNos()\n",
 | ||
|     "    # 模型训练\n",
 | ||
|     "    optimize_Model()\n",
 | ||
|     "    # 上传预测数据\n",
 | ||
|     "    upload_data_to_system(token_push,date)\n",
 | ||
|     "    # data_list.append(three_cols)\n",
 | ||
|     "    # write_xls(data_list)\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def start_1(date=None):\n",
 | ||
|     "    read_xls_data()\n",
 | ||
|     "    if date == None:\n",
 | ||
|     "        date = getNow(offset=1)[0]\n",
 | ||
|     "    token = get_head_auth()\n",
 | ||
|     "    if not token:\n",
 | ||
|     "        return\n",
 | ||
|     "    \n",
 | ||
|     "\n",
 | ||
|     "    datas = get_data_value(token, one_cols,date=date)\n",
 | ||
|     "#     if not datas:\n",
 | ||
|     "#         return\n",
 | ||
|     "\n",
 | ||
|     "    # data_list = [two_cols, one_cols]\n",
 | ||
|     "    append_rows = [getNow(offset=1)[1]]\n",
 | ||
|     "    dataItemNo_dataValue = {}\n",
 | ||
|     "    for data_value in datas:\n",
 | ||
|     "        if \"dataValue\" not in data_value:\n",
 | ||
|     "            print(data_value)\n",
 | ||
|     "            dataItemNo_dataValue[data_value[\"dataItemNo\"]] = \"\"\n",
 | ||
|     "        else:\n",
 | ||
|     "            dataItemNo_dataValue[data_value[\"dataItemNo\"]] = data_value[\"dataValue\"]\n",
 | ||
|     "       \n",
 | ||
|     "    for value in one_cols:\n",
 | ||
|     "        if value in dataItemNo_dataValue:\n",
 | ||
|     "            append_rows.append(dataItemNo_dataValue[value])\n",
 | ||
|     "        else:\n",
 | ||
|     "            append_rows.append(\"\")\n",
 | ||
|     "    save_xls_1(append_rows)\n",
 | ||
|     "\n",
 | ||
|     "    \n",
 | ||
|     "    # data_list.append(three_cols)\n",
 | ||
|     "    # write_xls(data_list)\n",
 | ||
|     "    \n",
 | ||
|     "def save_xls_1(append_rows):\n",
 | ||
|     "\n",
 | ||
|     "    # 打开xls文件\n",
 | ||
|     "    workbook = xlrd.open_workbook('纯苯数据项.xls')\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的个数\n",
 | ||
|     "    sheet_count = len(workbook.sheet_names())\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的名称\n",
 | ||
|     "    sheet_names = workbook.sheet_names()\n",
 | ||
|     "\n",
 | ||
|     "    new_workbook = xlwt.Workbook()\n",
 | ||
|     "    for i in range(sheet_count):\n",
 | ||
|     "        # 获取当前sheet\n",
 | ||
|     "        sheet = workbook.sheet_by_index(i)\n",
 | ||
|     "\n",
 | ||
|     "        # 获取sheet的行数和列数\n",
 | ||
|     "        row_count = sheet.nrows - 1\n",
 | ||
|     "        col_count = sheet.ncols\n",
 | ||
|     "        # 获取原有数据\n",
 | ||
|     "        data = []\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            row_data = []\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                row_data.append(sheet.cell_value(row, col))\n",
 | ||
|     "            data.append(row_data)\n",
 | ||
|     "        # 创建xlwt的Workbook对象\n",
 | ||
|     "        # 创建sheet\n",
 | ||
|     "        new_sheet = new_workbook.add_sheet(sheet_names[i])\n",
 | ||
|     "\n",
 | ||
|     "        # 将原有的数据写入新的sheet\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                new_sheet.write(row, col, data[row][col])\n",
 | ||
|     "\n",
 | ||
|     "        if i == 0:\n",
 | ||
|     "            # 在新的sheet中添加数据\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                new_sheet.write(row_count, col, append_rows[col])\n",
 | ||
|     "\n",
 | ||
|     "    # 保存新的xls文件\n",
 | ||
|     "    new_workbook.save(\"纯苯数据项.xls\")    \n",
 | ||
|     "\n",
 | ||
|     "    \n",
 | ||
|     "    \n",
 | ||
|     "    \n",
 | ||
|     "def check_data(dataItemNo):\n",
 | ||
|     "    token = get_head_auth()\n",
 | ||
|     "    if not token:\n",
 | ||
|     "        return\n",
 | ||
|     "\n",
 | ||
|     "    datas = get_data_value(token, dataItemNo)\n",
 | ||
|     "    if not datas:\n",
 | ||
|     "        return\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def save_xls(append_rows):\n",
 | ||
|     "\n",
 | ||
|     "    # 打开xls文件\n",
 | ||
|     "    workbook = xlrd.open_workbook('纯苯数据项.xls')\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的个数\n",
 | ||
|     "    sheet_count = len(workbook.sheet_names())\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的名称\n",
 | ||
|     "    sheet_names = workbook.sheet_names()\n",
 | ||
|     "\n",
 | ||
|     "    new_workbook = xlwt.Workbook()\n",
 | ||
|     "    for i in range(sheet_count):\n",
 | ||
|     "        # 获取当前sheet\n",
 | ||
|     "        sheet = workbook.sheet_by_index(i)\n",
 | ||
|     "\n",
 | ||
|     "        # 获取sheet的行数和列数\n",
 | ||
|     "        row_count = sheet.nrows\n",
 | ||
|     "        col_count = sheet.ncols\n",
 | ||
|     "        # 获取原有数据\n",
 | ||
|     "        data = []\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            row_data = []\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                row_data.append(sheet.cell_value(row, col))\n",
 | ||
|     "            data.append(row_data)\n",
 | ||
|     "        # 创建xlwt的Workbook对象\n",
 | ||
|     "        # 创建sheet\n",
 | ||
|     "        new_sheet = new_workbook.add_sheet(sheet_names[i])\n",
 | ||
|     "\n",
 | ||
|     "        # 将原有的数据写入新的sheet\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                new_sheet.write(row, col, data[row][col])\n",
 | ||
|     "\n",
 | ||
|     "        if i == 0:\n",
 | ||
|     "            # 在新的sheet中添加数据\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                new_sheet.write(row_count, col, append_rows[col])\n",
 | ||
|     "\n",
 | ||
|     "    # 保存新的xls文件\n",
 | ||
|     "    new_workbook.save(\"纯苯数据项.xls\")\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def get_queryDataListItemNos_value(token, url, dataItemNoList, dateStart, dateEnd):\n",
 | ||
|     "\n",
 | ||
|     "    search_data = {\n",
 | ||
|     "        \"funcModule\": \"数据项\",\n",
 | ||
|     "        \"funcOperation\": \"查询\",\n",
 | ||
|     "        \"data\": {\n",
 | ||
|     "            \"dateStart\": dateStart,\n",
 | ||
|     "            \"dateEnd\": dateEnd,\n",
 | ||
|     "            \"dataItemNoList\": dataItemNoList  # 数据项编码,代表 brent最低价和最高价\n",
 | ||
|     "        }\n",
 | ||
|     "    }\n",
 | ||
|     "\n",
 | ||
|     "    headers = {\"Authorization\": token}\n",
 | ||
|     "    search_res = requests.post(url=url, headers=headers, json=search_data, timeout=(3, 5))\n",
 | ||
|     "    search_value = json.loads(search_res.text)[\"data\"]\n",
 | ||
|     "    if search_value:\n",
 | ||
|     "        return search_value\n",
 | ||
|     "    else:\n",
 | ||
|     "        return None\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def save_queryDataListItemNos_xls(data_df,dataItemNoList):\n",
 | ||
|     "    from datetime import datetime,timedelta\n",
 | ||
|     "    current_year_month = datetime.now().strftime('%Y-%m')\n",
 | ||
|     "    grouped = data_df.groupby(\"dataDate\")\n",
 | ||
|     "\n",
 | ||
|     "    # 打开xls文件\n",
 | ||
|     "    workbook = xlrd.open_workbook('纯苯数据项.xls')\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的个数\n",
 | ||
|     "    sheet_count = len(workbook.sheet_names())\n",
 | ||
|     "\n",
 | ||
|     "    # 获取所有sheet的名称\n",
 | ||
|     "    sheet_names = workbook.sheet_names()\n",
 | ||
|     "\n",
 | ||
|     "    new_workbook = xlwt.Workbook()\n",
 | ||
|     "    for i in range(sheet_count):\n",
 | ||
|     "        # 获取当前sheet\n",
 | ||
|     "        sheet = workbook.sheet_by_index(i)\n",
 | ||
|     "\n",
 | ||
|     "        # 获取sheet的行数和列数\n",
 | ||
|     "        row_count = sheet.nrows\n",
 | ||
|     "        col_count = sheet.ncols\n",
 | ||
|     "        # 获取原有数据\n",
 | ||
|     "        data = []\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            row_data = []\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                row_data.append(sheet.cell_value(row, col))\n",
 | ||
|     "            data.append(row_data)\n",
 | ||
|     "\n",
 | ||
|     "        # 创建xlwt的Workbook对象\n",
 | ||
|     "        # 创建sheet\n",
 | ||
|     "        new_sheet = new_workbook.add_sheet(sheet_names[i])\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "        current_year_month_row = 0\n",
 | ||
|     "        # 将原有的数据写入新的sheet\n",
 | ||
|     "        for row in range(row_count):\n",
 | ||
|     "            for col in range(col_count):\n",
 | ||
|     "                col0 = data[row][0]\n",
 | ||
|     "                # print(\"col0\",col0[:7])\n",
 | ||
|     "                if col0[:7] == current_year_month:\n",
 | ||
|     "                    current_year_month_row += 1\n",
 | ||
|     "                    break\n",
 | ||
|     "                new_sheet.write(row, col, data[row][col])\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "        # print(\"current_year_month_row\",current_year_month_row)\n",
 | ||
|     "        if i == 0:\n",
 | ||
|     "            rowFlag = 0\n",
 | ||
|     "            # 查看每组数据\n",
 | ||
|     "            for date, group in grouped:\n",
 | ||
|     "                new_sheet.write(row_count + rowFlag - current_year_month_row, 0, date)\n",
 | ||
|     "                for j in range(len(dataItemNoList)):\n",
 | ||
|     "                    dataItemNo = dataItemNoList[j]\n",
 | ||
|     "\n",
 | ||
|     "                    if group[group[\"dataItemNo\"] == dataItemNo][\"dataValue\"].values and (not str(group[group[\"dataItemNo\"] == dataItemNo][\"dataValue\"].values[0]) == 'nan'):\n",
 | ||
|     "\n",
 | ||
|     "                        new_sheet.write(row_count + rowFlag - current_year_month_row, j + 1, group[group[\"dataItemNo\"] == dataItemNo][\"dataValue\"].values[0])\n",
 | ||
|     "\n",
 | ||
|     "                rowFlag += 1\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "    # 保存新的xls文件\n",
 | ||
|     "    new_workbook.save(\"纯苯数据项.xls\")\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "def queryDataListItemNos(date=None,token=None):\n",
 | ||
|     "    from datetime import datetime, timedelta\n",
 | ||
|     "    df = pd.read_excel('纯苯数据项.xls')\n",
 | ||
|     "    dataItemNoList = df.iloc[0].tolist()[1:]\n",
 | ||
|     "    if token is None:\n",
 | ||
|     "        token = get_head_auth()\n",
 | ||
|     "        if not token:\n",
 | ||
|     "            print('token获取失败')\n",
 | ||
|     "            return\n",
 | ||
|     "    # 获取当前日期\n",
 | ||
|     "    if date is None:\n",
 | ||
|     "        current_date = datetime.now()\n",
 | ||
|     "    else:\n",
 | ||
|     "        current_date = date\n",
 | ||
|     "    # 获取当月1日\n",
 | ||
|     "    first_day_of_month = current_date.replace(day=1)\n",
 | ||
|     "    # 格式化为 YYYYMMDD 格式\n",
 | ||
|     "    dateEnd = current_date.strftime('%Y%m%d')\n",
 | ||
|     "    dateStart = first_day_of_month.strftime('%Y%m%d')\n",
 | ||
|     "    search_value = get_queryDataListItemNos_value(token, queryDataListItemNos_url, dataItemNoList, dateStart, dateEnd)\n",
 | ||
|     "    data_df = pd.DataFrame(search_value)\n",
 | ||
|     "    data_df[\"dataDate\"] = pd.to_datetime(data_df[\"dataDate\"])\n",
 | ||
|     "    data_df[\"dataDate\"] = data_df[\"dataDate\"].dt.strftime('%Y-%m-%d')\n",
 | ||
|     "    save_queryDataListItemNos_xls(data_df,dataItemNoList)\n",
 | ||
|     "    print('当月数据更新完成')\n",
 | ||
|     "\n",
 | ||
|     "\n",
 | ||
|     "if __name__ == \"__main__\":\n",
 | ||
|     "    print('运行中ing')\n",
 | ||
|     "\n",
 | ||
|     "    # 每天定时12点运行\n",
 | ||
|     "    while True:\n",
 | ||
|     "        # 获取当前时间\n",
 | ||
|     "        current_time = time.strftime(\"%H:%M:%S\", time.localtime())\n",
 | ||
|     "        current_time_1 = time.strftime(\"%H:%M:%S\", time.localtime())\n",
 | ||
|     "        \n",
 | ||
|     "        current_time = time.strftime(\"%H:%M:%S\", time.localtime())\n",
 | ||
|     "        try:\n",
 | ||
|     "            # 判断当前时间是否为执行任务的时间点\n",
 | ||
|     "            if current_time == \"09:16:00\":\n",
 | ||
|     "                print(\"执行定时任务\")\n",
 | ||
|     "                start()\n",
 | ||
|     "            elif current_time == \"09:21:00\":\n",
 | ||
|     "                print(\"执行定时任务\")\n",
 | ||
|     "                start()\n",
 | ||
|     "            time.sleep(1)\n",
 | ||
|     "        except:\n",
 | ||
|     "            print(f\"{current_time}执行失败\")\n",
 | ||
|     "\n",
 | ||
|     "# start()\n",
 | ||
|     "#     # 检测数据准确性, 需要检测放开\n",
 | ||
|     "#     # check_data(\"100028098|LISTING_PRICE\")\n",
 | ||
|     "#     # check_data(\"9137070016544622XB|DAY_Yield\")\n"
 | ||
|    ]
 | ||
|   },
 | ||
|   {
 | ||
|    "cell_type": "code",
 | ||
|    "execution_count": null,
 | ||
|    "metadata": {
 | ||
|     "scrolled": true
 | ||
|    },
 | ||
|    "outputs": [
 | ||
|     {
 | ||
|      "name": "stdout",
 | ||
|      "output_type": "stream",
 | ||
|      "text": [
 | ||
|       "20250601\n",
 | ||
|       "获取到的数据项ID['数据项编码', 'C01100047|STRIKE_PRICE', 'Brentspj', '913716251671540959|EXCHANGE_RATE', 'C01100010|LIST_PRICE01', '250326561|STRIKE_PRICE', 'C01100047|LIST_PRICE', 'C01100047|LIST_PRICE-1', 'C01100047|LIST_PRICE-01', 'OIL_CHEM|guonei|6097|PRICE', '91370500674526498A|C01100008|STRIKE_PRICE', '91370783724809024G|BEN|PRICE', '91370500737223620X|BEN|PRICE', '91370503706169019D|BEN|PRICE', '91370503164840647R|BEN|PRICE', 'C01100047|TURNOVER', '913705221649223519|C01100047|EXW', 'C01100047|CAPACITY']\n",
 | ||
|       "获取到的数据项ID['C01100047|STRIKE_PRICE', 'Brentspj', '913716251671540959|EXCHANGE_RATE', 'C01100010|LIST_PRICE01', '250326561|STRIKE_PRICE', 'C01100047|LIST_PRICE', 'C01100047|LIST_PRICE-1', 'C01100047|LIST_PRICE-01', 'OIL_CHEM|guonei|6097|PRICE', '91370500674526498A|C01100008|STRIKE_PRICE', '91370783724809024G|BEN|PRICE', '91370500737223620X|BEN|PRICE', '91370503706169019D|BEN|PRICE', '91370503164840647R|BEN|PRICE', 'C01100047|TURNOVER', '913705221649223519|C01100047|EXW', 'C01100047|CAPACITY']\n"
 | ||
|      ]
 | ||
|     },
 | ||
|     {
 | ||
|      "name": "stderr",
 | ||
|      "output_type": "stream",
 | ||
|      "text": [
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:753: DeprecationWarning:\n",
 | ||
|       "\n",
 | ||
|       "The truth value of an empty array is ambiguous. Returning False, but in future this will result in an error. Use `array.size > 0` to check that an array is not empty.\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:302: UserWarning:\n",
 | ||
|       "\n",
 | ||
|       "The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:307: FutureWarning:\n",
 | ||
|       "\n",
 | ||
|       "Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:308: FutureWarning:\n",
 | ||
|       "\n",
 | ||
|       "Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n",
 | ||
|       "\n",
 | ||
|       "c:\\Users\\EDY\\.conda\\envs\\predict\\lib\\site-packages\\sklearn\\linear_model\\_coordinate_descent.py:695: ConvergenceWarning:\n",
 | ||
|       "\n",
 | ||
|       "Objective did not converge. You might want to increase the number of iterations, check the scale of the features or consider increasing regularisation. Duality gap: 7.936e+05, tolerance: 5.806e+04\n",
 | ||
|       "\n"
 | ||
|      ]
 | ||
|     },
 | ||
|     {
 | ||
|      "name": "stdout",
 | ||
|      "output_type": "stream",
 | ||
|      "text": [
 | ||
|       "当月数据更新完成\n",
 | ||
|       "Using matplotlib backend: inline\n",
 | ||
|       "%pylab is deprecated, use %matplotlib inline and import the required libraries.\n",
 | ||
|       "Populating the interactive namespace from numpy and matplotlib\n",
 | ||
|       "Fitting 3 folds for each of 180 candidates, totalling 540 fits\n"
 | ||
|      ]
 | ||
|     },
 | ||
|     {
 | ||
|      "name": "stderr",
 | ||
|      "output_type": "stream",
 | ||
|      "text": [
 | ||
|       "c:\\Users\\EDY\\.conda\\envs\\predict\\lib\\site-packages\\IPython\\core\\magics\\pylab.py:166: UserWarning:\n",
 | ||
|       "\n",
 | ||
|       "pylab import has clobbered these variables: ['datetime', '__version__', 'random', 'plot']\n",
 | ||
|       "`%matplotlib` prevents importing * from pylab and numpy\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:255: UserWarning:\n",
 | ||
|       "\n",
 | ||
|       "The argument 'infer_datetime_format' is deprecated and will be removed in a future version. A strict version of it is now the default, see https://pandas.pydata.org/pdeps/0004-consistent-to-datetime-parsing.html. You can safely remove this argument.\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:259: FutureWarning:\n",
 | ||
|       "\n",
 | ||
|       "Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:260: FutureWarning:\n",
 | ||
|       "\n",
 | ||
|       "Downcasting object dtype arrays on .fillna, .ffill, .bfill is deprecated and will change in a future version. Call result.infer_objects(copy=False) instead. To opt-in to the future behavior, set `pd.set_option('future.no_silent_downcasting', True)`\n",
 | ||
|       "\n",
 | ||
|       "C:\\Users\\EDY\\AppData\\Local\\Temp\\ipykernel_20756\\2211479266.py:285: FutureWarning:\n",
 | ||
|       "\n",
 | ||
|       "Series.__getitem__ treating keys as positions is deprecated. In a future version, integer keys will always be treated as labels (consistent with DataFrame behavior). To access a value by position, use `ser.iloc[pos]`\n",
 | ||
|       "\n"
 | ||
|      ]
 | ||
|     },
 | ||
|     {
 | ||
|      "name": "stdout",
 | ||
|      "output_type": "stream",
 | ||
|      "text": [
 | ||
|       "Date\n",
 | ||
|       "2025-06-04    5826.140137\n",
 | ||
|       "Name: 日度预测价格, dtype: float32\n",
 | ||
|       "{'funcModule': '数据表信息列表', 'funcOperation': '新增', 'data': [{'dataItemNo': 'C01100047|FORECAST_PRICE', 'dataDate': '20250601', 'dataStatus': 'add', 'dataValue': np.float64(5826.14)}]}\n",
 | ||
|       "{\"confirmFlg\":false,\"status\":true}\n"
 | ||
|      ]
 | ||
|     }
 | ||
|    ],
 | ||
|    "source": [
 | ||
|     "# # # 自定义日期执行预测\n",
 | ||
|     "\n",
 | ||
|     "# start_date = datetime(2025, 6, 1)\n",
 | ||
|     "# end_date = datetime(2025, 6, 2)\n",
 | ||
|     "\n",
 | ||
|     "# token = get_head_auth()\n",
 | ||
|     "# token_push = get_head_push_auth()\n",
 | ||
|     "# while start_date < end_date:\n",
 | ||
|     "#     print(start_date.strftime('%Y%m%d'))\n",
 | ||
|     "#     start(start_date,token,token_push)\n",
 | ||
|     "#     time.sleep(2)\n",
 | ||
|     "#     # start_1(start_date)\n",
 | ||
|     "#     start_date += timedelta(days=1)"
 | ||
|    ]
 | ||
|   },
 | ||
|   {
 | ||
|    "cell_type": "code",
 | ||
|    "execution_count": null,
 | ||
|    "metadata": {},
 | ||
|    "outputs": [],
 | ||
|    "source": []
 | ||
|   }
 | ||
|  ],
 | ||
|  "metadata": {
 | ||
|   "kernelspec": {
 | ||
|    "display_name": "predict",
 | ||
|    "language": "python",
 | ||
|    "name": "python3"
 | ||
|   },
 | ||
|   "language_info": {
 | ||
|    "codemirror_mode": {
 | ||
|     "name": "ipython",
 | ||
|     "version": 3
 | ||
|    },
 | ||
|    "file_extension": ".py",
 | ||
|    "mimetype": "text/x-python",
 | ||
|    "name": "python",
 | ||
|    "nbconvert_exporter": "python",
 | ||
|    "pygments_lexer": "ipython3",
 | ||
|    "version": "3.10.16"
 | ||
|   }
 | ||
|  },
 | ||
|  "nbformat": 4,
 | ||
|  "nbformat_minor": 2
 | ||
| }
 |