960 lines
61 KiB
Plaintext
960 lines
61 KiB
Plaintext
{
|
|
"cells": [
|
|
{
|
|
"cell_type": "markdown",
|
|
"id": "4d2a8b6c",
|
|
"metadata": {},
|
|
"source": [
|
|
"#### Database"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 1,
|
|
"id": "7be9eeff",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": [
|
"import os\n",
"import sys\n",
"\n",
"import numpy as np\n",
"import pandas as pd\n",
"\n",
"# Location of the Django project. Set LEAGUES_PROJECT_PATH to run the notebook on another\n",
"# machine without editing this cell; the default is the original hard-coded checkout.\n",
"PROJECT_PATH = os.environ.get('LEAGUES_PROJECT_PATH', '/home/md/Work/ligalytics/leagues_stable/')\n",
"sys.path.insert(0, PROJECT_PATH)\n",
"os.environ.setdefault(\"DJANGO_SETTINGS_MODULE\", \"leagues.settings\")\n",
"\n",
"# Point the default database at the project's SQLite file before Django is set up.\n",
"# os.path.join copes with PROJECT_PATH ending in a slash (plain concatenation doubled it).\n",
"from leagues import settings\n",
"settings.DATABASES['default']['NAME'] = os.path.join(PROJECT_PATH, 'db.sqlite3')\n",
"\n",
"import django\n",
"django.setup()\n",
"\n",
"# Project imports that need the configured Django environment.\n",
"from django.db.models import F\n",
"from scheduler.models import Game, Season\n",
"from common.functions import distanceInKmByGPS\n",
"\n",
"SEASON_NAME = \"Imported: Benchmark Season\"\n",
"season = Season.objects.filter(nicename=SEASON_NAME).first()\n",
"if season is None:\n",
"    # .first() returns None when nothing matches; filtering games by season=None would then\n",
"    # select games without a season instead of failing.\n",
"    raise LookupError(f\"Season {SEASON_NAME!r} not found\")\n",
"\n",
"# Games of the season that carry a historic season, with the team attributes needed for\n",
"# feature engineering flattened into plain columns.\n",
"games = Game.objects.filter(season=season).exclude(historic_season=None).annotate(\n",
"    home=F('homeTeam__shortname'),\n",
"    away=F('awayTeam__shortname'),\n",
"    home_lat=F('homeTeam__latitude'),\n",
"    home_lon=F('homeTeam__longitude'),\n",
"    home_attr=F('homeTeam__attractivity'),\n",
"    away_lat=F('awayTeam__latitude'),\n",
"    away_lon=F('awayTeam__longitude'),\n",
"    away_attr=F('awayTeam__attractivity'),\n",
"    home_country=F('homeTeam__country'),\n",
"    away_country=F('awayTeam__country'),\n",
").values()"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "markdown",
|
|
"id": "bc191792",
|
|
"metadata": {},
|
|
"source": [
|
|
"#### Dataframe"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 2,
|
|
"id": "1e404cf8",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": [
|
"from sklearn.preprocessing import OneHotEncoder\n",
"\n",
"# Build the working frame from the annotated games queryset.\n",
"df = pd.DataFrame.from_records(games.values())\n",
"\n",
"# Data cleaning: replace empty time strings with '0' and drop rows whose attendance is 0.\n",
"df['time'] = df['time'].replace('', '0')\n",
"df = df[df['attendance'] != 0]\n",
"\n",
"# Remove outliers: keep only rows strictly between the 1% and 99% quantiles of each field.\n",
"out_fields = ['attendance']\n",
"for field in out_fields:\n",
"    q_low = df[field].quantile(0.01)\n",
"    q_hi = df[field].quantile(0.99)\n",
"    df = df[(df[field] < q_hi) & (df[field] > q_low)]\n",
"\n",
"# Continue on an independent copy so the column assignments below do not write into a\n",
"# filtered selection of the original frame (avoids pandas' SettingWithCopyWarning).\n",
"df = df.copy()\n",
"\n",
"# Per-home-team mean and maximum attendance.\n",
"# NOTE(review): both are computed from the label over all rows, including rows that a later\n",
"# cell puts into the test split, so 'home_base' and 'stadium_size' leak target information.\n",
"pivot_homeTeam_mean = df.pivot_table('attendance', 'homeTeam_id', aggfunc='mean')\n",
"pivot_homeTeam_max = df.pivot_table('attendance', 'homeTeam_id', aggfunc='max')\n",
"\n",
"# Calendar features taken from the game date.\n",
"df['weekday'] = df.apply(lambda r: r['date'].weekday(), axis=1)\n",
"df['day'] = df.apply(lambda r: r['date'].day, axis=1)\n",
"df['month'] = df.apply(lambda r: r['date'].month, axis=1)\n",
"df['year'] = df.apply(lambda r: r['date'].year, axis=1)\n",
"\n",
"# Distance between the two teams' coordinates.\n",
"df['distance'] = df.apply(lambda r: distanceInKmByGPS(r['home_lon'],r['home_lat'],r['away_lon'],r['away_lat']), axis=1)\n",
"\n",
"# weekday() numbers Monday as 0 and Sunday as 6, so Saturday/Sunday are 5 and 6\n",
"# (6 and 7 would be the isoweekday() numbering and would only ever match Sunday here).\n",
"df['weekend'] = df['weekday'].isin([5, 6]).astype(int)\n",
"df['winter_season'] = df.apply(lambda r: int(r['month'] in [1,2,3,10,11,12]), axis=1)\n",
"\n",
"# Home-team aggregates looked up from the pivots above; the maximum observed attendance\n",
"# serves as the 'stadium_size' value.\n",
"df['home_base'] = df.apply(lambda r: pivot_homeTeam_mean.loc[r['homeTeam_id'],'attendance'], axis=1)\n",
"df['stadium_size'] = df.apply(lambda r: pivot_homeTeam_max.loc[r['homeTeam_id'],'attendance'], axis=1)\n",
"\n",
"# String comparisons: time with the colon removed against \"1800\", and the first part of\n",
"# historic_season (before the '-') against \"2010\".\n",
"df['early'] = df.apply(lambda r: r['time'].replace(':','') < \"1800\", axis=1)\n",
"df['before2010'] = df.apply(lambda r: r['historic_season'].split('-')[0] < \"2010\", axis=1)\n",
"\n",
"# One-hot encoding: one 0/1 column per category value, named after the value itself.\n",
"ohe_fields = ['home_country']\n",
"\n",
"for field in ohe_fields:\n",
"    ohe = OneHotEncoder()\n",
"    transformed = ohe.fit_transform(df[[field]])\n",
"    df[ohe.categories_[0]] = transformed.toarray()\n",
"\n",
"# Move the label to the last column so that df.columns[:-1] lists the candidate features.\n",
"cols = list(df.columns)\n",
"cols.append(cols.pop(cols.index('attendance')))\n",
"df = df[cols]"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "markdown",
|
|
"id": "e2ea08e5",
|
|
"metadata": {},
|
|
"source": [
|
"#### Train/Test Data - Feature Selection and Split"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 3,
|
|
"id": "74e12f87",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": [
|
"import numpy as np\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns\n",
"from sklearn.model_selection import train_test_split, cross_val_predict\n",
"from sklearn import metrics\n",
"from sklearn.ensemble import GradientBoostingRegressor\n",
"\n",
"# Columns excluded from the feature set.\n",
"remove_columns = ['season_id', 'resultEntered', 'reversible', 'reschedule', 'homeGoals', 'awayGoals',\n",
"                  'homeGoals2', 'awayGoals2', 'homeGoals3', 'awayGoals3', 'home', 'away', 'date', 'time',\n",
"                  'id', 'historic_season',\n",
"                  'home_country','home_lat','home_lon','away_lat','away_lon','away_country','year']\n",
"label = 'attendance'\n",
"\n",
"# Every column except the last one (the label) that is not explicitly excluded.\n",
"# The frame's own column order is kept: building the list from a set difference made the\n",
"# feature order depend on string hashing, i.e. it could change between kernel restarts.\n",
"excluded = set(remove_columns)\n",
"feature_cols = [col for col in df.columns[:-1] if col not in excluded]\n",
"# feature_cols = ['weekday','weekend','home_base','distance','winter_season']\n",
"\n",
"data = df[feature_cols+[label]]\n",
"\n",
"X = df[feature_cols]  # Features\n",
"y = df[label]  # Target variable\n",
"\n",
"X_train, X_test, y_train, y_test = train_test_split(\n",
"    X, y, test_size=0.3, random_state=1)  # 70% training and 30% test"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 4,
|
|
"id": "45e08026",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
"Random Forest Regression Accuracy: 0.6976274695189291\n"
|
|
]
|
|
}
|
|
],
|
|
"source": [
|
"# Gradient-boosted regression trees. The names keep their 'rf' prefix/suffix because other\n",
"# cells refer to rf_regressor and y_pred_rf, but the model is not a random forest.\n",
"rf_regressor = GradientBoostingRegressor(n_estimators=200, random_state=42)\n",
"rf_regressor.fit(X_train, y_train)\n",
"\n",
"# Predicted attendance for the held-out test set (one value per row of X_test).\n",
"y_pred_rf = rf_regressor.predict(X_test)\n",
"\n",
"# score() of a regressor is the coefficient of determination (R^2), not an accuracy.\n",
"print('Gradient Boosting R^2 (test set): ', rf_regressor.score(X_test, y_test))\n",
"\n",
"# Optional alternative: out-of-fold predictions for the full data set via 10-fold cross\n",
"# validation. Uses its own variable so y_pred_rf keeps matching the test split.\n",
"# y_pred_cv = cross_val_predict(rf_regressor, X, y, cv=10)\n",
"# r2_cv = metrics.r2_score(y, y_pred_cv)\n",
"# print('Cross-validated (KFold) Gradient Boosting R^2: ', r2_cv)"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 5,
|
|
"id": "0de49b8a",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"data": {
|
|
"image/png": "",
|
|
"text/plain": [
|
|
"<Figure size 1080x720 with 1 Axes>"
|
|
]
|
|
},
|
|
"metadata": {
|
|
"needs_background": "light"
|
|
},
|
|
"output_type": "display_data"
|
|
}
|
|
],
|
|
"source": [
|
"# Horizontal bar chart of the fitted model's feature importances, largest first.\n",
"importances = rf_regressor.feature_importances_\n",
"ranking = np.argsort(-importances)\n",
"ranked_names = X_train.columns.values[ranking]\n",
"\n",
"f, ax = plt.subplots(figsize=(15, 10))\n",
"sns.barplot(x=importances[ranking], y=ranked_names, orient='h', ax=ax)\n",
"ax.set_xlabel(\"feature importance\")\n",
"plt.tight_layout()\n",
"plt.show()"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 6,
|
|
"id": "4c1f8b45",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"name": "stdout",
|
|
"output_type": "stream",
|
|
"text": [
|
|
"0 4000 6269.331273160804\n",
|
|
"1 3264 2212.472559220525\n",
|
|
"2 6000 4474.321544046366\n",
|
|
"3 4250 5853.876279843164\n",
|
|
"4 1200 2724.8479999971523\n",
|
|
"5 4300 12248.194405029995\n",
|
|
"6 3874 12179.504105471333\n",
|
|
"7 2800 7179.957816540268\n",
|
|
"8 5500 4343.454242132351\n",
|
|
"9 6000 15615.670772432313\n",
|
|
"10 3500 2142.013025198476\n",
|
|
"11 4500 6581.086576491373\n",
|
|
"12 2140 2787.000793225451\n",
|
|
"13 3146 7948.163004948026\n",
|
|
"14 2600 5277.360995538767\n",
|
|
"15 4875 4182.090794311384\n",
|
|
"16 5807 1298.0546590068432\n",
|
|
"17 5200 7641.152367897079\n",
|
|
"18 3500 12709.91385314257\n",
|
|
"19 2643 13796.44798966877\n",
|
|
"20 4000 2910.0979973906897\n",
|
|
"21 2500 11367.203439146624\n",
|
|
"22 2000 4578.676165761646\n",
|
|
"23 3198 11801.197736843704\n",
|
|
"24 3571 3256.2683962230926\n",
|
|
"25 2712 13963.658569196019\n",
|
|
"26 2100 3428.2076365623343\n",
|
|
"27 4525 3179.082309242862\n",
|
|
"28 6625 5319.700728374097\n",
|
|
"29 4966 4814.201898718184\n",
|
|
"30 2000 11668.774282716573\n",
|
|
"31 2100 16459.759735440115\n",
|
|
"32 2310 10424.049272604385\n",
|
|
"33 2600 3249.7584854521983\n",
|
|
"34 2000 4933.417332760704\n",
|
|
"35 4300 11330.47572253357\n",
|
|
"36 2734 4916.62667788047\n",
|
|
"37 3500 7616.108008546191\n",
|
|
"38 3050 5834.707115002423\n",
|
|
"39 5256 10956.873320747929\n",
|
|
"40 3012 1746.8793669215172\n",
|
|
"41 5060 4642.521259437015\n",
|
|
"42 1500 10636.260356819768\n",
|
|
"43 4000 6226.573175422698\n",
|
|
"44 1950 6253.5032474003465\n",
|
|
"45 2300 5174.122252417559\n",
|
|
"46 2300 2724.3318310328705\n",
|
|
"47 1950 9804.743199526134\n",
|
|
"48 3058 3874.7670154643415\n",
|
|
"49 2000 10001.45516441721\n",
|
|
"50 2345 5023.8562523965875\n",
|
|
"51 5500 5174.122252417559\n",
|
|
"52 5585 3817.7336514404283\n",
|
|
"53 4046 4720.395073786049\n",
|
|
"54 6000 4569.1440149122045\n",
|
|
"55 4384 4918.984377964906\n",
|
|
"56 3000 4674.700091188421\n",
|
|
"57 3500 3544.0179791758733\n",
|
|
"58 7000 18261.80159810542\n",
|
|
"59 10195 13504.402960006135\n",
|
|
"60 3476 2439.2710475675904\n",
|
|
"61 2120 6683.8055866507775\n",
|
|
"62 3800 4831.40407430577\n",
|
|
"63 2675 18297.8862272201\n",
|
|
"64 6603 5900.839366216985\n",
|
|
"65 1500 5547.896256687706\n",
|
|
"66 4000 15716.448413829125\n",
|
|
"67 4545 3510.458423897759\n",
|
|
"68 1396 4299.864451241506\n",
|
|
"69 5400 11340.993418688882\n",
|
|
"70 5041 13344.492446272585\n",
|
|
"71 1500 12842.717635745401\n",
|
|
"72 1800 2826.6198584357285\n",
|
|
"73 3189 2216.6069457661515\n",
|
|
"74 3800 7551.124847543301\n",
|
|
"75 2178 10854.693947136366\n",
|
|
"76 6169 3754.054098366518\n",
|
|
"77 2676 6227.444878272318\n",
|
|
"78 3510 4372.710484500164\n",
|
|
"79 3900 5899.365613773657\n",
|
|
"80 2120 9146.338397438585\n",
|
|
"81 8000 6598.214034291334\n",
|
|
"82 2500 4180.2412129479535\n",
|
|
"83 4016 1013.1917302016966\n",
|
|
"84 1500 13356.059667395755\n",
|
|
"85 2860 3859.7092616602254\n",
|
|
"86 2150 12546.493369090958\n",
|
|
"87 3336 13781.48736284787\n",
|
|
"88 8820 6867.843525597063\n",
|
|
"89 4792 9977.417685682762\n",
|
|
"90 1650 23425.898130663616\n",
|
|
"91 2000 6589.051500702451\n",
|
|
"92 2111 3109.4945264556886\n",
|
|
"93 4470 13408.035401832343\n",
|
|
"94 7000 5519.4148042321\n",
|
|
"95 3850 6089.400396461468\n",
|
|
"96 4366 9610.498715489919\n",
|
|
"97 2645 8316.017866765993\n",
|
|
"98 2384 6197.035790504067\n",
|
|
"99 4522 12779.77200503699\n",
|
|
"100 6328 14744.016207170152\n",
|
|
"101 3877 19458.90971123009\n",
|
|
"102 2000 4874.224861034961\n",
|
|
"103 4157 5208.703053494322\n",
|
|
"104 2942 13386.059288545708\n",
|
|
"105 3655 13257.062956113012\n",
|
|
"106 4500 2441.3256508749882\n",
|
|
"107 2964 2416.608601291409\n",
|
|
"108 2863 2553.749826440011\n",
|
|
"109 4935 11198.828086622805\n",
|
|
"110 2526 12041.524132520446\n",
|
|
"111 5679 8045.757009722594\n",
|
|
"112 7286 13009.125855582837\n",
|
|
"113 6055 12448.19779590953\n",
|
|
"114 1200 11188.064346395086\n",
|
|
"115 4110 4271.21931546039\n",
|
|
"116 1957 3087.6529257626803\n",
|
|
"117 1790 2569.376378289409\n",
|
|
"118 5422 6173.099807850697\n",
|
|
"119 4650 12505.12258551472\n",
|
|
"120 5297 12652.949405216323\n",
|
|
"121 3036 6268.840108714523\n",
|
|
"122 3233 9367.596675826102\n",
|
|
"123 12000 2337.3771641354024\n",
|
|
"124 7632 1819.0748787672667\n",
|
|
"125 3620 7428.132912505317\n",
|
|
"126 2000 2124.849872483271\n",
|
|
"127 2145 6073.702450147759\n",
|
|
"128 2227 15691.707999141212\n",
|
|
"129 2520 17731.752052395845\n",
|
|
"130 10000 9224.693549735079\n",
|
|
"131 2000 4333.254162853479\n",
|
|
"132 4052 5463.585852647499\n",
|
|
"133 2137 3385.7917346498257\n",
|
|
"134 2609 8949.299267841006\n",
|
|
"135 3256 5594.136151838447\n",
|
|
"136 8173 7321.006115614261\n",
|
|
"137 1250 6314.334305949203\n",
|
|
"138 7401 1841.6632769675457\n",
|
|
"139 4200 5913.92021057092\n",
|
|
"140 6100 5914.498891029855\n",
|
|
"141 5182 4485.159036791194\n",
|
|
"142 1300 3930.555183694012\n",
|
|
"143 2117 2087.6087105330876\n",
|
|
"144 6500 3129.218824655229\n",
|
|
"145 5174 19100.66955411291\n",
|
|
"146 3867 7381.962946265084\n",
|
|
"147 1918 3668.522599331723\n",
|
|
"148 2800 5984.122720695453\n",
|
|
"149 7648 5579.807332727605\n",
|
|
"150 5638 5000.766880937242\n",
|
|
"151 5262 8796.640913054198\n",
|
|
"152 1650 11038.130604200423\n",
|
|
"153 1657 3053.4760351098107\n",
|
|
"154 4086 16594.785800693066\n",
|
|
"155 9000 3561.181162895718\n",
|
|
"156 1500 5042.543289014211\n",
|
|
"157 8145 12723.53945595642\n",
|
|
"158 2625 7117.118765444254\n",
|
|
"159 6281 3092.870875123699\n",
|
|
"160 4520 1916.9886938042089\n",
|
|
"161 1200 3334.4719289950585\n",
|
|
"162 4829 4248.693921085489\n",
|
|
"163 1760 3065.4160555916155\n",
|
|
"164 3469 10943.4771813175\n",
|
|
"165 7500 4646.274655834034\n",
|
|
"166 5227 7247.410995462059\n",
|
|
"167 1765 12061.617431570865\n",
|
|
"168 5200 3906.7362684340383\n",
|
|
"169 6402 5802.18818098374\n",
|
|
"170 4832 3735.241252929307\n",
|
|
"171 1500 8821.101907961975\n",
|
|
"172 2342 3612.477133461679\n",
|
|
"173 2799 908.2647209562191\n",
|
|
"174 3850 3078.4680731926246\n",
|
|
"175 4200 3812.544744635514\n",
|
|
"176 4531 2705.9998772537424\n",
|
|
"177 1751 1967.6894728073173\n",
|
|
"178 4250 5924.714538352343\n",
|
|
"179 5705 6513.58136727248\n",
|
|
"180 3528 1966.268176067289\n",
|
|
"181 2496 4368.04545595507\n",
|
|
"182 4370 2024.6278361643576\n",
|
|
"183 1350 5634.107750848085\n",
|
|
"184 5334 10956.873320747929\n",
|
|
"185 1423 6752.977449121771\n",
|
|
"186 4129 4490.334901030411\n",
|
|
"187 5858 2706.770656503444\n",
|
|
"188 3300 4860.877678091679\n",
|
|
"189 3500 3893.6704796446884\n",
|
|
"190 10280 3778.999270841025\n",
|
|
"191 4500 7722.956089373864\n",
|
|
"192 10500 3823.8621517621054\n",
|
|
"193 3932 5270.396448543778\n",
|
|
"194 5500 7707.251425986663\n",
|
|
"195 2200 14389.91484985415\n",
|
|
"196 8206 6044.3459440998595\n",
|
|
"197 8000 4457.480201516091\n",
|
|
"198 6372 8890.061129175148\n",
|
|
"199 7900 13621.063242184871\n",
|
|
"200 1628 13169.821966149577\n",
|
|
"201 4142 3606.329399178841\n",
|
|
"202 1150 6794.3761007737885\n",
|
|
"203 1750 3527.0690712828796\n",
|
|
"204 4072 4870.13044656876\n",
|
|
"205 1176 14005.1555660555\n",
|
|
"206 3200 5021.013261618377\n",
|
|
"207 1715 10318.676591702464\n",
|
|
"208 7530 10459.245297486614\n",
|
|
"209 4600 8316.395535933456\n",
|
|
"210 1200 5095.800766098369\n",
|
|
"211 4452 17619.45148176299\n",
|
|
"212 2400 2917.6212527362745\n",
|
|
"213 4057 3523.9765596992324\n",
|
|
"214 5000 7568.184421468349\n",
|
|
"215 4147 2328.238657453435\n",
|
|
"216 3046 9816.145570783112\n",
|
|
"217 6215 2815.1845153039812\n",
|
|
"218 3350 2458.220350724582\n",
|
|
"219 3500 1143.4289915252082\n",
|
|
"220 5870 3349.522734018162\n",
|
|
"221 4113 6562.149215912538\n",
|
|
"222 3420 15899.046839388688\n",
|
|
"223 6116 9045.668754767581\n",
|
|
"224 5902 2748.9553238280632\n",
|
|
"225 3787 4271.853869225162\n",
|
|
"226 3600 7439.183383616434\n",
|
|
"227 7017 2210.108006140514\n",
|
|
"228 10280 4927.066871405887\n",
|
|
"229 5600 9564.813393139277\n",
|
|
"230 3656 3329.8106332184043\n",
|
|
"231 6480 17110.713931585673\n",
|
|
"232 1646 4677.074303376587\n",
|
|
"233 2600 4440.882887387751\n",
|
|
"234 4300 2118.7542046100843\n",
|
|
"235 7948 3214.332854949672\n",
|
|
"236 4579 7753.321604795282\n",
|
|
"237 4364 6460.580153817578\n",
|
|
"238 5000 3400.25051693908\n",
|
|
"239 2034 4284.09527513928\n",
|
|
"240 3500 5231.567751256019\n",
|
|
"241 5688 6856.195658240203\n",
|
|
"242 1800 12184.56551356091\n",
|
|
"243 10131 2598.8215825730167\n",
|
|
"244 5784 5943.724350980219\n",
|
|
"245 1813 4361.9722090698815\n",
|
|
"246 3700 5182.000108363626\n",
|
|
"247 6700 5850.0908748940765\n",
|
|
"248 3700 2399.8908348974273\n",
|
|
"249 7799 1934.7516235634123\n",
|
|
"250 1884 11765.60702403286\n",
|
|
"251 3042 4656.923175922518\n",
|
|
"252 5000 13415.8010505132\n",
|
|
"253 5112 13024.815014128593\n",
|
|
"254 1404 3154.9780459262442\n",
|
|
"255 2471 4309.257915103401\n",
|
|
"256 7749 10739.861964061618\n",
|
|
"257 6254 3516.7357048629206\n",
|
|
"258 2502 11979.741281816012\n",
|
|
"259 2300 3650.093842398789\n",
|
|
"260 6500 11606.67581375423\n",
|
|
"261 2646 2003.5526871642137\n",
|
|
"262 9546 3357.754620510872\n",
|
|
"263 7500 1954.3537407404217\n",
|
|
"264 11016 5754.557478633303\n",
|
|
"265 5763 9554.299673198937\n",
|
|
"266 2460 9835.688834354334\n",
|
|
"267 5511 3086.8504515496356\n",
|
|
"268 1857 12616.742317378286\n",
|
|
"269 7000 3003.607544650991\n",
|
|
"270 6333 2916.8409179975624\n",
|
|
"271 6107 4089.944537354285\n",
|
|
"272 1518 2032.35131917741\n",
|
|
"273 9310 13077.88651001709\n",
|
|
"274 3551 5538.163168934835\n",
|
|
"275 1700 5176.458388224016\n",
|
|
"276 2250 6964.458867728808\n",
|
|
"277 6000 3658.89357449004\n",
|
|
"278 2003 12082.974153438317\n",
|
|
"279 15183 3440.5699078224566\n",
|
|
"280 7113 3704.6762193220106\n",
|
|
"281 3818 7853.080965569755\n",
|
|
"282 12300 4595.931196930642\n",
|
|
"283 12488 4204.879371769705\n",
|
|
"284 8000 14443.56582836753\n",
|
|
"285 10832 6863.813679372925\n",
|
|
"286 2107 6377.807460294606\n",
|
|
"287 2100 11228.724002036284\n",
|
|
"288 14135 4931.900522781224\n",
|
|
"289 6115 -1359.8525015661405\n",
|
|
"290 9364 7649.975494379696\n",
|
|
"291 4773 9481.483722041376\n",
|
|
"292 3525 3903.097436115244\n",
|
|
"293 6126 3235.0879045787524\n",
|
|
"294 6487 6016.561185150087\n",
|
|
"295 3879 5963.8817259278985\n",
|
|
"296 4943 2022.7875651402155\n",
|
|
"297 1335 16308.04344887568\n",
|
|
"298 4125 3686.2401457869464\n",
|
|
"299 7986 19570.539544136012\n",
|
|
"300 5000 1647.3199417777416\n",
|
|
"301 3559 10844.540513558119\n",
|
|
"302 6573 6749.5080657275785\n",
|
|
"303 2300 7761.8563105694675\n",
|
|
"304 5117 6850.569455542703\n",
|
|
"305 5000 6749.5080657275785\n",
|
|
"306 7165 7562.513169172154\n",
|
|
"307 1406 4792.945224334402\n",
|
|
"308 12300 5438.795622303128\n",
|
|
"309 3573 4076.6328454195104\n",
|
|
"310 6500 6484.405267932639\n",
|
|
"311 4508 4454.794170262632\n",
|
|
"312 7546 3612.3231311814357\n",
|
|
"313 5413 6996.1341583386675\n",
|
|
"314 5754 3103.9097707577357\n",
|
|
"315 1307 3807.778748518246\n",
|
|
"316 5433 3244.8492954237204\n",
|
|
"317 2304 3555.7092877099694\n",
|
|
"318 4000 15777.67435290044\n",
|
|
"319 6425 7309.990757727653\n",
|
|
"320 7250 11630.888375951426\n",
|
|
"321 5500 8636.615133701885\n",
|
|
"322 1800 8768.014881915431\n",
|
|
"323 2240 4826.610795633974\n",
|
|
"324 9000 10890.956739194247\n",
|
|
"325 1266 5814.283121498163\n",
|
|
"326 3850 6443.817549805847\n",
|
|
"327 2122 4535.813236908496\n",
|
|
"328 6423 4517.133895929519\n",
|
|
"329 6455 12060.20986179786\n",
|
|
"330 2100 9687.757282298406\n",
|
|
"331 7843 5535.984701360246\n",
|
|
"332 9617 3697.898412456338\n",
|
|
"333 5033 13417.324343888626\n",
|
|
"334 1129 1900.0831637980234\n",
|
|
"335 1500 9359.137469515703\n",
|
|
"336 8932 4625.923230167911\n",
|
|
"337 4637 6298.491882691631\n",
|
|
"338 15327 8789.796058286662\n",
|
|
"339 1233 3349.3518456663473\n",
|
|
"340 2364 5489.380456222845\n",
|
|
"341 10316 10482.794651236341\n",
|
|
"342 13200 816.4886171815257\n",
|
|
"343 1303 2434.5700084840264\n",
|
|
"344 8687 1339.7548137515469\n",
|
|
"345 1653 14174.38517292645\n",
|
|
"346 7067 4769.726084812967\n",
|
|
"347 8265 6296.217972893376\n",
|
|
"348 1587 3735.0734883030373\n",
|
|
"349 2479 9172.144059825323\n",
|
|
"350 6366 2943.565074257849\n",
|
|
"351 5114 4607.856876244279\n",
|
|
"352 6138 6525.133501060625\n",
|
|
"353 1765 5306.257077971849\n",
|
|
"354 3129 1846.9373281342548\n",
|
|
"355 2295 3398.94891754905\n",
|
|
"356 5507 6787.25326071226\n",
|
|
"357 5200 11426.371872238831\n",
|
|
"358 6326 13253.411199790291\n",
|
|
"359 10804 12321.66926933166\n",
|
|
"360 6721 7784.752069975153\n",
|
|
"361 5574 3078.4680731926246\n",
|
|
"362 10020 5279.60487971954\n",
|
|
"363 3678 3703.664495952156\n",
|
|
"364 4342 6008.626463397685\n",
|
|
"365 8000 12218.65449210225\n",
|
|
"366 1687 4676.4051865459105\n",
|
|
"367 1967 6462.389387331538\n",
|
|
"368 27252 4596.524835292175\n",
|
|
"369 20520 10707.201673752295\n",
|
|
"370 10000 16951.68427825804\n",
|
|
"371 1661 5088.693439115733\n",
|
|
"372 1356 4243.341369783109\n",
|
|
"373 8000 13092.177864088904\n",
|
|
"374 6288 7390.894960432231\n",
|
|
"375 9979 13110.150275789669\n",
|
|
"376 3083 9102.1199952011\n",
|
|
"377 1574 12359.06343032517\n",
|
|
"378 10452 3163.5893828816875\n",
|
|
"379 4790 4611.20167092646\n",
|
|
"380 5563 4506.779900903538\n",
|
|
"381 1103 5630.433669946042\n",
|
|
"382 3846 14705.914690376329\n",
|
|
"383 3750 1678.928854632361\n",
|
|
"384 4309 4188.9078922720755\n",
|
|
"385 6254 2185.786798925416\n",
|
|
"386 2133 5240.602438128821\n",
|
|
"387 12800 6440.899480264031\n",
|
|
"388 5300 2202.973850976274\n",
|
|
"389 10102 3349.487579181281\n",
|
|
"390 9326 6276.255533517775\n",
|
|
"391 2613 10027.074674303978\n",
|
|
"392 11976 3863.6273789168304\n",
|
|
"393 12143 3393.520429895661\n",
|
|
"394 13200 3769.0173149934762\n",
|
|
"395 6320 4363.984786293422\n",
|
|
"396 1542 12775.267839770944\n",
|
|
"397 4560 4771.697760449484\n",
|
|
"398 8304 4637.7607774767075\n",
|
|
"399 10480 4525.181055134041\n",
|
|
"400 5352 6595.799090340065\n",
|
|
"401 2137 6969.014509412282\n",
|
|
"402 5169 4750.975859023578\n",
|
|
"403 2799 11080.256944317674\n",
|
|
"404 6000 2003.8289254279437\n",
|
|
"405 4986 4197.359917287667\n",
|
|
"406 1824 4332.950723087893\n",
|
|
"407 1562 5099.093054122171\n",
|
|
"408 5890 12081.878696518148\n",
|
|
"409 6077 9270.461413927558\n",
|
|
"410 1485 1496.4321088051206\n",
|
|
"411 1825 4246.200510854761\n",
|
|
"412 5340 3255.3624000842133\n",
|
|
"413 9237 1859.449426524448\n",
|
|
"414 6499 7976.974080873097\n",
|
|
"415 1240 4436.075476859059\n",
|
|
"416 4656 3617.4469653780425\n",
|
|
"417 2335 4997.427948460792\n",
|
|
"418 8000 8685.398728410411\n",
|
|
"419 5641 8353.951860004401\n",
|
|
"420 1444 8676.625836361147\n",
|
|
"421 12900 2321.255461480635\n",
|
|
"422 6500 4629.528409764403\n",
|
|
"423 7506 13467.919271136741\n",
|
|
"424 6438 7930.93744973132\n",
|
|
"425 2261 13370.226646925103\n",
|
|
"426 2121 6247.557132112603\n",
|
|
"427 5437 3592.393531883706\n",
|
|
"428 1536 3084.700451088983\n",
|
|
"429 9295 11590.303689144444\n",
|
|
"430 3252 6586.4530811986915\n",
|
|
"431 1331 2974.1520911988323\n",
|
|
"432 5442 10642.588370514337\n",
|
|
"433 4527 4146.7680464203095\n",
|
|
"434 6500 5535.980475001773\n",
|
|
"435 1238 4462.334896687268\n",
|
|
"436 10702 3998.7386180649096\n",
|
|
"437 8056 6374.403929120289\n",
|
|
"438 4517 3968.6353947354496\n",
|
|
"439 5108 11261.565350761522\n",
|
|
"440 6354 8418.830560829478\n",
|
|
"441 4322 3305.0788833275337\n",
|
|
"442 3129 5121.086170529202\n",
|
|
"443 2486 17408.009128939066\n",
|
|
"444 6200 4741.563419125667\n",
|
|
"445 10320 5313.293980930455\n",
|
|
"446 5204 11883.544862171222\n",
|
|
"447 7429 11135.61940509253\n",
|
|
"448 1837 5034.717550057033\n",
|
|
"449 3311 5410.885965608366\n",
|
|
"450 5425 4536.934131183477\n",
|
|
"451 1141 9035.881634012976\n",
|
|
"452 8142 3094.3729707170237\n",
|
|
"453 9630 5759.575130507457\n",
|
|
"454 3400 2189.066685634728\n",
|
|
"455 5991 8549.539484234854\n",
|
|
"456 4537 2673.967338892564\n",
|
|
"457 1389 4718.1351657552605\n",
|
|
"458 6560 12005.006870572877\n",
|
|
"459 5417 8357.181906814383\n",
|
|
"460 1326 11175.583517484314\n",
|
|
"461 1226 11704.844017633459\n",
|
|
"462 9439 7822.772984507\n",
|
|
"463 6075 3640.18245452465\n",
|
|
"464 4139 12954.348380007397\n",
|
|
"465 6921 4400.219099707537\n",
|
|
"466 1412 3860.7463982703334\n",
|
|
"467 1580 3516.678313124346\n",
|
|
"468 6480 3492.9019039587733\n",
|
|
"469 7740 8106.980110824186\n",
|
|
"470 9187 2395.5573418076624\n",
|
|
"471 5923 15299.331508342839\n",
|
|
"472 1690 10362.006379124352\n",
|
|
"473 1829 9487.82923378465\n",
|
|
"474 13132 12486.558265969294\n",
|
|
"475 5673 14305.952439617615\n",
|
|
"476 10143 14864.146909677464\n",
|
|
"477 2631 2331.8590852138564\n",
|
|
"478 16753 3373.2896869040014\n",
|
|
"479 8300 6524.596616257537\n",
|
|
"480 2541 9190.959336462798\n",
|
|
"481 1638 8198.234066736764\n",
|
|
"482 6097 15793.35353841358\n",
|
|
"483 8250 10749.527129598226\n",
|
|
"484 1638 2035.970947988072\n",
|
|
"485 1145 4696.342706754138\n",
|
|
"486 8300 4612.694230043811\n",
|
|
"487 9750 12698.282535481198\n",
|
|
"488 12532 16313.121000032259\n",
|
|
"489 10739 4867.058831371186\n",
|
|
"490 18230 8459.589175229492\n",
|
|
"491 6125 9447.347582186656\n",
|
|
"492 6225 4050.031770291008\n",
|
|
"493 16509 3119.674368698192\n",
|
|
"494 6782 15229.554761308495\n",
|
|
"495 6125 6761.654267834814\n",
|
|
"496 1681 16165.79694411498\n",
|
|
"497 1798 5819.205951991664\n",
|
|
"498 13385 4938.678542279483\n",
|
|
"499 12300 12501.32563965754\n",
|
|
"500 4100 6001.137996121012\n",
|
|
"501 6190 1475.6160798039427\n",
|
|
"502 9246 3958.254475739062\n",
|
|
"503 14322 5117.760831637467\n",
|
|
"504 7396 3351.115059928001\n",
|
|
"505 3851 11349.992398228365\n",
|
|
"506 4734 2254.841749289375\n",
|
|
"507 2058 4497.8123659139665\n",
|
|
"508 8869 6254.021135129916\n",
|
|
"509 11269 5503.560118534005\n",
|
|
"510 2506 3923.4245548541553\n",
|
|
"511 11730 13493.388189645208\n",
|
|
"512 8045 11793.907143350536\n",
|
|
"513 7500 19150.25573472374\n",
|
|
"514 9166 1503.1775986772748\n",
|
|
"515 5368 768.7325537958045\n",
|
|
"516 2395 11349.634056006476\n",
|
|
"517 9087 6323.225289121863\n",
|
|
"518 7407 12191.765888863798\n",
|
|
"519 5949 4662.532235685591\n",
|
|
"520 10216 1407.9870443357727\n",
|
|
"521 4731 2077.9540157496162\n",
|
|
"522 9248 7446.569623693983\n",
|
|
"523 18500 7152.090683775011\n",
|
|
"524 6308 2046.8540380357522\n",
|
|
"525 5748 7367.288137184615\n",
|
|
"526 3138 13384.130363257449\n",
|
|
"527 2012 10653.209976527616\n",
|
|
"528 8657 4045.4916586458935\n",
|
|
"529 7500 5925.985098665058\n",
|
|
"530 1463 16696.570686355375\n",
|
|
"531 7625 8283.901419829008\n",
|
|
"532 17260 1332.645261264805\n",
|
|
"533 7020 8097.968034350275\n",
|
|
"534 6592 12655.393492203057\n",
|
|
"535 1463 9686.161910222057\n",
|
|
"536 5112 14887.791991132963\n",
|
|
"537 9672 11980.464991642053\n",
|
|
"538 5360 3200.7882786135533\n",
|
|
"539 7338 4568.898795584218\n",
|
|
"540 4113 4548.0218263260895\n",
|
|
"541 5443 6464.617670339604\n",
|
|
"542 7368 3509.1119407497345\n",
|
|
"543 8017 14989.39181389453\n",
|
|
"544 8619 5951.016907958763\n",
|
|
"545 2651 2389.4447101228966\n",
|
|
"546 14840 5539.6976673052395\n",
|
|
"547 6041 5739.887811430656\n",
|
|
"548 8685 4713.845075975436\n",
|
|
"549 1252 10368.07303045706\n",
|
|
"550 2655 6283.479460803347\n",
|
|
"551 15140 10087.168600437875\n",
|
|
"552 7885 5075.27707615952\n",
|
|
"553 8685 8212.189918949982\n",
|
|
"554 7542 5046.9757285848955\n",
|
|
"555 4676 12393.032671740262\n",
|
|
"556 2450 4089.113201090722\n",
|
|
"557 7225 8668.848872884808\n",
|
|
"558 18500 3625.579521584379\n",
|
|
"559 8499 11175.583517484314\n",
|
|
"560 5057 11954.107603250402\n",
|
|
"561 8418 9871.105936883523\n",
|
|
"562 22885 4480.13584030295\n",
|
|
"563 2820 12949.498758756125\n",
|
|
"564 1868 9863.602442864936\n",
|
|
"565 2523 7594.763347975478\n",
|
|
"566 10058 4106.730423429261\n",
|
|
"567 7138 6882.786147983847\n",
|
|
"568 7610 8398.894749936191\n",
|
|
"569 2670 3175.8554412316626\n",
|
|
"570 2364 12814.987663022268\n",
|
|
"571 8435 5162.810338028615\n",
|
|
"572 8841 1036.8156262763082\n",
|
|
"573 15240 6022.001956780606\n",
|
|
"574 10180 10816.936615359207\n",
|
|
"575 12534 6207.885794866743\n",
|
|
"576 20520 4784.208803197017\n",
|
|
"577 13500 2214.8851307287455\n",
|
|
"578 5000 3893.0598787794556\n",
|
|
"579 12813 6018.340623795528\n",
|
|
"580 7050 4794.636511757451\n",
|
|
"581 6665 719.7944431444473\n",
|
|
"582 16350 12795.036594803416\n",
|
|
"583 25623 14184.768449790256\n",
|
|
"584 2063 9810.563762098913\n",
|
|
"585 3393 4663.9954601549625\n",
|
|
"586 2217 8773.41625094894\n",
|
|
"587 9003 3036.44495239287\n",
|
|
"588 14470 14674.536778589223\n",
|
|
"589 7603 7067.956282785245\n",
|
|
"590 8685 4819.903639940648\n",
|
|
"591 6436 3119.275984646008\n",
|
|
"592 6112 13083.263275048763\n",
|
|
"593 6127 4357.32710824466\n",
|
|
"594 1373 15735.44034049763\n",
|
|
"595 8046 9829.34768547027\n",
|
|
"596 6865 3214.003054487506\n",
|
|
"597 8286 5601.510414450099\n",
|
|
"598 6302 4623.138939835301\n",
|
|
"599 2208 11173.469568286891\n",
|
|
"600 3615 9099.567629826535\n",
|
|
"601 15940 1128.3453286817544\n",
|
|
"602 5010 12327.197143168583\n",
|
|
"603 8212 2358.011077505077\n",
|
|
"604 1272 3507.632555908359\n",
|
|
"605 2540 3225.323372800012\n",
|
|
"606 9600 4090.038562587634\n",
|
|
"607 26043 9172.521869455777\n",
|
|
"608 6103 9608.33642905634\n",
|
|
"609 2747 3357.020239766667\n",
|
|
"610 2960 6086.4085631268035\n",
|
|
"611 26043 7352.588636862007\n",
|
|
"612 11444 5749.178712087224\n",
|
|
"613 6608 7009.789042663147\n",
|
|
"614 8685 4860.877678091679\n",
|
|
"615 7809 2574.283478221735\n",
|
|
"616 10910 16177.070094482096\n",
|
|
"617 6015 7330.670097266955\n",
|
|
"618 5233 5874.080532458615\n",
|
|
"619 1425 13376.351664670756\n",
|
|
"620 11160 11489.591677776654\n",
|
|
"621 2105 8093.267208688064\n",
|
|
"622 7428 12065.410201066788\n",
|
|
"623 5204 4090.2545827148147\n",
|
|
"624 1851 4009.0006330108404\n",
|
|
"625 26043 3438.1572509050984\n",
|
|
"626 5426 2253.846596804711\n",
|
|
"627 6219 17137.025597423733\n",
|
|
"628 11212 8852.762121006672\n",
|
|
"629 8124 2764.2110979500026\n",
|
|
"630 1982 16415.374793629482\n",
|
|
"631 3694 8244.824334909112\n",
|
|
"632 6075 2457.9006791839233\n",
|
|
"633 4561 2321.330005122368\n",
|
|
"634 3042 4222.503424740425\n",
|
|
"635 19747 8223.799821601031\n",
|
|
"636 15145 1871.3160227674202\n",
|
|
"637 7072 4620.709006674663\n",
|
|
"638 2582 2230.203623949988\n",
|
|
"639 1425 5754.610018189932\n",
|
|
"640 5219 18795.832958315765\n",
|
|
"641 7182 2545.237704767577\n",
|
|
"642 8899 4793.967670294426\n",
|
|
"643 6313 3355.7302621566423\n",
|
|
"644 2435 1977.784883709689\n",
|
|
"645 3108 5286.771821824771\n",
|
|
"646 12198 6863.347568508702\n",
|
|
"647 5761 3753.5604597260553\n",
|
|
"648 8685 3501.396202209124\n",
|
|
"649 8141 6710.759936928313\n",
|
|
"650 9185 6449.711014158032\n",
|
|
"651 5331 6111.495678866401\n"
|
|
]
|
|
},
|
|
{
|
|
"ename": "IndexError",
|
|
"evalue": "index 652 is out of bounds for axis 0 with size 652",
|
|
"output_type": "error",
|
|
"traceback": [
|
|
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
|
|
"\u001b[0;31mIndexError\u001b[0m Traceback (most recent call last)",
|
|
"\u001b[0;32m/tmp/ipykernel_56157/1621740581.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0menumerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0my_pred_rf\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
|
|
"\u001b[0;31mIndexError\u001b[0m: index 652 is out of bounds for axis 0 with size 652"
|
|
]
|
|
}
|
|
],
|
|
"source": [
|
"# Actual vs. predicted attendance on the test set.\n",
"# y_pred_rf holds one prediction per row of X_test, so it has to be paired with y_test;\n",
"# indexing it by position in the full target y pairs unrelated rows and runs past its end.\n",
"assert len(y_test) == len(y_pred_rf), \"y_pred_rf does not match the test split\"\n",
"for i, (actual, predicted) in enumerate(zip(y_test, y_pred_rf)):\n",
"    print(i, actual, predicted)"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": 7,
|
|
"id": "bba1ad86",
|
|
"metadata": {},
|
|
"outputs": [
|
|
{
|
|
"data": {
|
|
"text/plain": [
|
|
"2171"
|
|
]
|
|
},
|
|
"execution_count": 7,
|
|
"metadata": {},
|
|
"output_type": "execute_result"
|
|
}
|
|
],
|
|
"source": [
|
"y.shape[0]"
|
|
]
|
|
},
|
|
{
|
|
"cell_type": "code",
|
|
"execution_count": null,
|
|
"id": "970a3733",
|
|
"metadata": {},
|
|
"outputs": [],
|
|
"source": []
|
|
}
|
|
],
|
|
"metadata": {
|
|
"kernelspec": {
|
|
"display_name": "Python 3.7.13 ('leagues')",
|
|
"language": "python",
|
|
"name": "python3"
|
|
},
|
|
"language_info": {
|
|
"codemirror_mode": {
|
|
"name": "ipython",
|
|
"version": 3
|
|
},
|
|
"file_extension": ".py",
|
|
"mimetype": "text/x-python",
|
|
"name": "python",
|
|
"nbconvert_exporter": "python",
|
|
"pygments_lexer": "ipython3",
|
|
"version": "3.7.13"
|
|
},
|
|
"vscode": {
|
|
"interpreter": {
|
|
"hash": "a07b7f3079ca8c056705d3c757c4f3f92f9509f33eeab9ad5420dacec37bc01a"
|
|
}
|
|
}
|
|
},
|
|
"nbformat": 4,
|
|
"nbformat_minor": 5
|
|
}
|