research/machine_learning/scripts/ml/gradientboost.ipynb
2024-01-31 21:41:29 +01:00

960 lines
61 KiB
Plaintext

{
"cells": [
{
"cell_type": "markdown",
"id": "4d2a8b6c",
"metadata": {},
"source": [
"#### Database"
]
},
{
"cell_type": "code",
"execution_count": 1,
"id": "7be9eeff",
"metadata": {},
"outputs": [],
"source": [
"# Bootstrap the Django project so that its ORM can be queried from this notebook.\n",
"import os\n",
"import sys\n",
"\n",
"import numpy as np\n",
"import pandas as pd\n",
"\n",
"# Location of the Django project; set LEAGUES_PROJECT_PATH to run on another machine.\n",
"PROJECT_PATH = os.environ.get('LEAGUES_PROJECT_PATH', '/home/md/Work/ligalytics/leagues_stable/')\n",
"sys.path.insert(0, PROJECT_PATH)\n",
"os.environ.setdefault(\"DJANGO_SETTINGS_MODULE\", \"leagues.settings\")\n",
"\n",
"from leagues import settings\n",
"# Point the default connection at the SQLite file inside the project directory.\n",
"settings.DATABASES['default']['NAME'] = os.path.join(PROJECT_PATH, 'db.sqlite3')\n",
"\n",
"import django\n",
"django.setup()\n",
"\n",
"# Project imports stay below django.setup(), as in the original cell order.\n",
"from django.db.models import F\n",
"from scheduler.models import Game, Season\n",
"from common.functions import distanceInKmByGPS\n",
"\n",
"SEASON_NAME = 'Imported: Benchmark Season'\n",
"season = Season.objects.filter(nicename=SEASON_NAME).first()\n",
"if season is None:\n",
"    # .first() returns None when nothing matches; filtering games on season=None\n",
"    # would then silently select the wrong rows instead of failing.\n",
"    raise LookupError('Season %r not found in the database' % SEASON_NAME)\n",
"\n",
"# One dict per game that has a historic season, with the team attributes used\n",
"# for feature engineering flattened into the row.\n",
"games = Game.objects.filter(season=season).exclude(historic_season=None).annotate(\n",
"    home=F('homeTeam__shortname'),\n",
"    away=F('awayTeam__shortname'),\n",
"    home_lat=F('homeTeam__latitude'),\n",
"    home_lon=F('homeTeam__longitude'),\n",
"    home_attr=F('homeTeam__attractivity'),\n",
"    away_lat=F('awayTeam__latitude'),\n",
"    away_lon=F('awayTeam__longitude'),\n",
"    away_attr=F('awayTeam__attractivity'),\n",
"    home_country=F('homeTeam__country'),\n",
"    away_country=F('awayTeam__country'),\n",
").values()"
]
},
{
"cell_type": "markdown",
"id": "bc191792",
"metadata": {},
"source": [
"#### Dataframe"
]
},
{
"cell_type": "code",
"execution_count": 2,
"id": "1e404cf8",
"metadata": {},
"outputs": [],
"source": [
"from sklearn.preprocessing import OneHotEncoder\n",
"\n",
"# create dataset\n",
"df = pd.DataFrame.from_records(games.values())\n",
"\n",
"# data cleaning\n",
"df['time'] = df['time'].replace('', '0')  # empty time strings become '0'\n",
"# .copy() so the column assignments below write to an independent frame, not a slice\n",
"df = df[df['attendance'] != 0].copy()\n",
"\n",
"# remove outliers: keep rows strictly between the 1st and 99th percentile\n",
"out_fields = ['attendance']\n",
"for field in out_fields:\n",
"    q_low = df[field].quantile(0.01)\n",
"    q_hi = df[field].quantile(0.99)\n",
"    df = df[(df[field] < q_hi) & (df[field] > q_low)].copy()\n",
"\n",
"\n",
"# pivots: per-home-team mean and maximum attendance (indexed by homeTeam_id)\n",
"pivot_homeTeam_mean = df.pivot_table('attendance', 'homeTeam_id', aggfunc='mean')\n",
"pivot_homeTeam_max = df.pivot_table('attendance', 'homeTeam_id', aggfunc='max')\n",
"\n",
"# add more features\n",
"df['weekday'] = df['date'].map(lambda d: d.weekday())  # Monday=0 ... Sunday=6\n",
"df['day'] = df['date'].map(lambda d: d.day)\n",
"df['month'] = df['date'].map(lambda d: d.month)\n",
"df['year'] = df['date'].map(lambda d: d.year)\n",
"df['distance'] = df.apply(\n",
"    lambda r: distanceInKmByGPS(r['home_lon'], r['home_lat'], r['away_lon'], r['away_lat']),\n",
"    axis=1,\n",
")\n",
"# weekday() numbers Saturday as 5 and Sunday as 6; the former [6,7] only ever matched Sunday\n",
"df['weekend'] = df['weekday'].isin([5, 6]).astype(int)\n",
"df['winter_season'] = df['month'].isin([1, 2, 3, 10, 11, 12]).astype(int)\n",
"# per-team aggregates, looked up by the row's home team id\n",
"df['home_base'] = df['homeTeam_id'].map(pivot_homeTeam_mean['attendance'])\n",
"df['stadium_size'] = df['homeTeam_id'].map(pivot_homeTeam_max['attendance'])\n",
"# string comparison: zero-pad so that e.g. '930' sorts before '1800'\n",
"df['early'] = df['time'].map(lambda t: t.replace(':', '').zfill(4) < '1800')\n",
"# compares the text before the first '-' of historic_season with '2010'\n",
"df['before2010'] = df['historic_season'].map(lambda s: s.split('-')[0] < '2010')\n",
"\n",
"\n",
"# one hot encoding: one indicator column per category, named after the category value\n",
"ohe_fields = ['home_country']\n",
"\n",
"for field in ohe_fields:\n",
"    ohe = OneHotEncoder()\n",
"    transformed = ohe.fit_transform(df[[field]])\n",
"    df[ohe.categories_[0]] = transformed.toarray()\n",
"\n",
"# sort label to last index\n",
"cols = [c for c in df.columns if c != 'attendance'] + ['attendance']\n",
"df = df[cols]"
]
},
{
"cell_type": "markdown",
"id": "e2ea08e5",
"metadata": {},
"source": [
"#### Feature Selection and Train/Test Split"
]
},
{
"cell_type": "code",
"execution_count": 3,
"id": "74e12f87",
"metadata": {},
"outputs": [],
"source": [
"import numpy as np\n",
"import pandas as pd\n",
"import matplotlib.pyplot as plt\n",
"import seaborn as sns\n",
"from sklearn.model_selection import train_test_split, cross_val_predict\n",
"from sklearn import metrics\n",
"from sklearn.ensemble import GradientBoostingRegressor\n",
"\n",
"\n",
"label = 'attendance'\n",
"\n",
"# Columns excluded from the model inputs.\n",
"remove_columns = ['season_id', 'resultEntered', 'reversible', 'reschedule', 'homeGoals', 'awayGoals',\n",
"                  'homeGoals2', 'awayGoals2', 'homeGoals3', 'awayGoals3', 'home', 'away', 'date', 'time',\n",
"                  'id', 'historic_season',\n",
"                  'home_country', 'home_lat', 'home_lon', 'away_lat', 'away_lon', 'away_country', 'year']\n",
"# Keep the DataFrame's own column order. The former set difference produced a feature\n",
"# order that could change between kernel restarts (string hashing is randomised per\n",
"# process), which made the fit and the importance plot non-reproducible.\n",
"excluded = set(remove_columns) | {label}\n",
"feature_cols = [c for c in df.columns if c not in excluded]\n",
"# feature_cols = ['weekday','weekend','home_base','distance','winter_season']\n",
"\n",
"X = df[feature_cols]  # Features\n",
"y = df[label]  # Target variable\n",
"\n",
"# NOTE(review): home_base and stadium_size are aggregated over all rows before this\n",
"# split, so they already contain attendance values of the test rows.\n",
"X_train, X_test, y_train, y_test = train_test_split(\n",
"    X, y, test_size=0.3, random_state=1)  # 70% training and 30% test"
]
},
{
"cell_type": "code",
"execution_count": 4,
"id": "45e08026",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"Random Forest Regression Accuracy: 0.6976274695189291\n"
]
}
],
"source": [
"# NOTE: the rf_* names are kept because later cells use them; the estimator is a\n",
"# gradient boosting model, not a random forest.\n",
"rf_regressor = GradientBoostingRegressor(n_estimators=200, random_state=42)\n",
"rf_regressor.fit(X_train, y_train)\n",
"\n",
"# Predict attendance for the held-out test set\n",
"y_pred_rf = rf_regressor.predict(X_test)\n",
"\n",
"# score() of a regressor is the coefficient of determination (R^2), not an accuracy\n",
"print('Gradient Boosting Regression R^2 (test set): ', rf_regressor.score(X_test, y_test))\n",
"\n",
"# Alternative: out-of-fold predictions via 10-fold cross validation\n",
"# y_pred_rf = cross_val_predict(rf_regressor, X, y, cv=10)\n",
"\n",
"# R^2 of the cross-validated predictions\n",
"# accuracy_rf = metrics.r2_score(y, y_pred_rf)\n",
"# print('Cross-Predicted(KFold) Gradient Boosting Regression R^2: ', accuracy_rf)"
]
},
{
"cell_type": "code",
"execution_count": 5,
"id": "0de49b8a",
"metadata": {},
"outputs": [
{
"data": {
"image/png": "",
"text/plain": [
"<Figure size 1080x720 with 1 Axes>"
]
},
"metadata": {
"needs_background": "light"
},
"output_type": "display_data"
}
],
"source": [
"# Horizontal bar chart of the fitted model's feature importances, largest first.\n",
"importances = rf_regressor.feature_importances_\n",
"order = np.argsort(-importances)\n",
"f, ax = plt.subplots(figsize=(15, 10))\n",
"sns.barplot(x=importances[order], y=X_train.columns.values[order], orient='h', ax=ax)\n",
"ax.set_xlabel(\"feature importance\")\n",
"plt.tight_layout()\n",
"plt.show()"
]
},
{
"cell_type": "code",
"execution_count": 6,
"id": "4c1f8b45",
"metadata": {},
"outputs": [
{
"name": "stdout",
"output_type": "stream",
"text": [
"0 4000 6269.331273160804\n",
"1 3264 2212.472559220525\n",
"2 6000 4474.321544046366\n",
"3 4250 5853.876279843164\n",
"4 1200 2724.8479999971523\n",
"5 4300 12248.194405029995\n",
"6 3874 12179.504105471333\n",
"7 2800 7179.957816540268\n",
"8 5500 4343.454242132351\n",
"9 6000 15615.670772432313\n",
"10 3500 2142.013025198476\n",
"11 4500 6581.086576491373\n",
"12 2140 2787.000793225451\n",
"13 3146 7948.163004948026\n",
"14 2600 5277.360995538767\n",
"15 4875 4182.090794311384\n",
"16 5807 1298.0546590068432\n",
"17 5200 7641.152367897079\n",
"18 3500 12709.91385314257\n",
"19 2643 13796.44798966877\n",
"20 4000 2910.0979973906897\n",
"21 2500 11367.203439146624\n",
"22 2000 4578.676165761646\n",
"23 3198 11801.197736843704\n",
"24 3571 3256.2683962230926\n",
"25 2712 13963.658569196019\n",
"26 2100 3428.2076365623343\n",
"27 4525 3179.082309242862\n",
"28 6625 5319.700728374097\n",
"29 4966 4814.201898718184\n",
"30 2000 11668.774282716573\n",
"31 2100 16459.759735440115\n",
"32 2310 10424.049272604385\n",
"33 2600 3249.7584854521983\n",
"34 2000 4933.417332760704\n",
"35 4300 11330.47572253357\n",
"36 2734 4916.62667788047\n",
"37 3500 7616.108008546191\n",
"38 3050 5834.707115002423\n",
"39 5256 10956.873320747929\n",
"40 3012 1746.8793669215172\n",
"41 5060 4642.521259437015\n",
"42 1500 10636.260356819768\n",
"43 4000 6226.573175422698\n",
"44 1950 6253.5032474003465\n",
"45 2300 5174.122252417559\n",
"46 2300 2724.3318310328705\n",
"47 1950 9804.743199526134\n",
"48 3058 3874.7670154643415\n",
"49 2000 10001.45516441721\n",
"50 2345 5023.8562523965875\n",
"51 5500 5174.122252417559\n",
"52 5585 3817.7336514404283\n",
"53 4046 4720.395073786049\n",
"54 6000 4569.1440149122045\n",
"55 4384 4918.984377964906\n",
"56 3000 4674.700091188421\n",
"57 3500 3544.0179791758733\n",
"58 7000 18261.80159810542\n",
"59 10195 13504.402960006135\n",
"60 3476 2439.2710475675904\n",
"61 2120 6683.8055866507775\n",
"62 3800 4831.40407430577\n",
"63 2675 18297.8862272201\n",
"64 6603 5900.839366216985\n",
"65 1500 5547.896256687706\n",
"66 4000 15716.448413829125\n",
"67 4545 3510.458423897759\n",
"68 1396 4299.864451241506\n",
"69 5400 11340.993418688882\n",
"70 5041 13344.492446272585\n",
"71 1500 12842.717635745401\n",
"72 1800 2826.6198584357285\n",
"73 3189 2216.6069457661515\n",
"74 3800 7551.124847543301\n",
"75 2178 10854.693947136366\n",
"76 6169 3754.054098366518\n",
"77 2676 6227.444878272318\n",
"78 3510 4372.710484500164\n",
"79 3900 5899.365613773657\n",
"80 2120 9146.338397438585\n",
"81 8000 6598.214034291334\n",
"82 2500 4180.2412129479535\n",
"83 4016 1013.1917302016966\n",
"84 1500 13356.059667395755\n",
"85 2860 3859.7092616602254\n",
"86 2150 12546.493369090958\n",
"87 3336 13781.48736284787\n",
"88 8820 6867.843525597063\n",
"89 4792 9977.417685682762\n",
"90 1650 23425.898130663616\n",
"91 2000 6589.051500702451\n",
"92 2111 3109.4945264556886\n",
"93 4470 13408.035401832343\n",
"94 7000 5519.4148042321\n",
"95 3850 6089.400396461468\n",
"96 4366 9610.498715489919\n",
"97 2645 8316.017866765993\n",
"98 2384 6197.035790504067\n",
"99 4522 12779.77200503699\n",
"100 6328 14744.016207170152\n",
"101 3877 19458.90971123009\n",
"102 2000 4874.224861034961\n",
"103 4157 5208.703053494322\n",
"104 2942 13386.059288545708\n",
"105 3655 13257.062956113012\n",
"106 4500 2441.3256508749882\n",
"107 2964 2416.608601291409\n",
"108 2863 2553.749826440011\n",
"109 4935 11198.828086622805\n",
"110 2526 12041.524132520446\n",
"111 5679 8045.757009722594\n",
"112 7286 13009.125855582837\n",
"113 6055 12448.19779590953\n",
"114 1200 11188.064346395086\n",
"115 4110 4271.21931546039\n",
"116 1957 3087.6529257626803\n",
"117 1790 2569.376378289409\n",
"118 5422 6173.099807850697\n",
"119 4650 12505.12258551472\n",
"120 5297 12652.949405216323\n",
"121 3036 6268.840108714523\n",
"122 3233 9367.596675826102\n",
"123 12000 2337.3771641354024\n",
"124 7632 1819.0748787672667\n",
"125 3620 7428.132912505317\n",
"126 2000 2124.849872483271\n",
"127 2145 6073.702450147759\n",
"128 2227 15691.707999141212\n",
"129 2520 17731.752052395845\n",
"130 10000 9224.693549735079\n",
"131 2000 4333.254162853479\n",
"132 4052 5463.585852647499\n",
"133 2137 3385.7917346498257\n",
"134 2609 8949.299267841006\n",
"135 3256 5594.136151838447\n",
"136 8173 7321.006115614261\n",
"137 1250 6314.334305949203\n",
"138 7401 1841.6632769675457\n",
"139 4200 5913.92021057092\n",
"140 6100 5914.498891029855\n",
"141 5182 4485.159036791194\n",
"142 1300 3930.555183694012\n",
"143 2117 2087.6087105330876\n",
"144 6500 3129.218824655229\n",
"145 5174 19100.66955411291\n",
"146 3867 7381.962946265084\n",
"147 1918 3668.522599331723\n",
"148 2800 5984.122720695453\n",
"149 7648 5579.807332727605\n",
"150 5638 5000.766880937242\n",
"151 5262 8796.640913054198\n",
"152 1650 11038.130604200423\n",
"153 1657 3053.4760351098107\n",
"154 4086 16594.785800693066\n",
"155 9000 3561.181162895718\n",
"156 1500 5042.543289014211\n",
"157 8145 12723.53945595642\n",
"158 2625 7117.118765444254\n",
"159 6281 3092.870875123699\n",
"160 4520 1916.9886938042089\n",
"161 1200 3334.4719289950585\n",
"162 4829 4248.693921085489\n",
"163 1760 3065.4160555916155\n",
"164 3469 10943.4771813175\n",
"165 7500 4646.274655834034\n",
"166 5227 7247.410995462059\n",
"167 1765 12061.617431570865\n",
"168 5200 3906.7362684340383\n",
"169 6402 5802.18818098374\n",
"170 4832 3735.241252929307\n",
"171 1500 8821.101907961975\n",
"172 2342 3612.477133461679\n",
"173 2799 908.2647209562191\n",
"174 3850 3078.4680731926246\n",
"175 4200 3812.544744635514\n",
"176 4531 2705.9998772537424\n",
"177 1751 1967.6894728073173\n",
"178 4250 5924.714538352343\n",
"179 5705 6513.58136727248\n",
"180 3528 1966.268176067289\n",
"181 2496 4368.04545595507\n",
"182 4370 2024.6278361643576\n",
"183 1350 5634.107750848085\n",
"184 5334 10956.873320747929\n",
"185 1423 6752.977449121771\n",
"186 4129 4490.334901030411\n",
"187 5858 2706.770656503444\n",
"188 3300 4860.877678091679\n",
"189 3500 3893.6704796446884\n",
"190 10280 3778.999270841025\n",
"191 4500 7722.956089373864\n",
"192 10500 3823.8621517621054\n",
"193 3932 5270.396448543778\n",
"194 5500 7707.251425986663\n",
"195 2200 14389.91484985415\n",
"196 8206 6044.3459440998595\n",
"197 8000 4457.480201516091\n",
"198 6372 8890.061129175148\n",
"199 7900 13621.063242184871\n",
"200 1628 13169.821966149577\n",
"201 4142 3606.329399178841\n",
"202 1150 6794.3761007737885\n",
"203 1750 3527.0690712828796\n",
"204 4072 4870.13044656876\n",
"205 1176 14005.1555660555\n",
"206 3200 5021.013261618377\n",
"207 1715 10318.676591702464\n",
"208 7530 10459.245297486614\n",
"209 4600 8316.395535933456\n",
"210 1200 5095.800766098369\n",
"211 4452 17619.45148176299\n",
"212 2400 2917.6212527362745\n",
"213 4057 3523.9765596992324\n",
"214 5000 7568.184421468349\n",
"215 4147 2328.238657453435\n",
"216 3046 9816.145570783112\n",
"217 6215 2815.1845153039812\n",
"218 3350 2458.220350724582\n",
"219 3500 1143.4289915252082\n",
"220 5870 3349.522734018162\n",
"221 4113 6562.149215912538\n",
"222 3420 15899.046839388688\n",
"223 6116 9045.668754767581\n",
"224 5902 2748.9553238280632\n",
"225 3787 4271.853869225162\n",
"226 3600 7439.183383616434\n",
"227 7017 2210.108006140514\n",
"228 10280 4927.066871405887\n",
"229 5600 9564.813393139277\n",
"230 3656 3329.8106332184043\n",
"231 6480 17110.713931585673\n",
"232 1646 4677.074303376587\n",
"233 2600 4440.882887387751\n",
"234 4300 2118.7542046100843\n",
"235 7948 3214.332854949672\n",
"236 4579 7753.321604795282\n",
"237 4364 6460.580153817578\n",
"238 5000 3400.25051693908\n",
"239 2034 4284.09527513928\n",
"240 3500 5231.567751256019\n",
"241 5688 6856.195658240203\n",
"242 1800 12184.56551356091\n",
"243 10131 2598.8215825730167\n",
"244 5784 5943.724350980219\n",
"245 1813 4361.9722090698815\n",
"246 3700 5182.000108363626\n",
"247 6700 5850.0908748940765\n",
"248 3700 2399.8908348974273\n",
"249 7799 1934.7516235634123\n",
"250 1884 11765.60702403286\n",
"251 3042 4656.923175922518\n",
"252 5000 13415.8010505132\n",
"253 5112 13024.815014128593\n",
"254 1404 3154.9780459262442\n",
"255 2471 4309.257915103401\n",
"256 7749 10739.861964061618\n",
"257 6254 3516.7357048629206\n",
"258 2502 11979.741281816012\n",
"259 2300 3650.093842398789\n",
"260 6500 11606.67581375423\n",
"261 2646 2003.5526871642137\n",
"262 9546 3357.754620510872\n",
"263 7500 1954.3537407404217\n",
"264 11016 5754.557478633303\n",
"265 5763 9554.299673198937\n",
"266 2460 9835.688834354334\n",
"267 5511 3086.8504515496356\n",
"268 1857 12616.742317378286\n",
"269 7000 3003.607544650991\n",
"270 6333 2916.8409179975624\n",
"271 6107 4089.944537354285\n",
"272 1518 2032.35131917741\n",
"273 9310 13077.88651001709\n",
"274 3551 5538.163168934835\n",
"275 1700 5176.458388224016\n",
"276 2250 6964.458867728808\n",
"277 6000 3658.89357449004\n",
"278 2003 12082.974153438317\n",
"279 15183 3440.5699078224566\n",
"280 7113 3704.6762193220106\n",
"281 3818 7853.080965569755\n",
"282 12300 4595.931196930642\n",
"283 12488 4204.879371769705\n",
"284 8000 14443.56582836753\n",
"285 10832 6863.813679372925\n",
"286 2107 6377.807460294606\n",
"287 2100 11228.724002036284\n",
"288 14135 4931.900522781224\n",
"289 6115 -1359.8525015661405\n",
"290 9364 7649.975494379696\n",
"291 4773 9481.483722041376\n",
"292 3525 3903.097436115244\n",
"293 6126 3235.0879045787524\n",
"294 6487 6016.561185150087\n",
"295 3879 5963.8817259278985\n",
"296 4943 2022.7875651402155\n",
"297 1335 16308.04344887568\n",
"298 4125 3686.2401457869464\n",
"299 7986 19570.539544136012\n",
"300 5000 1647.3199417777416\n",
"301 3559 10844.540513558119\n",
"302 6573 6749.5080657275785\n",
"303 2300 7761.8563105694675\n",
"304 5117 6850.569455542703\n",
"305 5000 6749.5080657275785\n",
"306 7165 7562.513169172154\n",
"307 1406 4792.945224334402\n",
"308 12300 5438.795622303128\n",
"309 3573 4076.6328454195104\n",
"310 6500 6484.405267932639\n",
"311 4508 4454.794170262632\n",
"312 7546 3612.3231311814357\n",
"313 5413 6996.1341583386675\n",
"314 5754 3103.9097707577357\n",
"315 1307 3807.778748518246\n",
"316 5433 3244.8492954237204\n",
"317 2304 3555.7092877099694\n",
"318 4000 15777.67435290044\n",
"319 6425 7309.990757727653\n",
"320 7250 11630.888375951426\n",
"321 5500 8636.615133701885\n",
"322 1800 8768.014881915431\n",
"323 2240 4826.610795633974\n",
"324 9000 10890.956739194247\n",
"325 1266 5814.283121498163\n",
"326 3850 6443.817549805847\n",
"327 2122 4535.813236908496\n",
"328 6423 4517.133895929519\n",
"329 6455 12060.20986179786\n",
"330 2100 9687.757282298406\n",
"331 7843 5535.984701360246\n",
"332 9617 3697.898412456338\n",
"333 5033 13417.324343888626\n",
"334 1129 1900.0831637980234\n",
"335 1500 9359.137469515703\n",
"336 8932 4625.923230167911\n",
"337 4637 6298.491882691631\n",
"338 15327 8789.796058286662\n",
"339 1233 3349.3518456663473\n",
"340 2364 5489.380456222845\n",
"341 10316 10482.794651236341\n",
"342 13200 816.4886171815257\n",
"343 1303 2434.5700084840264\n",
"344 8687 1339.7548137515469\n",
"345 1653 14174.38517292645\n",
"346 7067 4769.726084812967\n",
"347 8265 6296.217972893376\n",
"348 1587 3735.0734883030373\n",
"349 2479 9172.144059825323\n",
"350 6366 2943.565074257849\n",
"351 5114 4607.856876244279\n",
"352 6138 6525.133501060625\n",
"353 1765 5306.257077971849\n",
"354 3129 1846.9373281342548\n",
"355 2295 3398.94891754905\n",
"356 5507 6787.25326071226\n",
"357 5200 11426.371872238831\n",
"358 6326 13253.411199790291\n",
"359 10804 12321.66926933166\n",
"360 6721 7784.752069975153\n",
"361 5574 3078.4680731926246\n",
"362 10020 5279.60487971954\n",
"363 3678 3703.664495952156\n",
"364 4342 6008.626463397685\n",
"365 8000 12218.65449210225\n",
"366 1687 4676.4051865459105\n",
"367 1967 6462.389387331538\n",
"368 27252 4596.524835292175\n",
"369 20520 10707.201673752295\n",
"370 10000 16951.68427825804\n",
"371 1661 5088.693439115733\n",
"372 1356 4243.341369783109\n",
"373 8000 13092.177864088904\n",
"374 6288 7390.894960432231\n",
"375 9979 13110.150275789669\n",
"376 3083 9102.1199952011\n",
"377 1574 12359.06343032517\n",
"378 10452 3163.5893828816875\n",
"379 4790 4611.20167092646\n",
"380 5563 4506.779900903538\n",
"381 1103 5630.433669946042\n",
"382 3846 14705.914690376329\n",
"383 3750 1678.928854632361\n",
"384 4309 4188.9078922720755\n",
"385 6254 2185.786798925416\n",
"386 2133 5240.602438128821\n",
"387 12800 6440.899480264031\n",
"388 5300 2202.973850976274\n",
"389 10102 3349.487579181281\n",
"390 9326 6276.255533517775\n",
"391 2613 10027.074674303978\n",
"392 11976 3863.6273789168304\n",
"393 12143 3393.520429895661\n",
"394 13200 3769.0173149934762\n",
"395 6320 4363.984786293422\n",
"396 1542 12775.267839770944\n",
"397 4560 4771.697760449484\n",
"398 8304 4637.7607774767075\n",
"399 10480 4525.181055134041\n",
"400 5352 6595.799090340065\n",
"401 2137 6969.014509412282\n",
"402 5169 4750.975859023578\n",
"403 2799 11080.256944317674\n",
"404 6000 2003.8289254279437\n",
"405 4986 4197.359917287667\n",
"406 1824 4332.950723087893\n",
"407 1562 5099.093054122171\n",
"408 5890 12081.878696518148\n",
"409 6077 9270.461413927558\n",
"410 1485 1496.4321088051206\n",
"411 1825 4246.200510854761\n",
"412 5340 3255.3624000842133\n",
"413 9237 1859.449426524448\n",
"414 6499 7976.974080873097\n",
"415 1240 4436.075476859059\n",
"416 4656 3617.4469653780425\n",
"417 2335 4997.427948460792\n",
"418 8000 8685.398728410411\n",
"419 5641 8353.951860004401\n",
"420 1444 8676.625836361147\n",
"421 12900 2321.255461480635\n",
"422 6500 4629.528409764403\n",
"423 7506 13467.919271136741\n",
"424 6438 7930.93744973132\n",
"425 2261 13370.226646925103\n",
"426 2121 6247.557132112603\n",
"427 5437 3592.393531883706\n",
"428 1536 3084.700451088983\n",
"429 9295 11590.303689144444\n",
"430 3252 6586.4530811986915\n",
"431 1331 2974.1520911988323\n",
"432 5442 10642.588370514337\n",
"433 4527 4146.7680464203095\n",
"434 6500 5535.980475001773\n",
"435 1238 4462.334896687268\n",
"436 10702 3998.7386180649096\n",
"437 8056 6374.403929120289\n",
"438 4517 3968.6353947354496\n",
"439 5108 11261.565350761522\n",
"440 6354 8418.830560829478\n",
"441 4322 3305.0788833275337\n",
"442 3129 5121.086170529202\n",
"443 2486 17408.009128939066\n",
"444 6200 4741.563419125667\n",
"445 10320 5313.293980930455\n",
"446 5204 11883.544862171222\n",
"447 7429 11135.61940509253\n",
"448 1837 5034.717550057033\n",
"449 3311 5410.885965608366\n",
"450 5425 4536.934131183477\n",
"451 1141 9035.881634012976\n",
"452 8142 3094.3729707170237\n",
"453 9630 5759.575130507457\n",
"454 3400 2189.066685634728\n",
"455 5991 8549.539484234854\n",
"456 4537 2673.967338892564\n",
"457 1389 4718.1351657552605\n",
"458 6560 12005.006870572877\n",
"459 5417 8357.181906814383\n",
"460 1326 11175.583517484314\n",
"461 1226 11704.844017633459\n",
"462 9439 7822.772984507\n",
"463 6075 3640.18245452465\n",
"464 4139 12954.348380007397\n",
"465 6921 4400.219099707537\n",
"466 1412 3860.7463982703334\n",
"467 1580 3516.678313124346\n",
"468 6480 3492.9019039587733\n",
"469 7740 8106.980110824186\n",
"470 9187 2395.5573418076624\n",
"471 5923 15299.331508342839\n",
"472 1690 10362.006379124352\n",
"473 1829 9487.82923378465\n",
"474 13132 12486.558265969294\n",
"475 5673 14305.952439617615\n",
"476 10143 14864.146909677464\n",
"477 2631 2331.8590852138564\n",
"478 16753 3373.2896869040014\n",
"479 8300 6524.596616257537\n",
"480 2541 9190.959336462798\n",
"481 1638 8198.234066736764\n",
"482 6097 15793.35353841358\n",
"483 8250 10749.527129598226\n",
"484 1638 2035.970947988072\n",
"485 1145 4696.342706754138\n",
"486 8300 4612.694230043811\n",
"487 9750 12698.282535481198\n",
"488 12532 16313.121000032259\n",
"489 10739 4867.058831371186\n",
"490 18230 8459.589175229492\n",
"491 6125 9447.347582186656\n",
"492 6225 4050.031770291008\n",
"493 16509 3119.674368698192\n",
"494 6782 15229.554761308495\n",
"495 6125 6761.654267834814\n",
"496 1681 16165.79694411498\n",
"497 1798 5819.205951991664\n",
"498 13385 4938.678542279483\n",
"499 12300 12501.32563965754\n",
"500 4100 6001.137996121012\n",
"501 6190 1475.6160798039427\n",
"502 9246 3958.254475739062\n",
"503 14322 5117.760831637467\n",
"504 7396 3351.115059928001\n",
"505 3851 11349.992398228365\n",
"506 4734 2254.841749289375\n",
"507 2058 4497.8123659139665\n",
"508 8869 6254.021135129916\n",
"509 11269 5503.560118534005\n",
"510 2506 3923.4245548541553\n",
"511 11730 13493.388189645208\n",
"512 8045 11793.907143350536\n",
"513 7500 19150.25573472374\n",
"514 9166 1503.1775986772748\n",
"515 5368 768.7325537958045\n",
"516 2395 11349.634056006476\n",
"517 9087 6323.225289121863\n",
"518 7407 12191.765888863798\n",
"519 5949 4662.532235685591\n",
"520 10216 1407.9870443357727\n",
"521 4731 2077.9540157496162\n",
"522 9248 7446.569623693983\n",
"523 18500 7152.090683775011\n",
"524 6308 2046.8540380357522\n",
"525 5748 7367.288137184615\n",
"526 3138 13384.130363257449\n",
"527 2012 10653.209976527616\n",
"528 8657 4045.4916586458935\n",
"529 7500 5925.985098665058\n",
"530 1463 16696.570686355375\n",
"531 7625 8283.901419829008\n",
"532 17260 1332.645261264805\n",
"533 7020 8097.968034350275\n",
"534 6592 12655.393492203057\n",
"535 1463 9686.161910222057\n",
"536 5112 14887.791991132963\n",
"537 9672 11980.464991642053\n",
"538 5360 3200.7882786135533\n",
"539 7338 4568.898795584218\n",
"540 4113 4548.0218263260895\n",
"541 5443 6464.617670339604\n",
"542 7368 3509.1119407497345\n",
"543 8017 14989.39181389453\n",
"544 8619 5951.016907958763\n",
"545 2651 2389.4447101228966\n",
"546 14840 5539.6976673052395\n",
"547 6041 5739.887811430656\n",
"548 8685 4713.845075975436\n",
"549 1252 10368.07303045706\n",
"550 2655 6283.479460803347\n",
"551 15140 10087.168600437875\n",
"552 7885 5075.27707615952\n",
"553 8685 8212.189918949982\n",
"554 7542 5046.9757285848955\n",
"555 4676 12393.032671740262\n",
"556 2450 4089.113201090722\n",
"557 7225 8668.848872884808\n",
"558 18500 3625.579521584379\n",
"559 8499 11175.583517484314\n",
"560 5057 11954.107603250402\n",
"561 8418 9871.105936883523\n",
"562 22885 4480.13584030295\n",
"563 2820 12949.498758756125\n",
"564 1868 9863.602442864936\n",
"565 2523 7594.763347975478\n",
"566 10058 4106.730423429261\n",
"567 7138 6882.786147983847\n",
"568 7610 8398.894749936191\n",
"569 2670 3175.8554412316626\n",
"570 2364 12814.987663022268\n",
"571 8435 5162.810338028615\n",
"572 8841 1036.8156262763082\n",
"573 15240 6022.001956780606\n",
"574 10180 10816.936615359207\n",
"575 12534 6207.885794866743\n",
"576 20520 4784.208803197017\n",
"577 13500 2214.8851307287455\n",
"578 5000 3893.0598787794556\n",
"579 12813 6018.340623795528\n",
"580 7050 4794.636511757451\n",
"581 6665 719.7944431444473\n",
"582 16350 12795.036594803416\n",
"583 25623 14184.768449790256\n",
"584 2063 9810.563762098913\n",
"585 3393 4663.9954601549625\n",
"586 2217 8773.41625094894\n",
"587 9003 3036.44495239287\n",
"588 14470 14674.536778589223\n",
"589 7603 7067.956282785245\n",
"590 8685 4819.903639940648\n",
"591 6436 3119.275984646008\n",
"592 6112 13083.263275048763\n",
"593 6127 4357.32710824466\n",
"594 1373 15735.44034049763\n",
"595 8046 9829.34768547027\n",
"596 6865 3214.003054487506\n",
"597 8286 5601.510414450099\n",
"598 6302 4623.138939835301\n",
"599 2208 11173.469568286891\n",
"600 3615 9099.567629826535\n",
"601 15940 1128.3453286817544\n",
"602 5010 12327.197143168583\n",
"603 8212 2358.011077505077\n",
"604 1272 3507.632555908359\n",
"605 2540 3225.323372800012\n",
"606 9600 4090.038562587634\n",
"607 26043 9172.521869455777\n",
"608 6103 9608.33642905634\n",
"609 2747 3357.020239766667\n",
"610 2960 6086.4085631268035\n",
"611 26043 7352.588636862007\n",
"612 11444 5749.178712087224\n",
"613 6608 7009.789042663147\n",
"614 8685 4860.877678091679\n",
"615 7809 2574.283478221735\n",
"616 10910 16177.070094482096\n",
"617 6015 7330.670097266955\n",
"618 5233 5874.080532458615\n",
"619 1425 13376.351664670756\n",
"620 11160 11489.591677776654\n",
"621 2105 8093.267208688064\n",
"622 7428 12065.410201066788\n",
"623 5204 4090.2545827148147\n",
"624 1851 4009.0006330108404\n",
"625 26043 3438.1572509050984\n",
"626 5426 2253.846596804711\n",
"627 6219 17137.025597423733\n",
"628 11212 8852.762121006672\n",
"629 8124 2764.2110979500026\n",
"630 1982 16415.374793629482\n",
"631 3694 8244.824334909112\n",
"632 6075 2457.9006791839233\n",
"633 4561 2321.330005122368\n",
"634 3042 4222.503424740425\n",
"635 19747 8223.799821601031\n",
"636 15145 1871.3160227674202\n",
"637 7072 4620.709006674663\n",
"638 2582 2230.203623949988\n",
"639 1425 5754.610018189932\n",
"640 5219 18795.832958315765\n",
"641 7182 2545.237704767577\n",
"642 8899 4793.967670294426\n",
"643 6313 3355.7302621566423\n",
"644 2435 1977.784883709689\n",
"645 3108 5286.771821824771\n",
"646 12198 6863.347568508702\n",
"647 5761 3753.5604597260553\n",
"648 8685 3501.396202209124\n",
"649 8141 6710.759936928313\n",
"650 9185 6449.711014158032\n",
"651 5331 6111.495678866401\n"
]
},
{
"ename": "IndexError",
"evalue": "index 652 is out of bounds for axis 0 with size 652",
"output_type": "error",
"traceback": [
"\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
"\u001b[0;31mIndexError\u001b[0m Traceback (most recent call last)",
"\u001b[0;32m/tmp/ipykernel_56157/1621740581.py\u001b[0m in \u001b[0;36m<module>\u001b[0;34m\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[0;32mfor\u001b[0m \u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mv\u001b[0m \u001b[0;32min\u001b[0m \u001b[0menumerate\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0my\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m----> 2\u001b[0;31m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0mv\u001b[0m\u001b[0;34m,\u001b[0m\u001b[0my_pred_rf\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mi\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
"\u001b[0;31mIndexError\u001b[0m: index 652 is out of bounds for axis 0 with size 652"
]
}
],
"source": [
"# y_pred_rf holds predictions for X_test only, so pair it with y_test. Iterating the\n",
"# full y ran past the end of y_pred_rf and compared unrelated rows.\n",
"for i, (actual, predicted) in enumerate(zip(y_test, y_pred_rf)):\n",
"    print(i, actual, predicted)"
]
},
{
"cell_type": "code",
"execution_count": 7,
"id": "bba1ad86",
"metadata": {},
"outputs": [
{
"data": {
"text/plain": [
"2171"
]
},
"execution_count": 7,
"metadata": {},
"output_type": "execute_result"
}
],
"source": [
"# number of rows in the full target Series (before the train/test split)\n",
"y.shape[0]"
]
},
{
"cell_type": "code",
"execution_count": null,
"id": "970a3733",
"metadata": {},
"outputs": [],
"source": []
}
],
"metadata": {
"kernelspec": {
"display_name": "Python 3.7.13 ('leagues')",
"language": "python",
"name": "python3"
},
"language_info": {
"codemirror_mode": {
"name": "ipython",
"version": 3
},
"file_extension": ".py",
"mimetype": "text/x-python",
"name": "python",
"nbconvert_exporter": "python",
"pygments_lexer": "ipython3",
"version": "3.7.13"
},
"vscode": {
"interpreter": {
"hash": "a07b7f3079ca8c056705d3c757c4f3f92f9509f33eeab9ad5420dacec37bc01a"
}
}
},
"nbformat": 4,
"nbformat_minor": 5
}