See attached Word doc. Need to have confirmation that the problem is well understood, as well as the...

Question

See attached Word doc. Need to have confirmation that the problem is well understood, as well as the methods to be used (Decision Trees, Random Forest, Gradient Boosting Trees) and the validation methods (one-split and k-fold cross validation, time series split).

INSTRUCTIONS · Use of the following CLASSIFICATION Machine Learning Models · Decision Trees · Random Forest · Gradient Boosting Trees · First, given the dataset “spx_tail”, the “tail events” as defined below have to be identified so that they can be labeled as such · All sections needed, i.e. · “Please Report” section · “Remember” section: · one-split cross validation · k-fold cross validation (use k = 5) · top K Feature Importance for Random Forest and Gradient Boosting Trees · Bonus 1 · Bonus 2 · Bonus 3 ASSIGNMENT

qfile_636772176296629059_123086_1.docx

Ximi · Accepted Answer

{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 110,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "import pandas as pd
",
    "from sklearn.model_selection import train_test_split, cross_val_score, TimeSeriesSplit
",
    "from sklearn.tree import DecisionTreeClassifier
",
    "from sklearn.metrics import accuracy_score, classification_report
",
    "from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier, VotingClassifier
",
    "import numpy as np
",
    "import matplotlib.pyplot as plt
",
    "from sklearn.linear_model import LogisticRegression
",
    "from sklearn.naive_bayes import GaussianNB
",
    "from sklearn.neighbors import KNeighborsClassifier"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "#Reading CSV file
",
    "df = pd.read_csv('spx_tail.csv')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "(4319, 254)"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "#Shape of the data
",
    "df.shape"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "
",
       "
",
       "    .dataframe thead tr:only-child th {
",
       "        text-align: right;
",
       "    }
",
       "
",
       "    .dataframe thead th {
",
       "        text-align: left;
",
       "    }
",
       "
",
       "    .dataframe tbody tr th {
",
       "        vertical-align: top;
",
       "    }
",
       "
",
       "
",
       "  
",
       "    
",
       "      
",
       "      ticker
",
       "      lag_1
",
       "      lag_2
",
       "      lag_3
",
       "      lag_4
",
       "      lag_5
",
       "      lag_6
",
       "      lag_7
",
       "      lag_8
",
       "      lag_9
",
       "      ...
",
       "      lag_244
",
       "      lag_245
",
       "      lag_246
",
       "      lag_247
",
       "      lag_248
",
       "      lag_249
",
       "      lag_250
",
       "      lag_251
",
       "      lag_252
",
       "      T1
",
       "    
",
       "  
",
       "  
",
       "    
",
       "      0
",
       "      2001-01-02
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      -0.013043
",
       "      0.008038
",
       "      ...
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "      -0.039099
",
       "      0.000000
",
       "      False
",
       "    
",
       "    
",
       "      1
",
       "      2001-01-03
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      -0.013043
",
       "      ...
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "      -0.039099
",
       "      False
",
       "    
",
       "    
",
       "      2
",
       "      2001-01-04
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      ...
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "      False
",
       "    
",
       "    
",
       "      3
",
       "      2001-01-05
",
       "      -0.010608
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      ...
",
       "      0.000522
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      False
",
       "    
",
       "    
",
       "      4
",
       "      2001-01-08
",
       "      -0.026593
",
       "      -0.010608
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      ...
",
       "      -0.007121
",
       "      0.000522
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      False
",
       "    
",
       "  
",
       "
",
       "5 rows × 254 columns
",
       ""
      ],
      "text/plain": [
       "       ticker     lag_1     lag_2     lag_3     lag_4     lag_5     lag_6  \
",
       "0  2001-01-02 -0.010503  0.003980  0.010385  0.007035  0.024110  0.007970   
",
       "1  2001-01-03 -0.028432 -0.010503  0.003980  0.010385  0.007035  0.024110   
",
       "2  2001-01-04  0.048884 -0.028432 -0.010503  0.003980  0.010385  0.007035   
",
       "3  2001-01-05 -0.010608  0.048884 -0.028432 -0.010503  0.003980  0.010385   
",
       "4  2001-01-08 -0.026593 -0.010608  0.048884 -0.028432 -0.010503  0.003980   
",
       "
",
       "      lag_7     lag_8     lag_9  ...     lag_244   lag_245   lag_246  \
",
       "0 -0.031796 -0.013043  0.008038  ...    0.012096 -0.004396 -0.013149   
",
       "1  0.007970 -0.031796 -0.013043  ...    0.010615  0.012096 -0.004396   
",
       "2  0.024110  0.007970 -0.031796  ...   -0.006856  0.010615  0.012096   
",
       "3  0.007035  0.024110  0.007970  ...    0.000522 -0.006856  0.010615   
",
       "4  0.010385  0.007035  0.024110  ...   -0.007121  0.000522 -0.006856   
",
       "
",
       "    lag_247   lag_248   lag_249   lag_250   lag_251   lag_252     T1  
",
       "0  0.011128  0.026730  0.000955  0.001920 -0.039099  0.000000  False  
",
       "1 -0.013149  0.011128  0.026730  0.000955  0.001920 -0.039099  False  
",
       "2 -0.004396 -0.013149  0.011128  0.026730  0.000955  0.001920  False  
",
       "3  0.012096 -0.004396 -0.013149  0.011128  0.026730  0.000955  False  
",
       "4  0.010615  0.012096 -0.004396 -0.013149  0.011128  0.026730  False  
",
       "
",
       "[5 rows x 254 columns]"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "#A glance at the data
",
    "df.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": [
    "#Separating input data and output variable
",
    "X = df.iloc[:, 1:-1]
",
    "y = df.iloc[:, -1]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "
",
       "
",
       "    .dataframe thead tr:only-child th {
",
       "        text-align: right;
",
       "    }
",
       "
",
       "    .dataframe thead th {
",
       "        text-align: left;
",
       "    }
",
       "
",
       "    .dataframe tbody tr th {
",
       "        vertical-align: top;
",
       "    }
",
       "
",
       "
",
       "  
",
       "    
",
       "      
",
       "      lag_1
",
       "      lag_2
",
       "      lag_3
",
       "      lag_4
",
       "      lag_5
",
       "      lag_6
",
       "      lag_7
",
       "      lag_8
",
       "      lag_9
",
       "      lag_10
",
       "      ...
",
       "      lag_243
",
       "      lag_244
",
       "      lag_245
",
       "      lag_246
",
       "      lag_247
",
       "      lag_248
",
       "      lag_249
",
       "      lag_250
",
       "      lag_251
",
       "      lag_252
",
       "    
",
       "  
",
       "  
",
       "    
",
       "      0
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      -0.013043
",
       "      0.008038
",
       "      -0.021696
",
       "      ...
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "      -0.039099
",
       "      0.000000
",
       "    
",
       "    
",
       "      1
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      -0.013043
",
       "      0.008038
",
       "      ...
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "      -0.039099
",
       "    
",
       "    
",
       "      2
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      -0.013043
",
       "      ...
",
       "      0.000522
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "      0.001920
",
       "    
",
       "    
",
       "      3
",
       "      -0.010608
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      -0.031796
",
       "      ...
",
       "      -0.007121
",
       "      0.000522
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "      0.000955
",
       "    
",
       "    
",
       "      4
",
       "      -0.026593
",
       "      -0.010608
",
       "      0.048884
",
       "      -0.028432
",
       "      -0.010503
",
       "      0.003980
",
       "      0.010385
",
       "      0.007035
",
       "      0.024110
",
       "      0.007970
",
       "      ...
",
       "      -0.002917
",
       "      -0.007121
",
       "      0.000522
",
       "      -0.006856
",
       "      0.010615
",
       "      0.012096
",
       "      -0.004396
",
       "      -0.013149
",
       "      0.011128
",
       "      0.026730
",
       "    
",
       "  
",
       "
",
       "5 rows × 252 columns
",
       ""
      ],
      "text/plain": [
       "      lag_1     lag_2     lag_3     lag_4     lag_5     lag_6     lag_7  \
",
       "0 -0.010503  0.003980  0.010385  0.007035  0.024110  0.007970 -0.031796   
",
       "1 -0.028432 -0.010503  0.003980  0.010385  0.007035  0.024110  0.007970   
",
       "2  0.048884 -0.028432 -0.010503  0.003980  0.010385  0.007035  0.024110   
",
       "3 -0.010608  0.048884 -0.028432 -0.010503  0.003980  0.010385  0.007035   
",
       "4 -0.026593 -0.010608  0.048884 -0.028432 -0.010503  0.003980  0.010385   
",
       "
",
       "      lag_8     lag_9    lag_10    ...      lag_243   lag_244   lag_245  \
",
       "0 -0.013043  0.008038 -0.021696    ...     0.010615  0.012096 -0.004396   
",
       "1 -0.031796 -0.013043  0.008038    ...    -0.006856  0.010615  0.012096   
",
       "2  0.007970 -0.031796 -0.013043    ...     0.000522 -0.006856  0.010615   
",
       "3  0.024110  0.007970 -0.031796    ...    -0.007121  0.000522 -0.006856   
",
       "4  0.007035  0.024110  0.007970    ...    -0.002917 -0.007121  0.000522   
",
       "
",
       "    lag_246   lag_247   lag_248   lag_249   lag_250   lag_251   lag_252  
",
       "0 -0.013149  0.011128  0.026730  0.000955  0.001920 -0.039099  0.000000  
",
       "1 -0.004396 -0.013149  0.011128  0.026730  0.000955  0.001920 -0.039099  
",
       "2  0.012096 -0.004396 -0.013149  0.011128  0.026730  0.000955  0.001920  
",
       "3  0.010615  0.012096 -0.004396 -0.013149  0.011128  0.026730  0.000955  
",
       "4 -0.006856  0.010615  0.012096 -0.004396 -0.013149  0.011128  0.026730  
",
       "
",
       "[5 rows x 252 columns]"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "#Input data
",
    "X.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0    False
",
       "1    False
",
       "2    False
",
       "3    False
",
       "4    False
",
       "Name: T1, dtype: bool"
      ]
     },
     "execution_count": 9,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "#Output data
",
    "y.head()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "#Train test split or single fold split
",
    "train_x, test_x, train_y, test_y = train_test_split(X, y, test_size=0.2)
"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Decision Trees
",
    "I. Implementing decision trees with different depths and impurity functions."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 58,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Depth: 2 
",
      "Entropy function: gini
",
      "Accuracy Score: 89.814815
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.95       776
",
      "       True       0.50      0.01      0.02        88
",
      "
",
      "avg / total       0.86      0.90      0.85       864
",
      "
",
      "Depth: 2 
",
      "Entropy function: entropy
",
      "Accuracy Score: 89.814815
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.95       776
",
      "       True       0.00      0.00      0.00        88
",
      "
",
      "avg / total       0.81      0.90      0.85       864
",
      "
",
      "Depth: 5 
",
      "Entropy function: gini
",
      "Accuracy Score: 89.004630
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.99      0.94       776
",
      "       True       0.11      0.01      0.02        88
",
      "
",
      "avg / total       0.82      0.89      0.85       864
",
      "
",
      "Depth: 5 
",
      "Entropy function: entropy
",
      "Accuracy Score: 89.583333
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.94       776
",
      "       True       0.25      0.01      0.02        88
",
      "
",
      "avg / total       0.83      0.90      0.85       864
",
      "
",
      "Depth: 10 
",
      "Entropy function: gini
",
      "Accuracy Score: 87.037037
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.97      0.93       776
",
      "       True       0.07      0.02      0.03        88
",
      "
",
      "avg / total       0.81      0.87      0.84       864
",
      "
",
      "Depth: 10 
",
      "Entropy function: entropy
",
      "Accuracy Score: 85.879630
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.95      0.92       776
",
      "       True       0.13      0.07      0.09        88
",
      "
",
      "avg / total       0.82      0.86      0.84       864
",
      "
",
      "Depth: 15 
",
      "Entropy function: gini
",
      "Accuracy Score: 84.722222
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.94      0.92       776
",
      "       True       0.08      0.05      0.06        88
",
      "
",
      "avg / total       0.81      0.85      0.83       864
",
      "
",
      "Depth: 15 
",
      "Entropy function: entropy
",
      "Accuracy Score: 83.912037
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.92      0.91       776
",
      "       True       0.13      0.10      0.11        88
",
      "
",
      "avg / total       0.82      0.84      0.83       864
",
      "
",
      "Depth: 20 
",
      "Entropy function: gini
",
      "Accuracy Score: 83.912037
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.89      0.93      0.91       776
",
      "       True       0.05      0.03      0.04        88
",
      "
",
      "avg / total       0.81      0.84      0.82       864
",
      "
",
      "Depth: 20 
",
      "Entropy function: entropy
",
      "Accuracy Score: 81.944444
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.90      0.90       776
",
      "       True       0.14      0.15      0.14        88
",
      "
",
      "avg / total       0.82      0.82      0.82       864
",
      "
",
      "Depth: 50 
",
      "Entropy function: gini
",
      "Accuracy Score: 78.472222
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.89      0.86      0.88       776
",
      "       True       0.07      0.09      0.08        88
",
      "
",
      "avg / total       0.81      0.78      0.80       864
",
      "
",
      "Depth: 50 
",
      "Entropy function: entropy
",
      "Accuracy Score: 81.481481
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.89      0.90       776
",
      "       True       0.12      0.12      0.12        88
",
      "
",
      "avg / total       0.82      0.81      0.82       864
",
      "
"
     ]
    }
   ],
   "source": [
    "depths = [2, 5, 10, 15, 20, 50]
",
    "criterion = ['gini', 'entropy']
",
    "for depth in depths:
",
    "    for en_func in criterion:
",
    "        print ("Depth: %d \nEntropy function: %s"%(depth, en_func))
",
    "        clf = DecisionTreeClassifier(criterion=en_func, max_depth=depth)
",
    "        clf.fit(train_x, train_y)
",
    "
",
    "        #Accuracy Score
",
    "        print ("Accuracy Score: %f"%(accuracy_score(test_y, clf.predict(test_x))*100))
",
    "
",
    "        #Classification report
",
    "        print ("Classification Report: ")
",
    "        print(classification_report(test_y, clf.predict(test_x)))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "The decision tree performs best at max_depth = 2 with the gini impurity function: it predicts the True class with 50% precision, which is better than the other settings, although recall for the True class is only 0.01."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Accuracy: 0.90 (+/- 0.01)
"
     ]
    }
   ],
   "source": [
    "#Cross validating with k = 5 with optimal parameters
",
    "clf = DecisionTreeClassifier(criterion='gini', max_depth=2)
",
    "scores = cross_val_score(clf, X, y, cv=5)
",
    "print("Accuracy: %0.2f (+/- %0.2f)" % (scores.mean(), scores.std() * 2))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "#### Bonus 1"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
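    "Note that class_weight={True: 0.5, False: 0.5} assigns equal weights to both classes, which is not the same as balanced class weights (class_weight='balanced'). With these equal weights the True-class precision stays at 0.50 (recall 0.01), identical to the unweighted depth-2 gini tree, so no improvement in predicting the True class is observed."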
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 69,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Accuracy: 0.90 (+/- 0.00)
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.95       776
",
      "       True       0.50      0.01      0.02        88
",
      "
",
      "avg / total       0.86      0.90      0.85       864
",
      "
"
     ]
    }
   ],
   "source": [
    "#Tuning class_weights on optimal parameters to check performance
",
    "clf = DecisionTreeClassifier(criterion='gini', max_depth=2, class_weight={True:0.5, False:0.5})
",
    "
",
    "scores = cross_val_score(clf, X, y, cv=5)
",
    "print("Accuracy: %0.2f (+/- %0.2f)" % (scores.mean(), scores.std() * 2))
",
    "
",
    "clf.fit(train_x, train_y)
",
    "
",
    "#Classification report
",
    "print ("Classification Report: ")
",
    "print(classification_report(test_y, clf.predict(test_x)))"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Random Forest
",
    "II. Implementing random forest with different numbers of trees and features, and with/without bootstrap.
"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "Max features: auto 
",
      "Bootstrap: True 
",
      "No. of Trees: 10
",
      "Accuracy Score: 89.236111
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      0.99      0.94       776
",
      "       True       0.14      0.01      0.02        88
",
      "
",
      "avg / total       0.82      0.89      0.85       864
",
      "
",
      "Max features: auto 
",
      "Bootstrap: True 
",
      "No. of Trees: 60
",
      "Accuracy Score: 89.699074
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.95       776
",
      "       True       0.00      0.00      0.00        88
",
      "
",
      "avg / total       0.81      0.90      0.85       864
",
      "
",
      "Max features: auto 
",
      "Bootstrap: True 
",
      "No. of Trees: 100
",
      "Accuracy Score: 89.814815
",
      "Classification Report: 
",
      "             precision    recall  f1-score   support
",
      "
",
      "      False       0.90      1.00      0.95       776
",
      "       True       0.00      0.00      0.00        88
",
      "
",
      "avg / total       0.81      0.90      0.85       864
",
      "
",
      "Max features: auto 
",
      "Bootstrap: False 
",
      "No. of Trees: 10
",
      "Accuracy Score: 89.583333
",
      "Classification Report: 
",

INSTRUCTIONS · Use of the following CLASSIFICATION Machine Learning Models · Decision Trees · Random Forest · Gradient Boosting Trees · First, given dataset “spx_tail”, the “tail events” as defined...

Answer To: INSTRUCTIONS · Use of the following CLASSIFICATION Machine Learning Models · Decision Trees · Random...

Answer To This Question Is Available To Download

Related Questions & Answers

Submit New Assignment

	ticker	lag_1	lag_2	lag_3	lag_4	lag_5	lag_6	lag_7	lag_8	lag_9	...	lag_244	lag_245	lag_246	lag_247	lag_248	lag_249	lag_250	lag_251	lag_252	T1
0	2001-01-02	-0.010503	0.003980	0.010385	0.007035	0.024110	0.007970	-0.031796	-0.013043	0.008038	...	0.012096	-0.004396	-0.013149	0.011128	0.026730	0.000955	0.001920	-0.039099	0.000000	False
1	2001-01-03	-0.028432	-0.010503	0.003980	0.010385	0.007035	0.024110	0.007970	-0.031796	-0.013043	...	0.010615	0.012096	-0.004396	-0.013149	0.011128	0.026730	0.000955	0.001920	-0.039099	False
2	2001-01-04	0.048884	-0.028432	-0.010503	0.003980	0.010385	0.007035	0.024110	0.007970	-0.031796	...	-0.006856	0.010615	0.012096	-0.004396	-0.013149	0.011128	0.026730	0.000955	0.001920	False
3	2001-01-05	-0.010608	0.048884	-0.028432	-0.010503	0.003980	0.010385	0.007035	0.024110	0.007970	...	0.000522	-0.006856	0.010615	0.012096	-0.004396	-0.013149	0.011128	0.026730	0.000955	False
4	2001-01-08	-0.026593	-0.010608	0.048884	-0.028432	-0.010503	0.003980	0.010385	0.007035	0.024110	...	-0.007121	0.000522	-0.006856	0.010615	0.012096	-0.004396	-0.013149	0.011128	0.026730	False