Professional Documents
Culture Documents
Better Data Science - Hyperparameter Tuning With GridSearch
Better Data Science - Hyperparameter Tuning With GridSearch
Better Data Science - Hyperparameter Tuning With GridSearch
GridSearch
● Library imports
● You'll use the Iris dataset for training and tuning
In [1]:
import pandas as pd
from sklearn.tree import DecisionTreeClassifier
from sklearn.model_selection import train_test_split, GridSearchCV
from sklearn.metrics import accuracy_score, confusion_matrix
# Load the Iris dataset (CSV) from a public GitHub gist into a DataFrame.
# The URL is written as two adjacent string literals, which Python joins into
# a single string; a raw line break inside the quotes is a syntax error.
iris = pd.read_csv(
    'https://gist.githubusercontent.com/curran/a08a1080b88344b0c8a7/raw/'
    '0e7a9b0a5d22642a06d3d5b9bcbad9890c8ee534/iris.csv'
)
# Preview the first rows to sanity-check the load.
iris.head()
Baseline model
# Three independent decision trees, one per hand-picked parameter set.
# `fit` returns the estimator itself, so each name is bound to a trained model.
model_1, model_2, model_3 = (
    DecisionTreeClassifier(**param_set).fit(X_train, y_train)
    for param_set in (params_1, params_2, params_3)
)
# Grid search over `params` for `model`:
#   cv=10     -> 10-fold cross validation
#   n_jobs=-1 -> run in parallel
clf = GridSearchCV(model, params, cv=10, n_jobs=-1)
clf.fit(X_train, y_train)