@sandys
Created August 18, 2019 16:26
GridSearchCV with k-fold cross-validation and early stopping
import xgboost.sklearn as xgb
from sklearn.model_selection import GridSearchCV, StratifiedKFold
from sklearn.metrics import r2_score

cv = 2

trainX = [[1], [2], [3], [4], [5]]
trainY = [1, 2, 1, 2, 1]

# these are the evaluation sets (here simply the training data)
testX = trainX
testY = trainY

paramGrid = {"subsample": [0.5, 0.8]}

# forwarded to XGBRegressor.fit(); this is xgboost's pre-2.0 sklearn API,
# where early_stopping_rounds and eval_metric are fit() arguments
fit_params = {"early_stopping_rounds": 42,
              "eval_metric": "mae",
              "eval_set": [[testX, testY]]}

model = xgb.XGBRegressor()

# stratified k-fold splitter used as the CV iterator for the grid search
skf = StratifiedKFold(n_splits=cv, shuffle=True, random_state=999)
gridsearch = GridSearchCV(model, paramGrid, verbose=1,
                          cv=skf.split(trainX, trainY))

g = gridsearch.fit(trainX, trainY, **fit_params)

y_true, y_pred = testY, gridsearch.predict(testX)
print(r2_score(y_true, y_pred))
print(g.cv_results_)
@Jason2Brownlee

This would be biased, since early stopping is performed on the same test set that is used for evaluation. The correct approach is to split each training fold into a train and a validation part and use the validation part for early stopping. This cannot be achieved with GridSearchCV alone; instead, the grid search must be performed manually, for example: https://xgboosting.com/xgboost-early-stopping-with-grid-search/
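A minimal sketch of that manual approach, assuming the same toy data as in the gist and xgboost's older sklearn API where early_stopping_rounds is a fit() argument (newer xgboost releases take it in the constructor); the inner train_test_split and the bookkeeping names are illustrative, not taken from the linked page:

import numpy as np
from xgboost.sklearn import XGBRegressor
from sklearn.model_selection import KFold, ParameterGrid, train_test_split
from sklearn.metrics import mean_absolute_error

X = np.array([[1], [2], [3], [4], [5]], dtype=float)
y = np.array([1, 2, 1, 2, 1], dtype=float)

paramGrid = {"subsample": [0.5, 0.8]}
outer_cv = KFold(n_splits=2, shuffle=True, random_state=999)

results = {}
for params in ParameterGrid(paramGrid):
    fold_scores = []
    for train_idx, test_idx in outer_cv.split(X):
        # carve a validation set out of the training fold only;
        # the held-out test fold is never seen by early stopping
        X_tr, X_val, y_tr, y_val = train_test_split(
            X[train_idx], y[train_idx], test_size=0.33, random_state=999)
        model = XGBRegressor(**params)
        model.fit(X_tr, y_tr,
                  eval_set=[(X_val, y_val)],
                  eval_metric="mae",
                  early_stopping_rounds=42,
                  verbose=False)
        # score on the untouched test fold
        fold_scores.append(
            mean_absolute_error(y[test_idx], model.predict(X[test_idx])))
    results[tuple(sorted(params.items()))] = np.mean(fold_scores)

best = min(results, key=results.get)
print("best params:", dict(best), "mean MAE:", results[best])

The key difference from the gist above is that eval_set comes from inside each training fold, so the fold used to score each parameter combination never influences when training stops.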
