使用GridSearchCV时出错，但不使用GridSearchCV Python 3.6.7时出错

from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor from sklearn.neural_network import MLPRegressor from sklearn.model_selection import train_test_split from sklearn.neural_network import MLPRegressor from sklearn import preprocessing import pandas as pd import numpy as np def str_to_num(arr): le = preprocessing.LabelEncoder() new_arr = le.fit_transform(arr) return new_arr def compare_values(arr1, arr2): thediff = 0 thediffs = [] for thing1, thing2 in zip(arr1, arr2): thediff = abs(thing1 - thing2) thediffs.append(thediff) return thediffs def print_to_file(filepath, arr): with open(filepath, 'w') as f: for item in arr: f.write("%s\n" % item) data = pd.read_csv('data2.csv') # create the labels, or field we are trying to estimate label = data['TOTAL'] # remove the header label = label[1:] # create the data, or the data that is to be estimated data = data.drop('TOTAL', axis=1) data = data.drop('SERIALNUM', axis=1) # remove the header data = data[1:] # # split into training and testing sets X_train, X_test, y_train, y_test = train_test_split(data, label, test_size = 0.2) mlp = MLPRegressor(activation = 'relu', solver = 'lbfgs', verbose=False) mlp.fit(X_train, y_train) mlp_predictions = mlp.predict(X_test) mlp_differences = compare_values(y_test, mlp_predictions) mlp_Avg = np.average(mlp_differences) print(mlp_Avg)

from sklearn.neural_network import MLPRegressor from sklearn.model_selection import train_test_split, GridSearchCV from sklearn.neural_network import MLPRegressor from sklearn import preprocessing import pandas as pd import numpy as np def str_to_num(arr): le = preprocessing.LabelEncoder() new_arr = le.fit_transform(arr) return new_arr def compare_values(arr1, arr2): thediff = 0 thediffs = [] for thing1, thing2 in zip(arr1, arr2): thediff = abs(thing1 - thing2) thediffs.append(thediff) return thediffs def print_to_file(filepath, arr): with open(filepath, 'w') as f: for item in arr: f.write("%s\n" % item) data = pd.read_csv('data2.csv') # create the labels, or field we are trying to estimate label = data['TOTAL_DAYS_TO_COMPLETE'] # remove the header label = label[1:] # create the data, or the data that is to be estimated data = data.drop('TOTAL_DAYS_TO_COMPLETE', axis=1) data = data.drop('SERIALNUM', axis=1) # remove the header data = data[1:] # # split into training and testing sets X_train, X_test, y_train, y_test = train_test_split(data, label, test_size = 0.2) param_grid = { #'hidden_layer_sizes': [(1,),(2,),(3,),(10,),(15,),(20,),(25,)], 'activation': ['identity', 'logistic', 'relu'], #'activation': ['relu'], 'solver': ['lbfgs', 'sgd', 'adam'], #'solver': ['adam'] #'alpha': [0.0001, 0.0005, 0.0009], #'learning_rate': ['constant', 'invscaling', 'adaptive'], #'learning_rate_init': [0.001, 0.01, 0.99], #'warm_start': [True, False] #'momentum': [0.1, 0.9, 0.99] # Did not solver-specifics...yet }# Create a based model mlp = MLPRegressor()# Instantiate the grid search model grid_search = GridSearchCV(estimator = mlp, param_grid = param_grid, cv = 3, n_jobs = -1, verbose = 2) grid_search.fit(X_train, y_train) print() print(grid_search.best_params_) print(grid_search.best_score_) print() print("Grid scores on development set: ") print() answers = grid_search.predict(X_test) results = compare_values(answers, y_test) print("Accuracy: ", np.average(results)) print()

1条回答

网友

1楼 · 发布于 2024-05-13 02:54:55

问题与这一行有关：

'solver': ['lbfgs', 'sgd', 'adam'],

sgd选项需要在每个the documentation的某个阈值中使用某些参数

简单的改变 'solver': ['lbfgs', 'sgd', 'adam'],

至

'solver': ['lbfgs', 'adam'],

解决了这个问题

相关问题更多 >

编程相关推荐

热门问题

热门文章