| Download
A series of classifiers for predicting tumors from CDC NHANES data
Project: CS205-Opportunistic
Path: tumor_classifier.ipynb
Views: 508Kernel: Python 3 (Anaconda 5)
In [1]:
In [2]:
In [3]:
<module 'nhanes' from '/home/user/nhanes.py'>
In [3]:
In [4]:
In [5]:
In [7]:
(49454,)
In [324]:
Feature Importance by Random Forest
In [7]:
In [8]:
In [11]:
Text(0.5, 1.0, 'Sorted Feature Importances by Random Forest')
In [12]:
Index(['BMXBMI', 'BMXWAIST', 'BPXSY1', 'BPXDI1', 'RIDAGEYR', 'SLD010H',
'INDHHINC', 'SXQ272#2.0', 'RIDRETH1#3.0', 'DMDEDUC2#4.0',
'DMDEDUC2#3.0', 'DMDEDUC2#5.0', 'DMDEDUC2#2.0', 'RHQ131#1.0', 'RHD180',
'PAQ605#2.0', 'BPQ057#2.0', 'BPQ020#1.0', 'DMDEDUC2#1.0', 'SMD650#1.0',
'DIQ170#2.0', 'BPQ020#2.0', 'RIAGENDR#1.0', 'RIAGENDR#2.0', 'ALQ141Q',
'URXUCL#2.0', 'ALQ151#2.0', 'DIQ160#2.0', 'SMQ020#1.0', 'SMQ020#2.0',
'DIQ010#2.0', 'LBXTC', 'PAQ610', 'DIQ170#1.0', 'BPQ057#1.0',
'DIQ010#1.0', 'ARQ125C#2.0', 'MCQ160J#2.0', 'RIDRETH3#3.0',
'RIDRETH1#1.0', 'MCQ160J#1.0', 'PAQ605#1.0', 'MCQ200#2.0', 'DIQ160#1.0',
'RIDRETH1#4.0', 'RHQ131#2.0', 'SMD470#0.0', 'HEQ030#2.0', 'HEQ010#2.0',
'ALQ151#1.0', 'ALQ120Q', 'LBXHP1#0.0', 'RIDRETH1#2.0', 'MCQ200#1.0',
'LBXHP1#1.0', 'RIDRETH1#5.0', 'SXQ753#2.0', 'LBXHIVC#2.0', 'SMD650#0.0',
'RIDRETH3#4.0', 'SMD470#1.0', 'SXQ753#1.0', 'SMD480#1.0',
'RIDRETH3#2.0', 'RIDRETH3#6.0', 'RIDRETH3#7.0', 'RIDRETH3#1.0',
'SMD480#0.0', 'HEQ010#1.0', 'HEQ030#1.0', 'ARQ125C#1.0', 'SXQ272#1.0',
'LBXHIVC#1.0', 'DMDEDUC2#9.0', 'DMDEDUC2#7.0', 'URXUCL#1.0', 'ALQ160',
'SSEBV#1.0', 'SSEBV#2.0', 'PAQ560', 'PAQ677'],
dtype='object')
Mutual Information
In [7]:
In [114]:
Index(['SXQ272#2.0', 'RIDAGEYR', 'RIDRETH1#3.0', 'URXUCL#2.0', 'BPQ020#2.0',
'DIQ010#2.0', 'BPQ020#1.0', 'RHD180', 'ALQ141Q', 'RIDRETH1#1.0',
'SMQ020#1.0', 'BPXSY1', 'SMQ020#2.0', 'DIQ170#2.0', 'RIAGENDR#1.0',
'DIQ160#2.0', 'RIDRETH3#6.0', 'RIDRETH1#4.0', 'HEQ010#2.0',
'PAQ605#2.0', 'RHQ131#1.0', 'RIDRETH3#1.0', 'RIDRETH1#5.0',
'BPQ057#2.0', 'ALQ151#2.0', 'SLD010H', 'SMD650#1.0', 'BPXDI1',
'DMDEDUC2#2.0', 'LBXHP1#1.0', 'SXQ753#2.0', 'DIQ010#1.0', 'ARQ125C#1.0',
'MCQ200#1.0', 'SXQ753#1.0', 'DMDEDUC2#9.0', 'MCQ200#2.0', 'LBXHIVC#2.0',
'INDHHINC', 'DIQ170#1.0', 'ALQ151#1.0', 'RIDRETH3#3.0', 'DMDEDUC2#1.0',
'DMDEDUC2#5.0', 'SMD650#0.0', 'RIAGENDR#2.0', 'HEQ030#2.0',
'LBXHIVC#1.0', 'DMDEDUC2#4.0', 'LBXTC', 'DMDEDUC2#3.0', 'RIDRETH1#2.0',
'SMD480#1.0', 'PAQ605#1.0', 'ALQ120Q', 'PAQ610', 'ALQ160', 'SXQ272#1.0',
'BMXWAIST', 'SMD470#1.0', 'HEQ030#1.0', 'RIDRETH3#4.0', 'RIDRETH3#2.0',
'URXUCL#1.0', 'PAQ677', 'DMDEDUC2#7.0', 'PAQ560', 'HEQ010#1.0',
'BPQ057#1.0', 'MCQ160J#2.0', 'MCQ160J#1.0', 'RIDRETH3#7.0', 'BMXBMI',
'SSEBV#1.0', 'SSEBV#2.0', 'DIQ160#1.0', 'RHQ131#2.0', 'LBXHP1#0.0',
'ARQ125C#2.0', 'SMD480#0.0', 'SMD470#0.0'],
dtype='object')
In [210]:
array([2.06626772e-02, 1.89693913e-02, 1.38144986e-02, 1.32518869e-02,
1.28380246e-02, 1.07593222e-02, 9.27515420e-03, 8.03260258e-03,
7.36387332e-03, 7.23458529e-03, 6.46033268e-03, 5.87808657e-03,
4.81656519e-03, 4.48231657e-03, 4.34064741e-03, 2.95228857e-03,
2.83435668e-03, 2.79594060e-03, 2.63464534e-03, 2.57905674e-03,
2.34468943e-03, 2.19680156e-03, 2.18873058e-03, 2.18448058e-03,
2.17391712e-03, 2.11242237e-03, 1.90903123e-03, 1.89141768e-03,
1.86682013e-03, 1.80251723e-03, 1.59737350e-03, 1.57684555e-03,
1.43096499e-03, 1.40136210e-03, 1.34907328e-03, 1.27214477e-03,
1.18691828e-03, 1.15240635e-03, 1.13675840e-03, 1.09340922e-03,
1.08565166e-03, 1.06212281e-03, 1.05321770e-03, 7.71489952e-04,
7.31147870e-04, 7.08363914e-04, 6.73932548e-04, 6.06556095e-04,
4.62942093e-04, 4.51162952e-04, 4.48805360e-04, 4.37280892e-04,
3.39414191e-04, 3.11952234e-04, 1.96938758e-04, 1.96684621e-04,
1.10698902e-04, 4.77270690e-05, 1.84312855e-05, 0.00000000e+00,
0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00, 0.00000000e+00, 0.00000000e+00, 0.00000000e+00,
0.00000000e+00])
In [192]:
In [67]:
In [101]:
In [69]:
(49454, 81)
In [8]:
(49454, 40)
In [58]:
In [59]:
In [10]:
In [11]:
(49454, 37)
In [12]:
In [13]:
(49454, 37)
Classification
GridSearchCV with oversampling
In [117]:
ROC Curve
In [15]:
In [479]:
Logistic Regression
In [159]:
Performing grid search
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
/ext/anaconda5/lib/python3.6/site-packages/sklearn/linear_model/sag.py:334: ConvergenceWarning: The max_iter was reached which means the coef_ did not converge
"the coef_ did not converge", ConvergenceWarning)
Grid search complete
Performance Metrics for <class 'sklearn.linear_model.logistic.LogisticRegression'>
Performance Metrics for Train Set
0
accuracy 0.706412
precision 0.199392
recall 0.724170
f1 0.312670
roc_auc 0.777454
Performance Metrics for Test Set
Accuracy for test set is 0.71755
No Cancer Cancer
precision 0.959916 0.212102
recall 0.717576 0.717300
f1 0.821241 0.327395
AUC: 0.775
836.1863660812378
In [143]:
{'class__C': 0.1,
'class__max_iter': 1000,
'class__penalty': 'l1',
'class__solver': 'saga'}
In [152]:
Fitting 10 folds for each of 1 candidates, totalling 10 fits
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.4s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 3.5s remaining: 0.0s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.6s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.5s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 4.2s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 4.0s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 4.0s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.6s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.4s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.9s
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga
[CV] class__C=0.1, class__max_iter=1000, class__penalty=l1, class__solver=saga, total= 3.6s
[Parallel(n_jobs=1)]: Done 10 out of 10 | elapsed: 38.1s finished
Performance Metrics for <class 'sklearn.linear_model.logistic.LogisticRegression'>
Performance Metrics for Train Set
0
accuracy 0.710543
precision 0.201916
recall 0.720432
f1 0.315426
roc_auc 0.780470
Performance Metrics for Validation Set
0
accuracy 0.709552
precision 0.200600
recall 0.715999
f1 0.313368
roc_auc 0.777986
Performance Metrics for Test Set
Accuracy for test set is 0.705894
No Cancer Cancer
precision 0.961644 0.199940
recall 0.703955 0.724891
f1 0.812866 0.313429
AUC: 0.777
Support Vector Machine
In [122]:
Fitting 3 folds for each of 12 candidates, totalling 36 fits
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True, total= 8.6s
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 10.9s remaining: 0.0s
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True, total= 8.1s
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=linear, class__probability=True, total= 9.2s
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True, total= 10.5s
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True, total= 10.7s
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=poly, class__probability=True, total= 10.9s
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 16.9s
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 16.1s
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.001, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 16.3s
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 7.2s
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 7.3s
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 7.1s
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 9.1s
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 9.6s
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 9.0s
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 12.0s
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 11.4s
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 11.8s
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 11.7s
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 10.5s
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=linear, class__probability=True, total= 11.6s
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 8.9s
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 8.2s
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=poly, class__probability=True, total= 7.8s
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 10.2s
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 9.5s
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=1, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 9.6s
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True, total= 31.0s
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True, total= 30.0s
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=linear, class__probability=True, total= 31.0s
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True, total= 7.7s
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True, total= 7.7s
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=poly, class__probability=True, total= 8.3s
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 8.0s
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 8.5s
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True
[CV] class__C=10, class__gamma=scale, class__kernel=rbf, class__probability=True, total= 9.0s
[Parallel(n_jobs=1)]: Done 36 out of 36 | elapsed: 8.5min finished
Performance Metrics for <class 'sklearn.svm.classes.SVC'>
Performance Metrics for Train Set
0
accuracy 0.703998
precision 0.196118
recall 0.759184
f1 0.311700
roc_auc 0.790152
Performance Metrics for Validation Set
0
accuracy 0.697000
precision 0.187646
recall 0.730828
f1 0.298596
roc_auc 0.761293
Performance Metrics for Test Set
Accuracy for test set is 0.688
No Cancer Cancer
precision 0.968750 0.188889
recall 0.679825 0.772727
f1 0.798969 0.303571
AUC: 0.794
In [126]:
Fitting 3 folds for each of 1 candidates, totalling 3 fits
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total=22.0min
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 25.1min remaining: 0.0s
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total=21.9min
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True
[CV] class__C=0.1, class__gamma=scale, class__kernel=linear, class__probability=True, total=19.9min
[Parallel(n_jobs=1)]: Done 3 out of 3 | elapsed: 73.0min finished
Performance Metrics for <class 'sklearn.svm.classes.SVC'>
Performance Metrics for Train Set
0
accuracy 0.705571
precision 0.199935
recall 0.726378
f1 0.313554
roc_auc 0.778485
Performance Metrics for Validation Set
0
accuracy 0.703814
precision 0.197022
recall 0.715182
f1 0.308931
roc_auc 0.773729
Performance Metrics for Test Set
Accuracy for test set is 0.705995
No Cancer Cancer
precision 0.961509 0.199819
recall 0.704178 0.723799
f1 0.812966 0.313179
AUC: 0.774
In [123]:
{'class__C': 10,
'class__gamma': 'scale',
'class__kernel': 'linear',
'class__probability': True}
Random Forest
In [208]:
Fitting 3 folds for each of 4 candidates, totalling 12 fits
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 1.6s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 2.0s remaining: 0.0s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 1.7s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 1.7s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.4s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.0s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 2.7s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.4s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.2s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.4s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.3s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.3s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 3.2s
[Parallel(n_jobs=1)]: Done 12 out of 12 | elapsed: 41.0s finished
Performance Metrics for <class 'sklearn.ensemble.forest.RandomForestClassifier'>
Performance Metrics for Train Set
0
accuracy 0.758624
precision 0.212405
recall 0.641574
f1 0.319137
roc_auc 0.785137
Performance Metrics for Validation Set
0
accuracy 0.751750
precision 0.200090
recall 0.600561
f1 0.299940
roc_auc 0.763822
Performance Metrics for Test Set
Accuracy for test set is 0.735
No Cancer Cancer
precision 0.958865 0.200000
recall 0.741228 0.670455
f1 0.836116 0.308094
AUC: 0.803
In [329]:
{'class__max_depth': 3,
'class__max_features': 20,
'class__min_samples_leaf': 4,
'class__min_samples_split': 5,
'class__n_estimators': 250}
In [209]:
Fitting 3 folds for each of 4 candidates, totalling 12 fits
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 20.6s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 24.2s remaining: 0.0s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 16.7s
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=3, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 17.9s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 28.3s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 31.2s
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=8, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 28.5s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 40.8s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 37.2s
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=13, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 38.8s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 44.3s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 42.7s
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250
[CV] class__max_depth=18, class__max_features=20, class__min_samples_leaf=4, class__min_samples_split=5, class__n_estimators=250, total= 40.9s
[Parallel(n_jobs=1)]: Done 12 out of 12 | elapsed: 7.6min finished
Performance Metrics for <class 'sklearn.ensemble.forest.RandomForestClassifier'>
Performance Metrics for Train Set
0
accuracy 0.781538
precision 0.228405
recall 0.571545
f1 0.326317
roc_auc 0.777107
Performance Metrics for Validation Set
0
accuracy 0.780780
precision 0.227499
recall 0.569906
f1 0.325037
roc_auc 0.774859
Performance Metrics for Test Set
Accuracy for test set is 0.790314
No Cancer Cancer
precision 0.944595 0.228169
recall 0.816825 0.530568
f1 0.876076 0.319107
AUC: 0.772
Multi-Layer Perceptron Classifier
In [97]:
Fitting 3 folds for each of 1 candidates, totalling 3 fits
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
/ext/anaconda5/lib/python3.6/site-packages/sklearn/neural_network/multilayer_perceptron.py:562: ConvergenceWarning: Stochastic Optimizer: Maximum iterations (200) reached and the optimization hasn't converged yet.
% self.max_iter, ConvergenceWarning)
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd, total= 2.7min
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 2.7min remaining: 0.0s
/ext/anaconda5/lib/python3.6/site-packages/sklearn/neural_network/multilayer_perceptron.py:562: ConvergenceWarning: Stochastic Optimizer: Maximum iterations (200) reached and the optimization hasn't converged yet.
% self.max_iter, ConvergenceWarning)
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd, total= 2.5min
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd
/ext/anaconda5/lib/python3.6/site-packages/sklearn/neural_network/multilayer_perceptron.py:562: ConvergenceWarning: Stochastic Optimizer: Maximum iterations (200) reached and the optimization hasn't converged yet.
% self.max_iter, ConvergenceWarning)
[CV] class__activation=tanh, class__alpha=0.05, class__hidden_layer_sizes=(100,), class__learning_rate=adaptive, class__solver=sgd, total= 2.6min
[Parallel(n_jobs=1)]: Done 3 out of 3 | elapsed: 7.9min finished
/ext/anaconda5/lib/python3.6/site-packages/sklearn/neural_network/multilayer_perceptron.py:562: ConvergenceWarning: Stochastic Optimizer: Maximum iterations (200) reached and the optimization hasn't converged yet.
% self.max_iter, ConvergenceWarning)
Performance Metrics for <class 'sklearn.neural_network.multilayer_perceptron.MLPClassifier'>
Performance Metrics for Train Set
0
accuracy 0.723365
precision 0.213979
recall 0.741417
f1 0.332105
roc_auc 0.803747
Performance Metrics for Validation Set
0
accuracy 0.718272
precision 0.205144
recall 0.708445
f1 0.318150
roc_auc 0.784694
Performance Metrics for Test Set
Accuracy for test set is 0.732181
No Cancer Cancer
precision 0.961796 0.212990
recall 0.734276 0.711454
f1 0.832776 0.327836
AUC: 0.801
In [380]:
{'class__activation': 'tanh',
'class__alpha': 0.05,
'class__hidden_layer_sizes': (100,),
'class__learning_rate': 'adaptive',
'class__solver': 'sgd'}
K Nearest Neighbors
In [342]:
Fitting 3 folds for each of 6 candidates, totalling 18 fits
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform, total= 2.2s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 6.9s remaining: 0.0s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform, total= 2.0s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=uniform, total= 2.2s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance, total= 2.0s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance, total= 2.0s
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance
[CV] class__metric=euclidean, class__n_neighbors=23, class__weights=distance, total= 2.0s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform, total= 2.8s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform, total= 3.1s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=uniform, total= 2.8s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance, total= 3.3s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance, total= 2.7s
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance
[CV] class__metric=manhattan, class__n_neighbors=23, class__weights=distance, total= 3.6s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform, total= 2.1s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform, total= 2.2s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=uniform, total= 2.1s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance, total= 2.2s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance, total= 1.9s
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance
[CV] class__metric=minkowski, class__n_neighbors=23, class__weights=distance, total= 2.3s
[Parallel(n_jobs=1)]: Done 18 out of 18 | elapsed: 2.2min finished
Performance Metrics for <class 'sklearn.neighbors.classification.KNeighborsClassifier'>
Performance Metrics for Train Set
0
accuracy 0.605252
precision 0.177150
recall 0.950427
f1 0.298568
roc_auc 0.885837
Performance Metrics for Validation Set
0
accuracy 0.568250
precision 0.138169
recall 0.742253
f1 0.232951
roc_auc 0.710040
Performance Metrics for Test Set
Accuracy for test set is 0.58
No Cancer Cancer
precision 0.976744 0.157025
recall 0.552632 0.863636
f1 0.705882 0.265734
AUC: 0.753
In [167]:
{'class__n_neighbors': 23}
In [165]:
Fitting 3 folds for each of 1 candidates, totalling 3 fits
[CV] class__n_neighbors=23 ...........................................
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] ............................ class__n_neighbors=23, total= 2.9min
[CV] class__n_neighbors=23 ...........................................
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 8.4min remaining: 0.0s
[CV] ............................ class__n_neighbors=23, total= 3.7min
[CV] class__n_neighbors=23 ...........................................
[CV] ............................ class__n_neighbors=23, total= 2.9min
[Parallel(n_jobs=1)]: Done 3 out of 3 | elapsed: 27.9min finished
Performance Metrics for <class 'sklearn.neighbors.classification.KNeighborsClassifier'>
Performance Metrics for Train Set
0
accuracy 0.664270
precision 0.208743
recall 0.941289
f1 0.341703
roc_auc 0.900885
Performance Metrics for Validation Set
0
accuracy 0.629553
precision 0.167908
recall 0.758875
f1 0.274972
roc_auc 0.744637
Performance Metrics for Test Set
Accuracy for test set is 0.636336
No Cancer Cancer
precision 0.960919 0.169583
recall 0.624624 0.751092
f1 0.757107 0.276694
AUC: 0.746
In [442]:
Fitting 3 folds for each of 1 candidates, totalling 3 fits
[CV] class__n_neighbors=33 ...........................................
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] ............................ class__n_neighbors=33, total= 3.2min
[CV] class__n_neighbors=33 ...........................................
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 9.3min remaining: 0.0s
[CV] ............................ class__n_neighbors=33, total= 3.1min
[CV] class__n_neighbors=33 ...........................................
[CV] ............................ class__n_neighbors=33, total= 2.9min
[Parallel(n_jobs=1)]: Done 3 out of 3 | elapsed: 26.8min finished
Performance Metrics for <class 'sklearn.neighbors.classification.KNeighborsClassifier'>
Performance Metrics for Train Set
0
accuracy 0.645793
precision 0.195897
recall 0.910432
f1 0.322418
roc_auc 0.872208
Performance Metrics for Validation Set
0
accuracy 0.618861
precision 0.165836
recall 0.773620
f1 0.273124
roc_auc 0.747988
Performance Metrics for Test Set
Accuracy for test set is 0.621373
No Cancer Cancer
precision 0.962504 0.166155
recall 0.606351 0.768559
f1 0.744002 0.273239
AUC: 0.751
In [443]:
Comparison of Results
In [444]:
In [445]:
In [446]:
In [452]:
In [448]:
In [491]:
In [492]:
Relative Risks of Chlamydia and Cancer
In [509]:
0.47641197170830285
In [504]:
col_0 0.0 1.0
row_0
0 26284 477
1 1063 9
In [512]:
0.5628058397702916
In [514]:
4578
In [516]:
49454
In [515]:
26761 1072
3506 18115
4.210186838114133
In [475]:
In [476]:
In [477]:
In [478]:
Statistic | accuracy | f1 | precision | recall | roc_auc |
---|---|---|---|---|---|
Classifier | |||||
KNN | 0.621373 | 0.273239 | 0.166155 | 0.768559 | 0.751189 |
Logistic | 0.705894 | 0.313429 | 0.199940 | 0.724891 | 0.777009 |
SVM | 0.705995 | 0.313179 | 0.199819 | 0.723799 | 0.773600 |
MLP | 0.732181 | 0.327836 | 0.212990 | 0.711454 | 0.801291 |
Random Forest | 0.790314 | 0.319107 | 0.228169 | 0.530568 | 0.772473 |
In [0]:
In [454]:
In [455]:
No Cancer | Cancer | Statistic | Classifier | |
---|---|---|---|---|
recall | 0.703955 | 0.724891 | recall | Logistic |
recall | 0.704178 | 0.723799 | recall | SVM |
recall | 0.816825 | 0.530568 | recall | Random Forest |
recall | 0.734276 | 0.711454 | recall | MLP |
recall | 0.606351 | 0.768559 | recall | KNN |
In [456]:
0.27510917030567683
In [457]:
In [480]:
Fitting 3 folds for each of 20 candidates, totalling 60 fits
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski
[Parallel(n_jobs=1)]: Using backend SequentialBackend with 1 concurrent workers.
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski
[Parallel(n_jobs=1)]: Done 1 out of 1 | elapsed: 5.9s remaining: 0.0s
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=25, class__metric=minkowski, total= 2.3s
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski, total= 1.9s
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=25, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski, total= 2.4s
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski, total= 2.0s
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=26, class__metric=minkowski, total= 2.2s
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski, total= 1.8s
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=26, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski, total= 2.3s
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=27, class__metric=minkowski, total= 2.2s
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski, total= 1.9s
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=27, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=28, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski, total= 1.9s
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=28, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski, total= 2.3s
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=29, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski, total= 1.9s
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=29, class__metric=minkowski, total= 2.0s
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski, total= 2.5s
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=30, class__metric=minkowski, total= 2.4s
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski, total= 2.4s
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski, total= 2.2s
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=30, class__metric=minkowski, total= 2.8s
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski, total= 2.0s
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=31, class__metric=minkowski, total= 2.7s
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski, total= 2.2s
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=31, class__metric=minkowski, total= 2.0s
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski, total= 2.6s
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=32, class__metric=minkowski, total= 2.5s
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=32, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski, total= 2.5s
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=33, class__metric=minkowski, total= 2.7s
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=33, class__metric=minkowski, total= 2.2s
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski, total= 2.3s
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski, total= 2.1s
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=uniform, class__n_neighbors=34, class__metric=minkowski, total= 2.2s
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski, total= 2.0s
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski, total= 2.1s
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski
[CV] class__weights=distance, class__n_neighbors=34, class__metric=minkowski, total= 2.0s
[Parallel(n_jobs=1)]: Done 60 out of 60 | elapsed: 6.4min finished
In [485]:
In [486]:
In [490]:
In [483]:
array([{'class__weights': 'uniform', 'class__n_neighbors': 27, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 34, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 31, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 33, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 31, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 29, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 29, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 32, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 32, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 33, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 34, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 25, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 26, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 26, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 25, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 27, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 28, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 28, 'class__metric': 'minkowski'},
{'class__weights': 'distance', 'class__n_neighbors': 30, 'class__metric': 'minkowski'},
{'class__weights': 'uniform', 'class__n_neighbors': 30, 'class__metric': 'minkowski'}],
dtype=object)
In [517]:
(49454, 37)
In [0]: