# ignore warnings
import warnings
warnings.filterwarnings("ignore")
import pandas as pd
from sklearn import model_selection
from sklearn.ensemble import BaggingClassifier
from sklearn.tree import DecisionTreeClassifier
# load data
filename = 'pima.indians.diabetes.data.csv'
names = ['preg', 'plas', 'pres', 'skin', 'test', 'mass', 'pedi', 'age', 'class']
dataframe = pd.read_csv(filename, names=names)
print(); print(dataframe.head())
array = dataframe.values
X = array[:,0:8]
Y = array[:,8]
seed = 7
kfold = model_selection.KFold(n_splits=10, random_state=seed)
cart = DecisionTreeClassifier()
num_trees = 1000
model = BaggingClassifier(base_estimator=cart, n_estimators=num_trees, random_state=seed)
results = model_selection.cross_val_score(model, X, Y, cv=kfold)
print(); print("Accuracy Results: ")
print(results.mean())
import pandas
from sklearn import model_selection
from sklearn.ensemble import RandomForestClassifier
# load data
filename = 'pima.indians.diabetes.data.csv'
names = ['preg', 'plas', 'pres', 'skin', 'test', 'mass', 'pedi', 'age', 'class']
dataframe = pd.read_csv(filename, names=names)
print(); print(dataframe.head())
array = dataframe.values
X = array[:,0:8]
Y = array[:,8]
seed = 7
num_trees = 1000
max_features = 6
kfold = model_selection.KFold(n_splits=10, random_state=seed)
model = RandomForestClassifier(n_estimators=num_trees, max_features=max_features)
results = model_selection.cross_val_score(model, X, Y, cv=kfold)
print(); print("Accuracy Results: ")
print(results.mean())
import pandas
from sklearn import model_selection
from sklearn.ensemble import ExtraTreesClassifier
# load data
filename = 'pima.indians.diabetes.data.csv'
names = ['preg', 'plas', 'pres', 'skin', 'test', 'mass', 'pedi', 'age', 'class']
dataframe = pd.read_csv(filename, names=names)
print(); print(dataframe.head())
array = dataframe.values
X = array[:,0:8]
Y = array[:,8]
seed = 7
num_trees = 1000
max_features = 7
kfold = model_selection.KFold(n_splits=10, random_state=seed)
model = ExtraTreesClassifier(n_estimators=num_trees, max_features=max_features)
results = model_selection.cross_val_score(model, X, Y, cv=kfold)
print(); print("Accuracy Results: ")
print(results.mean())