2020-03-13 16:13:43 +08:00
|
|
|
# Random Forest Classifier Example
|
2020-07-06 15:44:19 +08:00
|
|
|
from matplotlib import pyplot as plt
|
2020-03-13 16:13:43 +08:00
|
|
|
from sklearn.datasets import load_iris
|
|
|
|
from sklearn.ensemble import RandomForestClassifier
|
|
|
|
from sklearn.metrics import plot_confusion_matrix
|
2020-07-06 15:44:19 +08:00
|
|
|
from sklearn.model_selection import train_test_split
|
2020-03-13 16:13:43 +08:00
|
|
|
|
|
|
|
|
|
|
|
def main() -> None:
    """
    Random Forest Classifier Example using sklearn function.
    Iris type dataset is used to demonstrate algorithm.

    Loads the Iris dataset, holds out 30% of the samples as a test set,
    fits a 100-tree random forest on the remainder, and shows the
    confusion matrix for the held-out samples in a matplotlib window.
    Both the split and the forest use fixed random seeds, so repeated
    runs draw the same figure.
    """
    # Imported locally so this function does not depend on the removed
    # ``plot_confusion_matrix`` helper (deprecated in scikit-learn 1.0,
    # removed in 1.2). NOTE(review): the module-level import of
    # ``plot_confusion_matrix`` should be dropped as well, otherwise the
    # file still fails at import time on scikit-learn >= 1.2.
    from sklearn.metrics import ConfusionMatrixDisplay

    # Load Iris dataset
    iris = load_iris()

    # Split dataset into train and test data
    x = iris["data"]  # features
    y = iris["target"]  # class labels
    x_train, x_test, y_train, y_test = train_test_split(
        x, y, test_size=0.3, random_state=1
    )

    # Random Forest Classifier
    rand_for = RandomForestClassifier(random_state=42, n_estimators=100)
    rand_for.fit(x_train, y_train)

    # Display Confusion Matrix of Classifier
    # normalize="true" scales each row (true class) to sum to 1.
    ConfusionMatrixDisplay.from_estimator(
        rand_for,
        x_test,
        y_test,
        display_labels=iris["target_names"],
        cmap="Blues",
        normalize="true",
    )
    plt.title("Normalized Confusion Matrix - IRIS Dataset")
    plt.show()
|
|
|
|
|
|
|
|
|
|
|
|
# Run the demo only when this file is executed as a script,
# not when it is imported as a module.
if __name__ == "__main__":
    main()
|