huabdul's picture
Update app.py
f7de449
raw
history blame
5.18 kB
import numpy as np
import matplotlib.pyplot as plt
from matplotlib.colors import ListedColormap
from itertools import combinations
plt.rcParams['figure.dpi'] = 100
from sklearn.datasets import load_iris
from sklearn.tree import DecisionTreeClassifier
from sklearn.neighbors import KNeighborsClassifier
from sklearn.svm import SVC
from sklearn.ensemble import VotingClassifier
import gradio as gr
#==================================================
C1, C2, C3 = '#ff0000', '#ffff00', '#0000ff'
CMAP = ListedColormap([C1, C2, C3])
GRANULARITY = 0.05
FEATURE_NAMES = ["Sepal Length", "Sepal Width", "Petal Length", "Petal Width"]
TARGET_NAMES = ["Setosa", "Versicolour", "Virginica"]
MODEL_NAMES = ['DecisionTreeClassifier', 'KNeighborsClassifier', 'SupportVectorClassifier', 'VotingClassifier']
iris = load_iris()
#==================================================
def get_decision_surface(X, y, model):
x_min, x_max = X[:, 0].min() - 1, X[:, 0].max() + 1
y_min, y_max = X[:, 1].min() - 1, X[:, 1].max() + 1
xrange = np.arange(x_min, x_max, GRANULARITY)
yrange = np.arange(y_min, y_max, GRANULARITY)
xx, yy = np.meshgrid(xrange, yrange)
Z = model.predict(np.c_[xx.ravel(), yy.ravel()])
Z = Z.reshape(xx.shape)
return xx, yy, Z
def create_plot(feature_string, max_depth, n_neighbors, gamma, weight1, weight2, weight3):
feature_list = feature_string.split(',')
feature_list = [s.strip() for s in feature_list]
idx_x = FEATURE_NAMES.index(feature_list[0])
idx_y = FEATURE_NAMES.index(feature_list[1])
X = iris.data[:, [idx_x, idx_y]]
y = iris.target
rnd_idx = np.random.permutation(X.shape[0])
X = X[rnd_idx]
y = y[rnd_idx]
clf1 = DecisionTreeClassifier(max_depth=max_depth)
clf2 = KNeighborsClassifier(n_neighbors=n_neighbors, n_jobs=-1)
clf3 = SVC(gamma=gamma, kernel="rbf", probability=True)
eclf = VotingClassifier(
estimators=[("dt", clf1), ("knn", clf2), ("svc", clf3)],
voting="soft",
weights=[weight1, weight2, weight3],
)
clf1.fit(X, y)
clf2.fit(X, y)
clf3.fit(X, y)
eclf.fit(X, y)
fig, _ = plt.subplots(2, 2, figsize=(7, 7), sharex=True, sharey=True)
for i, clf in enumerate([clf1, clf2, clf3, eclf]):
xx, yy, Z = get_decision_surface(X, y, clf)
ax = fig.add_subplot(2, 2, i+1)
ax.set_axis_off()
ax.contourf(xx, yy, Z, cmap=CMAP, alpha=0.65)
for j, label in enumerate(TARGET_NAMES):
X_label = X[y==j,:]
y_label = y[y==j]
ax.scatter(X_label[:, 0], X_label[:, 1], c=[[C1], [C2], [C3]][j]*len(y_label), edgecolor='k', s=40, label=label)
ax.legend()
ax.set_title(f'{MODEL_NAMES[i]}')
fig.supxlabel(feature_list[0]); fig.supylabel(feature_list[1])
fig.set_tight_layout(True)
fig.set_constrained_layout(True)
return fig
info = '''
# Voting Classifier Decision Surface
This app plots the decision surface of four classifiers on two selected features of the Iris dataset: DecisionTreeClassifier, KNeighborsClassifier, SupportVectorClassifier, and a VotingClassifier from all of them.
Use the controls below to tune the parameters of the classifiers and the weights of each of them in the soft voting classifier and click submit. The more weight you assign to a classifier, the more importance will be assigned to its predictions compared to the other classifiers in the vote.
Created by [@huabdul](https://huggingface.co/huabdul) based on [scikit-learn docs](https://scikit-learn.org/stable/auto_examples/ensemble/plot_voting_decision_regions.html).
'''
with gr.Blocks(analytics_enabled=False) as demo:
selections = combinations(FEATURE_NAMES, 2)
selections = [f'{s[0]}, {s[1]}' for s in selections]
with gr.Row():
with gr.Column():
gr.Markdown(info)
dd = gr.Dropdown(selections, value=selections[0], interactive=True, label="Input features")
with gr.Row():
with gr.Column(min_width=100):
slider_max_depth = gr.Slider(1, 50, value=4, step=1, label='max_depth (DecisionTree)')
slider_n_neighbors = gr.Slider(1, 20, value=7, step=1, label='n_neighbors (KNN)')
slider_gamma = gr.Slider(0, 10, value=0.1, step=0.1, label='gamma (SVC)')
with gr.Column(min_width=100):
slider_w1 = gr.Slider(0, 10, value=2, step=0.1, label='DecisionTreeClassifier weight')
slider_w2 = gr.Slider(0, 10, value=1, step=0.1, label='KNeighborsClassifier weight')
slider_w3 = gr.Slider(0, 10, value=2, step=0.1, label='SVC weight')
btn = gr.Button(value='Submit')
with gr.Column():
plot = gr.Plot(show_label=False)
btn.click(create_plot, inputs=[dd, slider_max_depth, slider_n_neighbors, slider_gamma, slider_w1, slider_w2, slider_w3], outputs=[plot])
demo.load(create_plot, inputs=[dd, slider_max_depth, slider_n_neighbors, slider_gamma, slider_w1, slider_w2, slider_w3], outputs=[plot])
demo.launch()
#==================================================