@@ -110,11 +110,14 @@
 from sklearn.inspection import DecisionBoundaryDisplay


-def plot_training_data_with_decision_boundary(kernel):
+def plot_training_data_with_decision_boundary(
+    kernel, ax=None, long_title=True, support_vectors=True
+):
     # Train the SVC
     clf = svm.SVC(kernel=kernel, gamma=2).fit(X, y)

     # Settings for plotting
-    _, ax = plt.subplots(figsize=(4, 3))
+    if ax is None:
+        _, ax = plt.subplots(figsize=(4, 3))
     x_min, x_max, y_min, y_max = -3, 3, -3, 3
     ax.set(xlim=(x_min, x_max), ylim=(y_min, y_max))
@@ -136,20 +139,26 @@ def plot_training_data_with_decision_boundary(kernel):
         linestyles=["--", "-", "--"],
     )

-    # Plot bigger circles around samples that serve as support vectors
-    ax.scatter(
-        clf.support_vectors_[:, 0],
-        clf.support_vectors_[:, 1],
-        s=250,
-        facecolors="none",
-        edgecolors="k",
-    )
+    if support_vectors:
+        # Plot bigger circles around samples that serve as support vectors
+        ax.scatter(
+            clf.support_vectors_[:, 0],
+            clf.support_vectors_[:, 1],
+            s=150,
+            facecolors="none",
+            edgecolors="k",
+        )
+
     # Plot samples by color and add legend
-    scatter = ax.scatter(X[:, 0], X[:, 1], c=y, s=150, edgecolors="k")
+    scatter = ax.scatter(X[:, 0], X[:, 1], c=y, s=30, edgecolors="k")
     ax.legend(*scatter.legend_elements(), loc="upper right", title="Classes")
-    ax.set_title(f"Decision boundaries of {kernel} kernel in SVC")
+    if long_title:
+        ax.set_title(f"Decision boundaries of {kernel} kernel in SVC")
+    else:
+        ax.set_title(kernel)

-    _ = plt.show()
+    if ax is None:
+        plt.show()


 # %%
@@ -237,7 +246,6 @@ def plot_training_data_with_decision_boundary(kernel):
 # using the hyperbolic tangent function (:math:`\tanh`). The kernel function
 # scales and possibly shifts the dot product of the two points
 # (:math:`\mathbf{x}_1` and :math:`\mathbf{x}_2`).
-
 plot_training_data_with_decision_boundary("sigmoid")

 # %%
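Side note on the sigmoid kernel mentioned in the comment above: it computes tanh(gamma * <x1, x2> + coef0). The snippet below is not part of the diff; it is a minimal check of that formula, with arbitrary gamma and coef0 values, comparing a manual evaluation against sklearn.metrics.pairwise.sigmoid_kernel.

import numpy as np
from sklearn.metrics.pairwise import sigmoid_kernel

rng = np.random.RandomState(0)
x1, x2 = rng.randn(2, 2)  # two random 2-D points
gamma, coef0 = 2.0, 1.0   # arbitrary illustrative values

# Manual evaluation of the sigmoid kernel formula
manual = np.tanh(gamma * np.dot(x1, x2) + coef0)
# Built-in pairwise kernel from scikit-learn
built_in = sigmoid_kernel(
    x1.reshape(1, -1), x2.reshape(1, -1), gamma=gamma, coef0=coef0
)[0, 0]
assert np.isclose(manual, built_in)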
@@ -271,3 +279,26 @@ def plot_training_data_with_decision_boundary(kernel):
 # parameters using techniques such as
 # :class:`~sklearn.model_selection.GridSearchCV` is recommended to capture the
 # underlying structures within the data.
+
+# %%
+# XOR dataset
+# -----------
+# A classical example of a dataset which is not linearly separable is the XOR
+# pattern. Here we demonstrate how different kernels work on such a dataset.
+
+xx, yy = np.meshgrid(np.linspace(-3, 3, 500), np.linspace(-3, 3, 500))
+np.random.seed(0)
+X = np.random.randn(300, 2)
+y = np.logical_xor(X[:, 0] > 0, X[:, 1] > 0)
+
+_, ax = plt.subplots(2, 2, figsize=(8, 8))
+args = dict(long_title=False, support_vectors=False)
+plot_training_data_with_decision_boundary("linear", ax[0, 0], **args)
+plot_training_data_with_decision_boundary("poly", ax[0, 1], **args)
+plot_training_data_with_decision_boundary("rbf", ax[1, 0], **args)
+plot_training_data_with_decision_boundary("sigmoid", ax[1, 1], **args)
+plt.show()
+
+# %%
+# As you can see from the plots above, only the `rbf` kernel can find a
+# reasonable decision boundary for this dataset.
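As a complement to the GridSearchCV recommendation in the hunk above, here is a minimal sketch of what such a search could look like on the XOR data. It is not part of the diff; the parameter grid is illustrative only.

from sklearn import svm
from sklearn.model_selection import GridSearchCV

# Illustrative grid only; the example itself does not tune these values.
param_grid = {
    "kernel": ["linear", "poly", "rbf", "sigmoid"],
    "gamma": [0.5, 1, 2],
    "C": [0.1, 1, 10],
}
search = GridSearchCV(svm.SVC(), param_grid, cv=5)
search.fit(X, y)  # X, y as defined in the XOR snippet above
print(search.best_params_, search.best_score_)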