
Commit 6e6b9a8 (parent ea4af60)

Reintroduced ordering + fixing conversion typos

14 files changed: +77 -45 lines

docs/source/index.rst

Lines changed: 1 addition & 1 deletion

@@ -26,6 +26,6 @@ decomposition, and selection of features and samples.
    intro
    installation
    reference
-   examples/index
+   tutorials
    contributing
    bibliography

docs/source/intro.rst

Lines changed: 1 addition & 1 deletion

@@ -1,5 +1,5 @@
 What's in scikit-matter?
-========================
+=======================
 
 ``scikit-matter`` is a collection of `scikit-learn <https://scikit.org/>`_
 compatible utilities that implement methods born out of the materials science

docs/source/tutorials.rst

Lines changed: 28 additions & 0 deletions

@@ -0,0 +1,28 @@
+.. include:: examples/index.rst
+   :start-after: inclusion-examples-start
+   :end-before: inclusion-examples-end
+
+.. toctree::
+   :glob:
+   :Caption: PCovR and KernelPCovR
+
+   examples/PCovR*
+
+.. toctree::
+   :glob:
+   :Caption: Feature and Sample Selection
+
+   examples/FeatureSelection*
+   examples/Selectors-Pipelines*
+
+.. toctree::
+   :Caption: Orthogonal Regression
+
+   examples/OrthogonalRegressionNonAnalytic
+
+.. toctree::
+   :Caption: Feature Reconstruction Measures
+
+   examples/PlotGFRE
+   examples/PlotPointwiseGFRE
+   examples/PlotLFRE

examples/FeatureSelection-WHODataset.py

Lines changed: 11 additions & 10 deletions

@@ -16,7 +16,8 @@
 from skmatter.feature_selection import CUR, FPS, PCovCUR, PCovFPS
 from skmatter.preprocessing import StandardFlexibleScaler
 
-
+# %%
+#
 # Load the Dataset
 # ----------------
 
@@ -78,7 +79,7 @@
 # %%
 #
 # Scale and Center the Features and Targets
-# -----------------------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 x_scaler = StandardFlexibleScaler(column_wise=True)
 X = x_scaler.fit_transform(X_raw)
@@ -95,7 +96,7 @@
 # %%
 #
 # Provide an estimated target for the feature selector
-# ----------------------------------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 
 kernel_params = {"kernel": "rbf", "gamma": 0.08858667904100832}
@@ -112,7 +113,7 @@
 
 # %%
 # PCov-CUR
-# --------
+# ^^^^^^^^
 
 
 pcur = PCovCUR(n_to_select=n_select, progress_bar=True, mixing=0.0)
@@ -121,7 +122,7 @@
 # %%
 #
 # PCov-FPS
-# --------
+# ^^^^^^^^
 
 pfps = PCovFPS(
     n_to_select=n_select,
@@ -134,7 +135,7 @@
 # %%
 #
 # CUR
-# ---
+# ^^^
 
 cur = CUR(n_to_select=n_select, progress_bar=True)
 cur.fit(X_train, y_train)
@@ -143,15 +144,15 @@
 # %%
 #
 # FPS
-# ---
+# ^^^
 
 fps = FPS(n_to_select=n_select, progress_bar=True, initialize=cur.selected_idx_[0])
 fps.fit(X_train, y_train)
 
 # %%
 #
-# (For Comparison) Recurisive Feature Addition
-# --------------------------------------------
+# (For Comparison) Recursive Feature Addition
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 
 class RecursiveFeatureAddition:
@@ -180,7 +181,7 @@ def fit(self, X, y):
 # %%
 #
 # Plot our Results
-# ================
+# ----------------
 
 
 fig, axes = plt.subplots(
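
Aside (not part of this commit): a minimal sketch of the shared selector API the
headings above refer to, using random placeholder data in place of the WHO
features; the constructor arguments mirror the ones in the diff.

    import numpy as np
    from skmatter.feature_selection import CUR, FPS, PCovCUR

    X = np.random.RandomState(0).rand(100, 20)
    y = np.random.RandomState(1).rand(100, 1)
    n_select = 5

    # plain CUR: leverage-score selection driven by X alone
    cur = CUR(n_to_select=n_select)
    cur.fit(X, y)

    # FPS seeded from the first CUR pick, as the example itself does
    fps = FPS(n_to_select=n_select, initialize=cur.selected_idx_[0])
    fps.fit(X, y)

    # PCov-CUR: mixing=0.0 weights the selection entirely toward regressing y
    pcur = PCovCUR(n_to_select=n_select, mixing=0.0)
    pcur.fit(X, y)

    X_selected = cur.transform(X)  # keep only the selected columns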

examples/FeatureSelection.py

Lines changed: 1 addition & 1 deletion

@@ -67,7 +67,7 @@
 # %%
 #
 # Non-iterative feature selection with CUR + PCovR
-# ------------------------------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 #
 # Computing a non-iterative CUR is more efficient, although can resultin poorer
 # performance for larger datasets. you can also use a greater number of
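
Aside (not part of this commit): the "non-iterative" variant mentioned here
presumably corresponds to computing the CUR leverage scores once rather than
after every pick; a hedged sketch, assuming ``CUR``'s ``recompute_every``
argument (0 = never recompute):

    from skmatter.feature_selection import CUR

    # hedged: recompute_every=0 is assumed to skip score updates between picks
    cur_noniterative = CUR(n_to_select=10, recompute_every=0)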

examples/OrthogonalRegressionNonAnalytic.py

Lines changed: 6 additions & 3 deletions

@@ -236,9 +236,10 @@ def z_scaled_square_prism(z_scaling):
 
 ax_xy.set_title("xy plane")
 
-plt.legend(bbox_to_anchor=(1, 1), loc="upper left")
+ax_xy.legend(bbox_to_anchor=(1, 1), loc="upper left")
 
-plt.show()
+fig.tight_layout()
+fig.show()
 
 # %%
 #
@@ -279,7 +280,9 @@ def z_scaled_square_prism(z_scaling):
 )
 ax_wo_orth.set_xlabel("scaling in z direction")
 ax_wo_orth.legend(loc="upper right", bbox_to_anchor=(0.7, -0.2))
-plt.show()
+
+fig.tight_layout()
+fig.show()
 
 # %%
 #
examples/PCovR-WHODataset.py

Lines changed: 12 additions & 13 deletions

@@ -7,7 +7,6 @@
 # %%
 #
 
-
 import numpy as np
 from matplotlib import pyplot as plt
 from scipy.stats import pearsonr
@@ -23,7 +22,7 @@
 # %%
 #
 # Load the Dataset
-# ================
+# ----------------
 
 
 df = load_who_dataset()["data"]
@@ -55,14 +54,14 @@
     print(X_raw[:, columns.index(ls)].min(), X_raw[:, columns.index(ls)].max())
     if ls in columns:
         X_raw[:, columns.index(ls)] = np.log10(X_raw[:, columns.index(ls)])
-y_raw = np.array(df["SP.DYN.LE00.IN"])  # [np.where(df['Year']==2000)[0]])
+y_raw = np.array(df["SP.DYN.LE00.IN"])
 y_raw = y_raw.reshape(-1, 1)
 X_raw.shape
 
 # %%
 #
 # Scale and Center the Features and Targets
-# -----------------------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 x_scaler = StandardFlexibleScaler(column_wise=True)
 X = x_scaler.fit_transform(X_raw)
@@ -79,7 +78,7 @@
 # %%
 #
 # Train the Different Linear DR Techniques
-# ========================================
+# ----------------------------------------
 #
 # Best Error for Linear Regression
 
@@ -90,7 +89,7 @@
 # %%
 #
 # PCovR
-# -----
+# ^^^^^
 
 pcovr = PCovR(
     n_components=n_components,
@@ -113,7 +112,7 @@
 # %%
 #
 # PCA
-# ---
+# ^^^
 
 pca = PCA(
     n_components=n_components,
@@ -140,10 +139,10 @@
 # %%
 #
 # Train the Different Kernel DR Techniques
-# ========================================
+# ----------------------------------------
 #
 # Select Kernel Hyperparameters
-# -----------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 param_grid = {"gamma": np.logspace(-8, 3, 20), "alpha": np.logspace(-8, 3, 20)}
 clf = KernelRidge(kernel="rbf")
@@ -168,7 +167,7 @@
 # %%
 #
 # KPCovR
-# ------
+# ^^^^^^
 
 
 kpcovr = KernelPCovR(
@@ -191,7 +190,7 @@
 # %%
 #
 # KPCA
-# ----
+# ^^^^
 
 kpca = KernelPCA(n_components=n_components, **kernel_params, random_state=0).fit(
     X_train, y_train
@@ -210,15 +209,15 @@
 # %%
 #
 # Correlation of the different variables with the KPCovR axes
-# -----------------------------------------------------------
+# ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
 for c, x in zip(columns, X.T):
     print(c, pearsonr(x, T_kpcovr[:, 0])[0], pearsonr(x, T_kpcovr[:, 1])[0])
 
 # %%
 #
 # Plot Our Results
-# ================
+# ----------------
 
 fig, axes = plt.subplot_mosaic(
     """

examples/PCovR.py

Lines changed: 2 additions & 2 deletions

@@ -164,5 +164,5 @@
 # it's important to consider the nature of the property you are learning and the samples
 # you are comparing before constructing a kernel, for example, whether the analysis is
 # to be based on whole structures or individual atomic environments. For more detail,
-# see Appendix C of [Helfrecht 2020](https://iopscience.iop.org/article/10.1088/2632-2153/aba9ef)
-# or regarding kernels involving gradients [Musil 2021](https://arxiv.org/pdf/2101.08814.pdf).
+# see Appendix C of `Helfrecht 2020 <https://iopscience.iop.org/article/10.1088/2632-2153/aba9ef>`_
+# or regarding kernels involving gradients `Musil 2021 <https://arxiv.org/pdf/2101.08814.pdf>`_.

examples/PCovR_Regressors.py

Lines changed: 4 additions & 4 deletions

@@ -33,7 +33,7 @@
 # %%
 #
 # Use the default regressor in PCovR
-# ==================================
+# ----------------------------------
 #
 # When there is no regressor supplied, PCovR uses
 # ``sklearn.linear_model.Ridge('alpha':1e-6, 'fit_intercept':False, 'tol':1e-12)``.
@@ -50,7 +50,7 @@
 # %%
 #
 # Use a fitted regressor
-# ======================
+# ----------------------
 #
 # You can pass a fitted regressor to PCovR to rely on the predetermined
 # regression parameters. Currently, scikit-matter supports ``scikit-learn``
@@ -80,7 +80,7 @@
 # %%
 #
 # Use a pre-predicted y
-# =====================
+# ---------------------
 #
 # With ``regressor='precomputed'``, you can pass a regression output :math:`\hat{Y}` and
 # optional regression weights :math:`W` to PCovR. If ``W=None``, then PCovR will determine
@@ -110,7 +110,7 @@
 # %%
 #
 # Comparing Results
-# =================
+# -----------------
 #
 # Because we used the same regressor in all three models, they will yield the same result.
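
Aside (not part of this commit): a hedged sketch of the three regressor modes
these headings describe, on random placeholder data:

    import numpy as np
    from sklearn.linear_model import Ridge
    from skmatter.decomposition import PCovR

    X = np.random.RandomState(0).rand(50, 8)
    y = np.random.RandomState(1).rand(50)

    # 1. no regressor supplied: PCovR falls back on the default Ridge above
    pcovr_default = PCovR(mixing=0.5, n_components=2).fit(X, y)

    # 2. a regressor fitted ahead of time
    ridge = Ridge(alpha=1e-6, fit_intercept=False, tol=1e-12).fit(X, y)
    pcovr_fitted = PCovR(mixing=0.5, n_components=2, regressor=ridge).fit(X, y)

    # 3. a pre-predicted y passed directly; W is left for PCovR to determine
    y_hat = ridge.predict(X)
    pcovr_pre = PCovR(mixing=0.5, n_components=2, regressor="precomputed").fit(X, y_hat)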

examples/PCovR_Scaling.py

Lines changed: 3 additions & 3 deletions

@@ -143,6 +143,6 @@
 
 # %%
 #
-# **Note: when the relative magnitude of the features or targets is important, such as
-# in load_csd_1000r, one should use the `StandardFlexibleScaler` provided by
-# ``scikit-matter``.**
+# **Note**: When the relative magnitude of the features or targets is important, such
+# as in :func:`skmatter.datasets.load_csd_1000r`, one should use the
+# :class:`skmatter.preprocessing.StandardFlexibleScaler`.
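
Aside (not part of this commit): a minimal sketch of the scaler this note
recommends; with ``column_wise=True`` each feature is standardized separately
rather than the matrix being scaled by one overall norm:

    import numpy as np
    from skmatter.preprocessing import StandardFlexibleScaler

    # columns of very different magnitude, as in the CSD-1000r case
    X = np.random.RandomState(0).rand(10, 3) * np.array([1.0, 10.0, 100.0])

    X_scaled = StandardFlexibleScaler(column_wise=True).fit_transform(X)
    print(X_scaled.std(axis=0))  # each column now has unit variance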

examples/PlotPointwiseGFRE.py

Lines changed: 1 addition & 1 deletion

@@ -50,7 +50,7 @@
 # \exp(-\gamma \|\mathbf{x}-\mathbf{x}'\|^2),\quad \gamma\in\mathbb{R}_+
 #
 # The projected RKHS features are computed using the eigendecomposition of the
-# positive-definite kernel matrix :math:`K``
+# positive-definite kernel matrix :math:`K`
 #
 # .. math::
 #     K = ADA^T = AD^{\frac12}(AD^{\frac12})^T = \Phi\Phi^T
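
Aside (not part of this commit): a hedged numpy sketch of this construction,
building :math:`\Phi = AD^{\frac12}` so that :math:`K = \Phi\Phi^T`:

    import numpy as np

    rng = np.random.RandomState(0)
    X = rng.rand(20, 3)
    gamma = 1.0

    # RBF kernel matrix K_ij = exp(-gamma * ||x_i - x_j||^2)
    sq_dists = ((X[:, None, :] - X[None, :, :]) ** 2).sum(axis=-1)
    K = np.exp(-gamma * sq_dists)

    D, A = np.linalg.eigh(K)  # K = A @ np.diag(D) @ A.T, with D >= 0 up to round-off
    D = np.clip(D, 0.0, None)
    Phi = A * np.sqrt(D)  # equals A @ np.diag(np.sqrt(D)); rows are the RKHS features

    assert np.allclose(Phi @ Phi.T, K, atol=1e-8)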

examples/README.rst

Lines changed: 5 additions & 1 deletion

@@ -1,9 +1,13 @@
+.. inclusion-examples-start
+
 Examples
-########
+========
 
 For a thorough tutorial of the methods introduced in `scikit-matter`, we
 suggest you check out the pedagogic notebooks in our companion project
 `kernel-tutorials <https://github.com/lab-cosmo/kernel-tutorials/>`_.
 
 The examples presented here need on top of the `scikit-matter` dependencies
 `pandas <https://pandas.pydata.org>`_ and `matplotlib <https://matplotlib.org>`_.
+
+.. inclusion-examples-end

examples/Selectors-Pipelines.py

Lines changed: 2 additions & 2 deletions

@@ -23,7 +23,7 @@
 # %%
 #
 # Simple integration of scikit-matter selectors
-# =============================================
+# ---------------------------------------------
 #
 # This example shows how to use FPS to subselect features before training a RidgeCV.
 
@@ -50,7 +50,7 @@
 # %%
 #
 # Stacking selectors one after another
-# ====================================
+# ------------------------------------
 #
 # This example shows how to use an FPS, then CUR selector
 # to subselect features before training a RidgeCV.
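
Aside (not part of this commit): a hedged sketch of both patterns these
headings name, on random placeholder data:

    import numpy as np
    from sklearn.linear_model import RidgeCV
    from sklearn.pipeline import Pipeline
    from skmatter.feature_selection import CUR, FPS

    X = np.random.RandomState(0).rand(40, 12)
    y = np.random.RandomState(1).rand(40)

    # FPS subselects features, then RidgeCV trains on the reduced matrix
    pipe = Pipeline([("fps", FPS(n_to_select=6)), ("ridge", RidgeCV())])
    pipe.fit(X, y)

    # stacked selectors: FPS first, then CUR on the surviving features
    stacked = Pipeline(
        [("fps", FPS(n_to_select=8)), ("cur", CUR(n_to_select=4)), ("ridge", RidgeCV())]
    )
    stacked.fit(X, y)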

skmatter/datasets/descr/nice_dataset.rst

Lines changed: 0 additions & 3 deletions

@@ -2,7 +2,6 @@
 
 NICE dataset
 ############
-
 This is a toy dataset containing NICE[1, 4](N-body Iterative Contraction of Equivariants) features for first 500 configurations of the dataset[2, 3] with randomly displaced methane configurations.
 
 Function Call
@@ -11,10 +10,8 @@ Function Call
 
 Data Set Characteristics
 ------------------------
-
 :Number of Instances: 500
 :Number of Features: 160
-
 The representations were computed using the NICE package[4] using the following definition of the NICE calculator:
 
 .. code-block:: python
