[DOC] MkDocs Chemistry (#899)

ericmjl · Zeroto521 · web-flow · commit 24edc3acaabc · 2021-09-04T20:17:21.000-04:00
* mkdocstrings on chemistry functions * Minor update to biology.py * Proper config for syntax highlighting * Switch to nord theme for syntax highlighting * [INF] simplify a bit linting, use pre-commit as CI linting checker (#892) * [INF] simplify a bit linting There are two similar linting CIs (pre-commit and code-checks), but they also have tiny differences. We should use one of them as the standard, not both. * Update CHANGELOG.md * should be `--config` not `-c` `-c` = `--code TEXT`, Format the code passed in as a string. * remove nbstripout keep the same with the old code-checks.yml * lint via pre-commit * Update CHANGELOG.md Co-authored-by: Eric Ma <ericmjl@users.noreply.github.com> * Flake8 fix. Co-authored-by: Zero <Zeroto521@gmail.com>
diff --git a/janitor/biology.py b/janitor/biology.py
@@ -58,7 +58,6 @@ def join_fasta(
     Method chaining usage example:
 
     ```python
-
     import pandas as pd
     import janitor.biology
 
diff --git a/janitor/chemistry.py b/janitor/chemistry.py
@@ -94,36 +94,38 @@ def smiles2mol(
 
     Functional usage example:
 
-    .. code-block:: python
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        import pandas as pd
-        import janitor.chemistry
+    df = pd.DataFrame(...)
 
-        df = pd.DataFrame(...)
-
-        df = janitor.chemistry.smiles2mol(
-            df=df,
-            smiles_column_name='smiles',
-            mols_column_name='mols'
-        )
+    df = janitor.chemistry.smiles2mol(
+        df=df,
+        smiles_column_name='smiles',
+        mols_column_name='mols'
+    )
+    ```
 
     Method chaining usage example:
 
-    .. code-block:: python
-
-        import pandas as pd
-        import janitor.chemistry
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        df = pd.DataFrame(...)
+    df = pd.DataFrame(...)
 
-        df = df.smiles2mol(smiles_column_name='smiles',
-                           mols_column_name='mols')
+    df = df.smiles2mol(
+        smiles_column_name='smiles',
+        mols_column_name='mols'
+    )
+    ```
 
     A progressbar can be optionally used.
 
-    - Pass in "notebook" to show a tqdm notebook progressbar. (ipywidgets must
-      be enabled with your Jupyter installation.)
-    - Pass in "terminal" to show a tqdm progressbar. Better suited for use
+    - Pass in "notebook" to show a `tqdm` notebook progressbar.
+      (`ipywidgets` must be enabled with your Jupyter installation.)
+    - Pass in "terminal" to show a `tqdm` progressbar. Better suited for use
       with scripts.
     - "none" is the default value - progress bar will be not be shown.
 
@@ -180,67 +182,70 @@ def morgan_fingerprint(
 
     Functional usage example:
 
-    .. code-block:: python
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        import pandas as pd
-        import janitor.chemistry
+    df = pd.DataFrame(...)
 
-        df = pd.DataFrame(...)
-
-        # For "counts" kind
-        morgans = janitor.chemistry.morgan_fingerprint(
-            df=df.smiles2mol('smiles', 'mols'),
-            mols_column_name='mols',
-            radius=3,      # Defaults to 3
-            nbits=2048,    # Defaults to 2048
-            kind='counts'  # Defaults to "counts"
-        )
+    # For "counts" kind
+    morgans = janitor.chemistry.morgan_fingerprint(
+        df=df.smiles2mol('smiles', 'mols'),
+        mols_column_name='mols',
+        radius=3,      # Defaults to 3
+        nbits=2048,    # Defaults to 2048
+        kind='counts'  # Defaults to "counts"
+    )
 
-        # For "bits" kind
-        morgans = janitor.chemistry.morgan_fingerprint(
-            df=df.smiles2mol('smiles', 'mols'),
-            mols_column_name='mols',
-            radius=3,      # Defaults to 3
-            nbits=2048,    # Defaults to 2048
-            kind='bits'    # Defaults to "counts"
-        )
+    # For "bits" kind
+    morgans = janitor.chemistry.morgan_fingerprint(
+        df=df.smiles2mol('smiles', 'mols'),
+        mols_column_name='mols',
+        radius=3,      # Defaults to 3
+        nbits=2048,    # Defaults to 2048
+        kind='bits'    # Defaults to "counts"
+    )
+    ```
 
     Method chaining usage example:
 
-    .. code-block:: python
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        import pandas as pd
-        import janitor.chemistry
+    df = pd.DataFrame(...)
 
-        df = pd.DataFrame(...)
-
-        # For "counts" kind
-        morgans = (
-            df.smiles2mol('smiles', 'mols')
-              .morgan_fingerprint(mols_column_name='mols',
-                                  radius=3,      # Defaults to 3
-                                  nbits=2048,    # Defaults to 2048
-                                  kind='counts'  # Defaults to "counts"
-              )
+    # For "counts" kind
+    morgans = (
+        df.smiles2mol('smiles', 'mols')
+        .morgan_fingerprint(
+            mols_column_name='mols',
+            radius=3,      # Defaults to 3
+            nbits=2048,    # Defaults to 2048
+            kind='counts'  # Defaults to "counts"
         )
+    )
 
-        # For "bits" kind
-        morgans = (
-            df.smiles2mol('smiles', 'mols')
-              .morgan_fingerprint(mols_column_name='mols',
-                                  radius=3,    # Defaults to 3
-                                  nbits=2048,  # Defaults to 2048
-                                  kind='bits'  # Defaults to "counts"
-              )
+    # For "bits" kind
+    morgans = (
+        df
+        .smiles2mol('smiles', 'mols')
+        .morgan_fingerprint(
+            mols_column_name='mols',
+            radius=3,    # Defaults to 3
+            nbits=2048,  # Defaults to 2048
+            kind='bits'  # Defaults to "counts"
         )
+    )
+    ```
 
     If you wish to join the morgan fingerprints back into the original
     dataframe, this can be accomplished by doing a `join`,
     because the indices are preserved:
 
-    .. code-block:: python
-
-        joined = df.join(morgans)
+    ```python
+    joined = df.join(morgans)
+    ```
 
     :param df: A pandas DataFrame.
     :param mols_column_name: The name of the column that has the RDKIT
@@ -294,52 +299,57 @@ def molecular_descriptors(
 
     The molecular descriptors are from the rdkit.Chem.rdMolDescriptors:
 
-        Chi0n, Chi0v, Chi1n, Chi1v, Chi2n, Chi2v, Chi3n, Chi3v,
-        Chi4n, Chi4v, ExactMolWt, FractionCSP3, HallKierAlpha, Kappa1,
-        Kappa2, Kappa3, LabuteASA, NumAliphaticCarbocycles,
-        NumAliphaticHeterocycles, NumAliphaticRings, NumAmideBonds,
-        NumAromaticCarbocycles, NumAromaticHeterocycles, NumAromaticRings,
-        NumAtomStereoCenters, NumBridgeheadAtoms, NumHBA, NumHBD,
-        NumHeteroatoms, NumHeterocycles, NumLipinskiHBA, NumLipinskiHBD,
-        NumRings, NumSaturatedCarbocycles, NumSaturatedHeterocycles,
-        NumSaturatedRings, NumSpiroAtoms, NumUnspecifiedAtomStereoCenters,
-        TPSA.
+    ```
+    Chi0n, Chi0v, Chi1n, Chi1v, Chi2n, Chi2v, Chi3n, Chi3v,
+    Chi4n, Chi4v, ExactMolWt, FractionCSP3, HallKierAlpha, Kappa1,
+    Kappa2, Kappa3, LabuteASA, NumAliphaticCarbocycles,
+    NumAliphaticHeterocycles, NumAliphaticRings, NumAmideBonds,
+    NumAromaticCarbocycles, NumAromaticHeterocycles, NumAromaticRings,
+    NumAtomStereoCenters, NumBridgeheadAtoms, NumHBA, NumHBD,
+    NumHeteroatoms, NumHeterocycles, NumLipinskiHBA, NumLipinskiHBD,
+    NumRings, NumSaturatedCarbocycles, NumSaturatedHeterocycles,
+    NumSaturatedRings, NumSpiroAtoms, NumUnspecifiedAtomStereoCenters,
+    TPSA.
+    ```
 
     Functional usage example:
 
-    .. code-block:: python
-
-        import pandas as pd
-        import janitor.chemistry
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        df = pd.DataFrame(...)
+    df = pd.DataFrame(...)
 
-        mol_desc = janitor.chemistry.molecular_descriptors(
+    mol_desc = (
+        janitor.chemistry.molecular_descriptors(
             df=df.smiles2mol('smiles', 'mols'),
             mols_column_name='mols'
         )
+    )
+    ```
 
     Method chaining usage example:
 
-    .. code-block:: python
+    ```python
 
-        import pandas as pd
-        import janitor.chemistry
+    import pandas as pd
+    import janitor.chemistry
 
-        df = pd.DataFrame(...)
+    df = pd.DataFrame(...)
 
-        mol_desc = (
-            df.smiles2mol('smiles', 'mols')
-              .molecular_descriptors(mols_column_name='mols')
-        )
+    mol_desc = (
+        df.smiles2mol('smiles', 'mols')
+        .molecular_descriptors(mols_column_name='mols')
+    )
+    ```
 
     If you wish to join the molecular descriptors back into the original
     dataframe, this can be accomplished by doing a `join`,
     because the indices are preserved:
 
-    .. code-block:: python
-
-        joined = df.join(mol_desc)
+    ```python
+    joined = df.join(mol_desc)
+    ```
 
     :param df: A pandas DataFrame.
     :param mols_column_name: The name of the column that has the RDKIT mol
@@ -410,40 +420,39 @@ def maccs_keys_fingerprint(
 
     Functional usage example:
 
-    .. code-block:: python
-
-        import pandas as pd
-        import janitor.chemistry
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        df = pd.DataFrame(...)
+    df = pd.DataFrame(...)
 
-        maccs = janitor.chemistry.maccs_keys_fingerprint(
-            df=df.smiles2mol('smiles', 'mols'),
-            mols_column_name='mols'
-        )
+    maccs = janitor.chemistry.maccs_keys_fingerprint(
+        df=df.smiles2mol('smiles', 'mols'),
+        mols_column_name='mols'
+    )
+    ```
 
     Method chaining usage example:
 
-    .. code-block:: python
+    ```python
+    import pandas as pd
+    import janitor.chemistry
 
-        import pandas as pd
-        import janitor.chemistry
+    df = pd.DataFrame(...)
 
-        df = pd.DataFrame(...)
-
-        maccs = (
-            df.smiles2mol('smiles', 'mols')
-              .maccs_keys_fingerprint(mols_column_name='mols')
-        )
+    maccs = (
+        df.smiles2mol('smiles', 'mols')
+        .maccs_keys_fingerprint(mols_column_name='mols')
+    )
+    ```
 
     If you wish to join the maccs keys fingerprints back into the
     original dataframe, this can be accomplished by doing a `join`,
     because the indices are preserved:
 
-    .. code-block:: python
-
-        joined = df.join(maccs_keys_fingerprint)
-
+    ```python
+    joined = df.join(maccs)
+    ```
 
     :param df: A pandas DataFrame.
     :param mols_column_name: The name of the column that has the RDKIT mol
diff --git a/mkdocs.yml b/mkdocs.yml
@@ -61,8 +61,11 @@ plugins:
 
 # Taken from here: https://squidfunk.github.io/mkdocs-material/extensions/codehilite/
 markdown_extensions:
-  - codehilite
+  # - codehilite
   - admonition
+  - pymdownx.highlight:
+      use_pygments: false
+  - pymdownx.inlinehilite
   # - pymdownx.tabbed
   # - pymdownx.arithmatex
   # - pymdownx.details
@@ -71,10 +74,16 @@ markdown_extensions:
 
 extra_javascript:
   - https://cdnjs.cloudflare.com/ajax/libs/mathjax/2.7.0/MathJax.js?config=TeX-AMS-MML_HTMLorMML
+  - https://cdnjs.cloudflare.com/ajax/libs/highlight.js/10.7.2/highlight.min.js
+  - js/config.js
 
 extra_css:
   - css/nb_mods.css
   - css/apidocs.css
+  # This sets the theme for syntax highlighting.
+  # Theme names are available here: https://highlightjs.org/static/demo/
+  # Not sure how the theme names map onto CSS filenames though.
+  - https://cdnjs.cloudflare.com/ajax/libs/highlight.js/10.7.2/styles/nord.min.css
 
 repo_name: "ericmjl/pyjanitor"
 repo_url: "https://github.com/ericmjl/pyjanitor"
diff --git a/mkdocs/js/config.js b/mkdocs/js/config.js
@@ -0,0 +1 @@
+hljs.highlightAll();