docs: Added a way to build HTML docs with pdoc (#64)

* fix(python): Proper docstring formatting * docs: Added a way to build HTML docs with pdoc Signed-off-by: Luka Peschke <[email protected]>
ToucanToco · Jan 2, 2023 · ef7b490 · ef7b490
1 parent 80fbd46
commit ef7b490
Show file tree

Hide file tree

Showing 5 changed files with 43 additions and 29 deletions.
diff --git a/.gitignore b/.gitignore
@@ -7,3 +7,4 @@ __pycache__
 *.dat
 .python-version
 .venv
+docs
diff --git a/Makefile b/Makefile
@@ -9,6 +9,8 @@ pytest	= python -m pytest
 ## Rust
 clippy	= cargo clippy
 fmt	= cargo fmt
+## Docs
+pdoc	= pdoc -o docs python/fastexcel
 
 lint:
 	$(ruff)
@@ -23,7 +25,10 @@ format:
 install-test-requirements:
 	pip install -U maturin -r test-requirements.txt
 
-dev-setup: install-test-requirements
+install-doc-requirements:
+	pip install -r doc-requirements.txt
+
+dev-setup: install-test-requirements install-doc-requirements
 	pre-commit install
 
 dev-install:
@@ -35,4 +40,7 @@ prod-install:
 test:
 	$(pytest)
 
+doc:
+	$(pdoc)
+
 test-ci: dev-install test
diff --git a/README.md b/README.md
@@ -40,7 +40,11 @@ The Makefile provides the `lint` and `format` extras to ease this.
 
 `make test`
 
-### Creating a release
+## Building the docs
+
+`make doc`
+
+## Creating a release
 
 1. Create a PR containing a commit that only updates the version in `Cargo.toml`.
 2. Once it is approved, squash and merge it into main.

diff --git a/doc-requirements.txt b/doc-requirements.txt
@@ -0,0 +1 @@
+pdoc
diff --git a/python/fastexcel/__init__.py b/python/fastexcel/__init__.py
@@ -27,7 +27,7 @@ def width(self) -> int:
 
     @property
     def height(self) -> int:
-        """The sheet's height, with skip_rows and nrows applied"""
+        """The sheet's height, with `skip_rows` and `nrows` applied"""
         return self._sheet.height
 
     @property
@@ -36,17 +36,17 @@ def total_height(self) -> int:
         return self._sheet.total_height
 
     def to_arrow(self) -> bytes:
-        """Converts the sheet to an Arrow RecordBatch.
+        """Converts the sheet to an Arrow `RecordBatch`.
 
         The RecordBatch is serialized to the IPC format. It can be read with
         `pyarrow.ipc.open_stream`.
         """
         return self._sheet.to_arrow()
 
     def to_pandas(self) -> "pd.DataFrame":
-        """Converts the sheet to a pandas DataFrame.
+        """Converts the sheet to a Pandas `DataFrame`.
 
-        Requires the "pandas" extra to be installed.
+        Requires the `pandas` extra to be installed.
         """
         # We know for sure that the sheet will yield exactly one RecordBatch
         return list(pa.ipc.open_stream(self.to_arrow()))[0].to_pandas()
@@ -77,13 +77,14 @@ def load_sheet_by_name(
     ) -> ExcelSheet:
         """Loads a sheet by name.
 
-        `header_row` is the index of the row containing the column labels, default index is 0.
-        If `None`, the sheet does not have any column labels.
-        `column_names` overrides headers found in the document.
-        If `column_names` is used `header_row` will be ignored.
-        `n_rows` is the number of rows to parse.
-        `skip_rows` is the line numbers to skip after the headers.
-        If `header_row` is `None` then it skips the number of lines from 0.
+        :param name: The name of the sheet to load.
+        :param header_row: The index of the row containing the column labels, default index is 0.
+                           If `None`, the sheet does not have any column labels.
+        :param column_names: Overrides headers found in the document. If `column_names` is used,
+                             `header_row` will be ignored.
+        :param n_rows: Specifies how many rows should be loaded. If `None`, all rows are loaded
+        :param skip_rows: Specifies how many should be skipped after the header. If `header_row` is
+                          `None`, it skips the number of rows from the sheet's start.
         """
         return ExcelSheet(
             self._reader.load_sheet_by_name(
@@ -104,15 +105,16 @@ def load_sheet_by_idx(
         skip_rows: int = 0,
         n_rows: int | None = None,
     ) -> ExcelSheet:
-        """Loads a sheet by his index.
-
-        `header_row` is the index of the row containing the column labels, default index is 0.
-        If `None`, the sheet does not have any column labels.
-        `column_names` overrides headers found in the document.
-        If `column_names` is used `header_row` will be ignored.
-        `n_rows` is the number of rows to parse.
-        `skip_rows` is the line numbers to skip after the headers.
-        If `header_row` is `None` then it skips the number of lines from 0.
+        """Loads a sheet by index.
+
+        :param idx: The index (starting at 0) of the sheet to load.
+        :param header_row: The index of the row containing the column labels, default index is 0.
+                           If `None`, the sheet does not have any column labels.
+        :param column_names: Overrides headers found in the document. If `column_names` is used,
+                             `header_row` will be ignored.
+        :param n_rows: Specifies how many rows should be loaded. If `None`, all rows are loaded
+        :param skip_rows: Specifies how many should be skipped after the header. If `header_row` is
+                          `None`, it skips the number of rows from the sheet's start.
         """
         if idx < 0:
             raise ValueError(f"Expected idx to be > 0, got {idx}")
@@ -137,13 +139,7 @@ def load_sheet(
     ) -> ExcelSheet:
         """Loads a sheet by name if a string is passed or by index if an integer is passed.
 
-        `header_row` is the index of the row containing the column labels, default index is 0.
-        If `None`, the sheet does not have any column labels.
-        `column_names` overrides headers found in the document.
-        If `column_names` is used `header_row` will be ignored.
-        `n_rows` is the number of rows to parse.
-        `skip_rows` is the line numbers to skip after the headers.
-        If `header_row` is `None` then it skips the number of lines from 0.
+        See `load_sheet_by_idx` and `load_sheet_by_name` for parameter documentation.
         """
         return (
             self.load_sheet_by_idx(
@@ -168,6 +164,10 @@ def __repr__(self) -> str:
 
 
 def read_excel(path: str) -> ExcelReader:
+    """Opens and loads an excel file.
+
+    :param path: The path to the file
+    """
     return ExcelReader(_read_excel(path))
-Original file line number
+Diff line change
@@ Expand Up / @@ -7,3 +7,4 @@ __pycache__ @@
     *.dat
     .python-version
     .venv
+    docs