From 172f61329805841cefacbab278ad2b01f95411fd Mon Sep 17 00:00:00 2001
From: Martijn Govers <Martijn.Govers@Alliander.com>
Date: Tue, 1 Oct 2024 09:18:20 +0200
Subject: [PATCH 1/6] check mypy with numpy

Signed-off-by: Martijn Govers <Martijn.Govers@Alliander.com>
---
 .github/workflows/check-code-quality.yml |  2 +-
 .pre-commit-config.yaml                  |  8 +++++---
 src/power_grid_model/_utils.py           | 10 ++++++----
 3 files changed, 12 insertions(+), 8 deletions(-)

diff --git a/.github/workflows/check-code-quality.yml b/.github/workflows/check-code-quality.yml
index ab570eeae..af2918650 100644
--- a/.github/workflows/check-code-quality.yml
+++ b/.github/workflows/check-code-quality.yml
@@ -55,7 +55,7 @@ jobs:
 
       - name: Install and run mypy
         run: |
-          pip install mypy
+          pip install mypy numpy
           mypy .
 
       - name: Install and run pylint
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index cf8178661..eef0d09da 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -4,7 +4,7 @@
 
 repos:
   - repo: https://github.com/fsfe/reuse-tool
-    rev: v3.0.2
+    rev: v4.0.3
     hooks:
       - id: reuse
   - repo: https://github.com/pycqa/isort
@@ -12,13 +12,15 @@ repos:
     hooks:
       - id: isort
   - repo: https://github.com/psf/black
-    rev: 24.4.2
+    rev: 24.8.0
     hooks:
       - id: black-jupyter
   - repo: https://github.com/pre-commit/mirrors-mypy
-    rev: v1.10.0
+    rev: v1.11.2
     hooks:
       - id: mypy
+        additional_dependencies:
+          - numpy
   - repo: local
     hooks:
       - id: pylint
diff --git a/src/power_grid_model/_utils.py b/src/power_grid_model/_utils.py
index 52a195578..8bc166946 100644
--- a/src/power_grid_model/_utils.py
+++ b/src/power_grid_model/_utils.py
@@ -93,7 +93,7 @@ def convert_batch_dataset_to_batch_list(batch_data: BatchDataset) -> BatchList:
         if is_sparse(data):
             component_batches = split_sparse_batch_data_in_batches(cast(SparseBatchData, data), component)
         else:
-            component_batches = split_dense_batch_data_in_batches(data, component)
+            component_batches = split_dense_batch_data_in_batches(cast(SingleComponentData, data), component)
         for i, batch in enumerate(component_batches):
             if (isinstance(batch, dict) and batch) or (isinstance(batch, np.ndarray) and batch.size > 0):
                 list_data[i][component] = batch
@@ -151,7 +151,9 @@ def get_batch_size(batch_data: BatchComponentData) -> int:
         return indptr.size - 1
 
     data_to_check = (
-        next(iter(cast(DenseBatchColumnarData, batch_data).values())) if is_columnar(batch_data) else batch_data
+        next(iter(cast(DenseBatchColumnarData, batch_data).values()))
+        if is_columnar(batch_data)
+        else cast(DenseBatchArray, batch_data)
     )
     if data_to_check.ndim == 1:
         return 1
@@ -397,7 +399,7 @@ def _convert_data_to_row_or_columnar(
     if isinstance(attrs, (list, set)) and len(attrs) == 0:
         return {}
     if isinstance(attrs, ComponentAttributeFilterOptions):
-        names = cast(np.ndarray, data).dtype.names if not is_columnar(data) else data.keys()
+        names = cast(SingleArray, data).dtype.names if not is_columnar(data) else cast(SingleColumnarData, data).keys()
         return {attr: deepcopy(data[attr]) for attr in names}
     return {attr: deepcopy(data[attr]) for attr in attrs}
 
@@ -573,7 +575,7 @@ def _extract_columnar_data(data: ComponentData, is_batch: bool | None = None) ->
             raise TypeError("Expected columnar data")
         if attribute_array.ndim not in allowed_dims:
             raise TypeError("Expected columnar data")
-    return sub_data
+    return cast(ColumnarData, sub_data)
 
 
 def _extract_row_based_data(data: ComponentData, is_batch: bool | None = None) -> DataArray:  # pragma: no cover

From 1e4da2cd43b1603ea96c9065e3d5253b189e21f6 Mon Sep 17 00:00:00 2001
From: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
Date: Tue, 1 Oct 2024 09:42:07 +0200
Subject: [PATCH 2/6] created REUSE.toml

Signed-off-by: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
---
 .reuse/dep5 |  8 --------
 REUSE.toml  | 10 ++++++++++
 2 files changed, 10 insertions(+), 8 deletions(-)
 delete mode 100644 .reuse/dep5
 create mode 100644 REUSE.toml

diff --git a/.reuse/dep5 b/.reuse/dep5
deleted file mode 100644
index 6dbe0fae5..000000000
--- a/.reuse/dep5
+++ /dev/null
@@ -1,8 +0,0 @@
-Format: https://www.debian.org/doc/packaging-manuals/copyright-format/1.0/
-Upstream-Name: power-grid-model
-Upstream-Contact: Power Grid Model project <powergridmodel@lfenergy.org>
-Source: https://github.com/PowerGridModel/power-grid-model
-
-Files: ./*
-Copyright: Contributors to the Power Grid Model project <powergridmodel@lfenergy.org>
-License: MPL-2.0
diff --git a/REUSE.toml b/REUSE.toml
new file mode 100644
index 000000000..7d759e9f0
--- /dev/null
+++ b/REUSE.toml
@@ -0,0 +1,10 @@
+version = 1
+SPDX-PackageName = "power-grid-model"
+SPDX-PackageSupplier = "Power Grid Model project <powergridmodel@lfenergy.org>"
+SPDX-PackageDownloadLocation = "https://github.com/PowerGridModel/power-grid-model"
+
+[[annotations]]
+path = "./**"
+precedence = "aggregate"
+SPDX-FileCopyrightText = "Contributors to the Power Grid Model project <powergridmodel@lfenergy.org>"
+SPDX-License-Identifier = "MPL-2.0"

From 9a8a2759937d10fe4378d81d828d211e177ca7a1 Mon Sep 17 00:00:00 2001
From: Martijn Govers <Martijn.Govers@Alliander.com>
Date: Tue, 1 Oct 2024 09:49:30 +0200
Subject: [PATCH 3/6] fix mypy

Signed-off-by: Martijn Govers <Martijn.Govers@Alliander.com>
---
 src/power_grid_model/core/buffer_handling.py    | 13 +++++++------
 src/power_grid_model/core/power_grid_dataset.py |  2 +-
 src/power_grid_model/utils.py                   |  6 ++++--
 3 files changed, 12 insertions(+), 9 deletions(-)

diff --git a/src/power_grid_model/core/buffer_handling.py b/src/power_grid_model/core/buffer_handling.py
index 353128de6..1064fc4a4 100644
--- a/src/power_grid_model/core/buffer_handling.py
+++ b/src/power_grid_model/core/buffer_handling.py
@@ -20,6 +20,7 @@
     AttributeType,
     ComponentData,
     DenseBatchData,
+    IndexPointer,
     SingleComponentData,
     SparseBatchArray,
     SparseBatchData,
@@ -153,7 +154,7 @@ def _get_uniform_buffer_properties(
 
     if isinstance(data, np.ndarray):
         ndim = data.ndim
-        shape: tuple[int] = data.shape
+        shape = data.shape
         columns = None
     elif data:
         attribute, attribute_data = next(iter(data.items()))
@@ -317,7 +318,7 @@ def _get_attribute_buffer_views(
 
 
 def _get_uniform_buffer_view(
-    data: np.ndarray,
+    data: DenseBatchData,
     schema: ComponentMetaData,
     is_batch: bool | None,
     batch_size: int | None,
@@ -396,7 +397,7 @@ def get_buffer_view(
         the C API buffer view.
     """
     if not is_sparse(data):
-        return _get_uniform_buffer_view(data, schema, is_batch, batch_size)
+        return _get_uniform_buffer_view(cast(DenseBatchData, data), schema, is_batch, batch_size)
 
     if is_batch is not None and not is_batch:
         raise ValueError("Sparse data must be batch data")
@@ -463,13 +464,13 @@ def _create_sparse_buffer(properties: BufferProperties, schema: ComponentMetaDat
     Returns:
         A sparse buffer with the correct properties.
     """
-    data = _create_contents_buffer(
+    data: SingleComponentData = _create_contents_buffer(
         shape=properties.n_total_elements,
         dtype=schema.dtype,
         columns=properties.columns,
     )
-    indptr = np.array([0] * properties.batch_size + [properties.n_total_elements], dtype=IdxC)
-    return {"data": data, "indptr": indptr}
+    indptr: IndexPointer = np.array([0] * properties.batch_size + [properties.n_total_elements], dtype=IdxC)
+    return cast(SparseBatchData, {"data": data, "indptr": indptr})
 
 
 def _create_contents_buffer(shape, dtype, columns: list[AttributeType] | None) -> SingleComponentData | DenseBatchData:
diff --git a/src/power_grid_model/core/power_grid_dataset.py b/src/power_grid_model/core/power_grid_dataset.py
index 7be2a2ad3..ed180a736 100644
--- a/src/power_grid_model/core/power_grid_dataset.py
+++ b/src/power_grid_model/core/power_grid_dataset.py
@@ -513,6 +513,6 @@ def _get_filtered_attributes(
         return None
 
     if isinstance(component_data_filter, ComponentAttributeFilterOptions):
-        return list(schema.dtype.names)
+        return [] if schema.dtype.names is None else list(schema.dtype.names)
 
     return list(component_data_filter)
diff --git a/src/power_grid_model/utils.py b/src/power_grid_model/utils.py
index 706cadb8b..37b7112cc 100644
--- a/src/power_grid_model/utils.py
+++ b/src/power_grid_model/utils.py
@@ -37,7 +37,9 @@
     BatchComponentData,
     BatchDataset,
     Dataset,
+    DenseBatchArray,
     IndexPointer,
+    SingleComponentData,
     SingleDataset,
 )
 from power_grid_model.errors import PowerGridError, PowerGridSerializationError
@@ -69,7 +71,7 @@ def _get_dense_scenario(arr: np.ndarray) -> np.ndarray:
     def _get_sparse_scenario(arr: np.ndarray, indptr: IndexPointer) -> np.ndarray:
         return arr[indptr[scenario] : indptr[scenario + 1]]
 
-    def _get_component_scenario(component_scenarios: BatchComponentData) -> np.ndarray:
+    def _get_component_scenario(component_scenarios: BatchComponentData) -> SingleComponentData:
         data = _extract_data_from_component_data(component_scenarios)
 
         if is_sparse(component_scenarios):
@@ -83,7 +85,7 @@ def _get_component_scenario(component_scenarios: BatchComponentData) -> np.ndarr
 
         if is_columnar(component_scenarios):
             return {attribute: _get_dense_scenario(attribute_data) for attribute, attribute_data in data.items()}
-        return _get_dense_scenario(component_scenarios)
+        return _get_dense_scenario(cast_type(DenseBatchArray, component_scenarios))
 
     return {component: _get_component_scenario(component_data) for component, component_data in dataset.items()}
 

From 5b430120ee689727e93d672c2f6488fbc7e95795 Mon Sep 17 00:00:00 2001
From: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
Date: Tue, 1 Oct 2024 09:49:33 +0200
Subject: [PATCH 4/6] updated to 4.0.0

Signed-off-by: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
---
 .pre-commit-config.yaml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
index cf8178661..49a32f980 100644
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -4,7 +4,7 @@
 
 repos:
   - repo: https://github.com/fsfe/reuse-tool
-    rev: v3.0.2
+    rev: v4.0.0
     hooks:
       - id: reuse
   - repo: https://github.com/pycqa/isort

From 70476c98ae36e3ac2dc12b39d3b6f943e844068e Mon Sep 17 00:00:00 2001
From: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
Date: Tue, 1 Oct 2024 09:53:06 +0200
Subject: [PATCH 5/6] Missing header

Signed-off-by: Santiago Figueroa Manrique <santiago.figueroa.manrique@alliander.com>
---
 REUSE.toml | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/REUSE.toml b/REUSE.toml
index 7d759e9f0..1097f0db1 100644
--- a/REUSE.toml
+++ b/REUSE.toml
@@ -1,3 +1,7 @@
+# SPDX-FileCopyrightText: Contributors to the Power Grid Model project <powergridmodel@lfenergy.org>
+#
+# SPDX-License-Identifier: MPL-2.0
+
 version = 1
 SPDX-PackageName = "power-grid-model"
 SPDX-PackageSupplier = "Power Grid Model project <powergridmodel@lfenergy.org>"

From f85e8ed269e8df2a41696a8e860fe02376317172 Mon Sep 17 00:00:00 2001
From: Martijn Govers <Martijn.Govers@Alliander.com>
Date: Tue, 1 Oct 2024 10:04:57 +0200
Subject: [PATCH 6/6] fix scripts mypy

Signed-off-by: Martijn Govers <Martijn.Govers@Alliander.com>
---
 src/power_grid_model/core/power_grid_meta.py | 3 ++-
 src/power_grid_model/data_types.py           | 8 +++++---
 2 files changed, 7 insertions(+), 4 deletions(-)

diff --git a/src/power_grid_model/core/power_grid_meta.py b/src/power_grid_model/core/power_grid_meta.py
index 1e1fe5544..e2ecbaadd 100644
--- a/src/power_grid_model/core/power_grid_meta.py
+++ b/src/power_grid_model/core/power_grid_meta.py
@@ -21,6 +21,7 @@
     _str_to_datatype,
 )
 from power_grid_model.core.power_grid_core import AttributePtr, ComponentPtr, DatasetPtr, power_grid_core as pgc
+from power_grid_model.data_types import DenseBatchArray, SingleArray
 
 
 # constant enum for ctype
@@ -171,7 +172,7 @@ def initialize_array(
     component_type: ComponentTypeLike,
     shape: tuple | int,
     empty: bool = False,
-) -> np.ndarray:
+) -> SingleArray | DenseBatchArray:
     """
     Initializes an array for use in Power Grid Model calculations
 
diff --git a/src/power_grid_model/data_types.py b/src/power_grid_model/data_types.py
index 150b62d35..98bfdbd68 100644
--- a/src/power_grid_model/data_types.py
+++ b/src/power_grid_model/data_types.py
@@ -167,22 +167,25 @@ class SparseBatchColumnarData(TypedDict):
 Columnar data can be :class:`SingleColumnarData` or :class:`BatchColumnarData`.
 """
 
+_SingleComponentData = TypeVar("_SingleComponentData", SingleArray, SingleColumnarData)  # deduction helper
 SingleComponentData = SingleArray | SingleColumnarData
 """
 Single component data can be :class:`SingleArray` or :class:`SingleColumnarData`.
 """
 
+_BatchComponentData = TypeVar("_BatchComponentData", BatchArray, BatchColumnarData)  # deduction helper
 BatchComponentData = BatchArray | BatchColumnarData
 """
 Batch component data can be :class:`BatchArray` or :class:`BatchColumnarData`.
 """
 
+_ComponentData = TypeVar("_ComponentData", SingleComponentData, BatchComponentData)  # deduction helper
 ComponentData = DataArray | ColumnarData
 """
 Component data can be :class:`DataArray` or :class:`ColumnarData`.
 """
 
-SingleDataset = dict[ComponentTypeVar, SingleComponentData]
+SingleDataset = dict[ComponentTypeVar, _SingleComponentData]
 """
 A single dataset is a dictionary where the keys are the component types and the values are
 :class:`ComponentData`
@@ -190,7 +193,7 @@ class SparseBatchColumnarData(TypedDict):
 - Example: {"node": :class:`SingleArray`, "line": :class:`SingleColumnarData`}
 """
 
-BatchDataset = dict[ComponentTypeVar, BatchComponentData]
+BatchDataset = dict[ComponentTypeVar, _BatchComponentData]
 """
 A batch dataset is a dictionary where the keys are the component types and the values are :class:`BatchComponentData`
 
@@ -198,7 +201,6 @@ class SparseBatchColumnarData(TypedDict):
             "link": :class:`DenseBatchColumnarData`, "transformer": :class:`SparseBatchColumnarData`}
 """
 
-_ComponentData = TypeVar("_ComponentData", SingleComponentData, BatchComponentData)  # deduction helper
 Dataset = dict[ComponentTypeVar, _ComponentData]
 """
 A general data set can be a :class:`SingleDataset` or a :class:`BatchDataset`.