iiasa · meksor · Feb 29, 2024 · Feb 29, 2024 · Feb 29, 2024 · Feb 29, 2024
diff --git a/.github/workflows/pytest.yaml b/.github/workflows/pytest.yaml
@@ -8,10 +8,14 @@ jobs:
     strategy:
       matrix:
         python-version:
-        - "3.10"  # Earliest version supported by ixmp4
-        - "3.11"
-        - "3.12"  # Latest version supported by ixmp4
-
+          - "3.10" # Earliest version supported by ixmp4
+          - "3.11"
+          - "3.12" # Latest version supported by ixmp4
+        with-pyarrow:
+          - false
+        include:
+          - python-version: "3.12"
+            with-pyarrow: true
     runs-on: ubuntu-latest
     services:
       postgres:
@@ -65,6 +69,10 @@ jobs:
       #----------------------------------------------
       # install your root project, if required
       #----------------------------------------------
+      - name: Install PyArrow
+        if: ${{ matrix.with-pyarrow }}
+        run: pip install pyarrow
+
       - name: Install library
         run: poetry install --no-interaction
       #----------------------------------------------

diff --git a/ixmp4/data/db/base.py b/ixmp4/data/db/base.py
@@ -391,7 +391,14 @@ def bulk_upsert_chunk(self, df: pd.DataFrame) -> None:
             for col in self.model_class.updateable_columns:
                 updated_col = col + self.merge_suffix
                 if updated_col in df.columns:
-                    cond.append(df[col] != df[updated_col])
+                    # coerce to same type so the inequality
+                    # operation works with pyarrow installed
+                    df[updated_col] = df[updated_col].astype(df[col].dtype)
+                    are_not_equal = df[col] != df[updated_col]
+                    # NA-aware: NA vs NA is equal, NA vs a value differs
+                    old_na, new_na = pd.isna(df[col]), pd.isna(df[updated_col])
+                    both_present = ~(old_na | new_na)
+                    cond.append((old_na ^ new_na) | (are_not_equal & both_present))
 
             df["differs"] = np.where(np.logical_or.reduce(cond), True, False)