Query-farm
diff --git a/pyproject.toml b/pyproject.toml
Lines changed: 1 addition & 1 deletion
diff --git a/tests/test_filter_pushdown_extension.py b/tests/test_filter_pushdown_extension.py
Lines changed: 24 additions & 6 deletions
diff --git a/uv.lock b/uv.lock
Lines changed: 1 addition & 1 deletion
diff --git a/vgi/_test_fixtures/aggregate/window.py b/vgi/_test_fixtures/aggregate/window.py
Lines changed: 4 additions & 2 deletions
diff --git a/vgi/_test_fixtures/simple_writable.py b/vgi/_test_fixtures/simple_writable.py
Lines changed: 6 additions & 5 deletions
diff --git a/vgi/_test_fixtures/table/partition_columns.py b/vgi/_test_fixtures/table/partition_columns.py
Lines changed: 5 additions & 3 deletions
diff --git a/vgi/aggregate_function.py b/vgi/aggregate_function.py
Lines changed: 1 addition & 1 deletion
diff --git a/vgi/client/cli_catalog.py b/vgi/client/cli_catalog.py
Lines changed: 2 additions & 1 deletion
diff --git a/vgi/client/cli_schema.py b/vgi/client/cli_schema.py
Lines changed: 10 additions & 5 deletions
@@ -1,6 +1,6 @@
 [project]
 name = "vgi"
-version = "0.7.4"
+version = "0.8.0"
 description = "Vector Gateway Interface - Connect DuckDB to external programs via Apache Arrow"
 readme = "README.md"
 requires-python = ">=3.13"
 
@@ -51,6 +51,7 @@ class TestBoolColumnBool8Literal:
     """
 
     def test_eq_true(self) -> None:
+        """EQ against a bool8 literal matches the plain-bool column."""
         batch = _batch_with_bool("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -62,6 +63,7 @@ def test_eq_true(self) -> None:
         assert result.to_pylist() == [True, False, None, True]
 
     def test_eq_false(self) -> None:
+        """EQ against a false bool8 literal."""
         batch = _batch_with_bool("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -72,6 +74,7 @@ def test_eq_false(self) -> None:
         assert f.evaluate(batch).to_pylist() == [False, True, None, False]
 
     def test_ne_true(self) -> None:
+        """NE against a bool8 literal."""
         batch = _batch_with_bool("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -95,6 +98,7 @@ class TestBool8ColumnBool8Literal:
     """
 
     def test_eq_true(self) -> None:
+        """EQ with bool8 on both sides of the kernel."""
         batch = _batch_with_bool8("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -105,6 +109,7 @@ def test_eq_true(self) -> None:
         assert f.evaluate(batch).to_pylist() == [True, False, None, True]
 
     def test_eq_false(self) -> None:
+        """EQ against a false literal with bool8 on both sides."""
         batch = _batch_with_bool8("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -128,11 +133,13 @@ class TestPlainTypesUnchanged:
     """
 
     def test_int32_eq(self) -> None:
+        """Plain int32 EQ flows through normalisation unchanged."""
         batch = pa.RecordBatch.from_pydict({"n": pa.array([1, 2, 3, 4], type=pa.int32())})
         f = ConstantFilter(column_name="n", column_index=0, op=ComparisonOp.EQ, value=pa.scalar(2, type=pa.int32()))
         assert f.evaluate(batch).to_pylist() == [False, True, False, False]
 
     def test_string_eq(self) -> None:
+        """Plain string EQ flows through normalisation unchanged."""
         batch = pa.RecordBatch.from_pydict({"s": ["a", "b", "c"]})
         f = ConstantFilter(column_name="s", column_index=0, op=ComparisonOp.EQ, value=pa.scalar("b"))
         assert f.evaluate(batch).to_pylist() == [False, True, False]
@@ -158,6 +165,7 @@ class TestInFilterExtension:
     """
 
     def test_in_bool_with_bool8_values(self) -> None:
+        """IN with bool8 values against a plain-bool column."""
         batch = _batch_with_bool("flag", [True, False, None, True])
         # Build the values array as a bool8 extension array
         storage = pa.array([1], type=pa.int8())
@@ -173,11 +181,14 @@ def test_in_bool_with_bool8_values(self) -> None:
 
 
 class TestPlainLiteralBool8Column:
-    """Defensive: if some future code path emits a plain bool literal but
-    the column happens to be bool8, normalisation should still align them.
+    """Defensive symmetry check: plain bool literal against a bool8 column.
+
+    If some future code path emits a plain bool literal but the column
+    happens to be bool8, normalisation should still align them.
     """
 
     def test_plain_bool_literal_bool8_column(self) -> None:
+        """Plain bool literal against a bool8 column."""
         batch = _batch_with_bool8("flag", [True, False, None, True])
         f = ConstantFilter(
             column_name="flag",
@@ -197,8 +208,10 @@ def test_plain_bool_literal_bool8_column(self) -> None:
 
 
 def test_pyarrow_kernel_gap_still_present() -> None:
-    """Documents the underlying PyArrow gap. If this passes in a future
-    PyArrow release the normalisation helper is over-defensive but harmless.
+    """Document the underlying PyArrow gap.
+
+    If this passes in a future PyArrow release the normalisation helper
+    is over-defensive but harmless.
     """
     import pyarrow.compute as pc
 
@@ -245,6 +258,7 @@ class TestUuidExtension:
     ]
 
     def test_eq(self) -> None:
+        """EQ with arrow.uuid on both sides."""
         batch = pa.RecordBatch.from_arrays([_uuid_array(self.UUIDS)], names=["id"])
         f = ConstantFilter(
             column_name="id",
@@ -255,6 +269,7 @@ def test_eq(self) -> None:
         assert f.evaluate(batch).to_pylist() == [False, True, None, False]
 
     def test_ne(self) -> None:
+        """NE with arrow.uuid on both sides."""
         batch = pa.RecordBatch.from_arrays([_uuid_array(self.UUIDS)], names=["id"])
         f = ConstantFilter(
             column_name="id",
@@ -265,6 +280,7 @@ def test_ne(self) -> None:
         assert f.evaluate(batch).to_pylist() == [True, False, None, True]
 
     def test_in(self) -> None:
+        """IN with an arrow.uuid values array."""
         batch = pa.RecordBatch.from_arrays([_uuid_array(self.UUIDS)], names=["id"])
         values = _uuid_array(
             [
@@ -282,8 +298,10 @@ def test_in(self) -> None:
 
 
 def test_pyarrow_interval_kernel_gap() -> None:
-    """PyArrow has no ``equal`` kernel for any of the interval types
-    (``month_day_nano_interval``, ``day_time_interval``, ``month_interval``).
+    """PyArrow has no ``equal`` kernel for any interval type.
+
+    The affected types are ``month_day_nano_interval``,
+    ``day_time_interval``, and ``month_interval``.
 
     This means a filter pushdown like ``WHERE col = INTERVAL '1 day'``
     cannot be evaluated on the worker side regardless of whether we strip
 
@@ -273,8 +273,10 @@ def window(
 
 
 class WindowSumBatchFunction(AggregateFunction[SumState]):
-    """Windowed running-sum that overrides ``window_batch`` to return a
-    pre-built ``pa.Array`` rather than a Python list.
+    """Windowed running-sum returning a pre-built ``pa.Array``.
+
+    Overrides ``window_batch`` to return a pre-built ``pa.Array`` rather
+    than a Python list.
 
     Functionally equivalent to :class:`WindowSumFunction`. The point of this
     fixture is to exercise the framework's polymorphic batch return: when
 
@@ -476,11 +476,12 @@ def process(
 
 
 class BrokenReturningInsert(TableInOutGenerator[None, None]):
-    """Misbehaving INSERT handler: claims RETURNING support but always emits a
-    (count BIGINT) batch — same shape that triggered the original SIGSEGV in
-    the kafka worker. Used to verify the C++ extension's runtime schema
-    validator throws a clean IOException instead of crashing inside
-    ArrowToDuckDB.
+    """Misbehaving INSERT handler that lies about its RETURNING support.
+
+    Claims RETURNING support but always emits a (count BIGINT) batch —
+    same shape that triggered the original SIGSEGV in the kafka worker.
+    Used to verify the C++ extension's runtime schema validator throws a
+    clean IOException instead of crashing inside ArrowToDuckDB.
     """
 
     class Meta:
 
@@ -75,9 +75,11 @@ class _CountryPartitionedArgs:
 
 @dataclass(kw_only=True)
 class _CountryPartitionedState(ArrowSerializableDataclass):
-    """Per-worker cursor. ``current_country`` is set after the worker
-    pops a queue item; ``current_idx`` advances through emitted rows
-    until the per-country quota is reached, then it pops the next item.
+    """Per-worker cursor over countries.
+
+    ``current_country`` is set after the worker pops a queue item;
+    ``current_idx`` advances through emitted rows until the per-country
+    quota is reached, then it pops the next item.
     """
 
     current_country: str | None = None
 
@@ -420,7 +420,7 @@ def window_prepare(
         window_state: Any,
         params: ProcessParams[Any],
     ) -> Any:
-        """Optional hook: derive per-partition state for the window() loop.
+        """Derive per-partition state for the window() loop (optional hook).
 
         Called once per partition, after ``window_init`` (or after the state
         is rehydrated from storage on a cold reload), before any
 
@@ -160,7 +160,8 @@ def catalog_version(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
     version = client.catalog_version(
 
@@ -53,7 +53,8 @@ def schema_list(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
     for schema_info in client.schemas(
@@ -92,7 +93,8 @@ def schema_get(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
     schema_info = client.schema_get(
@@ -139,7 +141,8 @@ def schema_create(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
     tags_dict = parse_json_option(tags, "--tags")
@@ -186,7 +189,8 @@ def schema_drop(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
     client.schema_drop(
@@ -238,7 +242,8 @@ def schema_contents(
     )
     if is_stateful and catalog_name:
         click.echo(
-            "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",
+            "Warning: Using --catalog with a stateful catalog. "
+            "Consider using --attach-opaque-data for session persistence.",
             err=True,
         )
Original file line number	Diff line number	Diff line change
`@@ -160,7 +160,8 @@ def catalog_version(`
`160`	`160`	`)`
`161`	`161`	`if is_stateful and catalog_name:`
`162`	`162`	`click.echo(`
`163`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`163`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`164`	`+ "Consider using --attach-opaque-data for session persistence.",`
`164`	`165`	`err=True,`
`165`	`166`	`)`
`166`	`167`	`version = client.catalog_version(`
Original file line number	Diff line number	Diff line change
`@@ -53,7 +53,8 @@ def schema_list(`
`53`	`53`	`)`
`54`	`54`	`if is_stateful and catalog_name:`
`55`	`55`	`click.echo(`
`56`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`56`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`57`	`+ "Consider using --attach-opaque-data for session persistence.",`
`57`	`58`	`err=True,`
`58`	`59`	`)`
`59`	`60`	`for schema_info in client.schemas(`
`@@ -92,7 +93,8 @@ def schema_get(`
`92`	`93`	`)`
`93`	`94`	`if is_stateful and catalog_name:`
`94`	`95`	`click.echo(`
`95`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`96`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`97`	`+ "Consider using --attach-opaque-data for session persistence.",`
`96`	`98`	`err=True,`
`97`	`99`	`)`
`98`	`100`	`schema_info = client.schema_get(`
`@@ -139,7 +141,8 @@ def schema_create(`
`139`	`141`	`)`
`140`	`142`	`if is_stateful and catalog_name:`
`141`	`143`	`click.echo(`
`142`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`144`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`145`	`+ "Consider using --attach-opaque-data for session persistence.",`
`143`	`146`	`err=True,`
`144`	`147`	`)`
`145`	`148`	`tags_dict = parse_json_option(tags, "--tags")`
`@@ -186,7 +189,8 @@ def schema_drop(`
`186`	`189`	`)`
`187`	`190`	`if is_stateful and catalog_name:`
`188`	`191`	`click.echo(`
`189`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`192`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`193`	`+ "Consider using --attach-opaque-data for session persistence.",`
`190`	`194`	`err=True,`
`191`	`195`	`)`
`192`	`196`	`client.schema_drop(`
`@@ -238,7 +242,8 @@ def schema_contents(`
`238`	`242`	`)`
`239`	`243`	`if is_stateful and catalog_name:`
`240`	`244`	`click.echo(`
`241`		`- "Warning: Using --catalog with a stateful catalog. Consider using --attach-opaque-data for session persistence.",`
	`245`	`+ "Warning: Using --catalog with a stateful catalog. "`
	`246`	`+ "Consider using --attach-opaque-data for session persistence.",`
`242`	`247`	`err=True,`
`243`	`248`	`)`
`244`	`249`