zilliztech
diff --git a/‎.gitignore‎
Lines changed: 3 additions & 0 deletions b/‎.gitignore‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎README.md‎
Lines changed: 45 additions & 10 deletions b/‎README.md‎
Lines changed: 45 additions & 10 deletions
diff --git a/‎install/requirements_py3.11.txt‎
Lines changed: 2 additions & 1 deletion b/‎install/requirements_py3.11.txt‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎pyproject.toml‎
Lines changed: 5 additions & 34 deletions b/‎pyproject.toml‎
Lines changed: 5 additions & 34 deletions
diff --git a/‎tests/pytest.ini‎
Lines changed: 2 additions & 1 deletion b/‎tests/pytest.ini‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎tests/test_bench_runner.py‎
Lines changed: 2 additions & 1 deletion b/‎tests/test_bench_runner.py‎
Lines changed: 2 additions & 1 deletion
diff --git a/‎tests/test_concurrent_runner.py‎
Lines changed: 159 additions & 0 deletions b/‎tests/test_concurrent_runner.py‎
Lines changed: 159 additions & 0 deletions
@@ -13,6 +13,9 @@ venv/
 results/
 logs/
 
+# Worktrees
+.worktrees/
+
 # AI rules
 CLAUDE.md
 AGENTS.md
@@ -27,11 +27,6 @@ python >= 3.11
 pip install vectordb-bench
 ```
 
-**Install all database clients**
-
-``` shell
-pip install 'vectordb-bench[all]'
-```
 **Install the specific database client**
 
 ```shell
@@ -42,7 +37,6 @@ All the database client supported
 | Optional database client | install command                             |
 |--------------------------|---------------------------------------------|
 | pymilvus, zilliz_cloud (*default*)     | `pip install vectordb-bench`                |
-| all (*clients requirements might be conflict with each other*) | `pip install vectordb-bench[all]`           |
 | qdrant                   | `pip install vectordb-bench[qdrant]`        |
 | pinecone                 | `pip install vectordb-bench[pinecone]`      |
 | weaviate                 | `pip install vectordb-bench[weaviate]`      |
@@ -62,6 +56,7 @@ All the database client supported
 | hologres                 | `pip install vectordb-bench[hologres]`      |
 | tencent_es               | `pip install vectordb-bench[tencent_es]`    |
 | alisql                   | `pip install 'vectordb-bench[alisql]'`      |
+| polardb                  | `pip install vectordb-bench[polardb]`       |
 | doris                    | `pip install vectordb-bench[doris]`         |
 | zvec                     | `pip install vectordb-bench[zvec]`          |
 | endee                    | `pip install vectordb-bench[endee]`         |
@@ -225,7 +220,6 @@ Options:
 
   --ondisk                        Ondisk mode with binary quantization(32x compression)
   --oversample-factor             Controls the degree of oversampling applied to minority classes in imbalanced datasets to improve model performance by balancing class distributions.(default 1.0)
-  
 
   # Quantization Type
   --quantization-type TEXT        which type of quantization to use valid values [fp32, fp16, bq]
@@ -294,13 +288,13 @@ Options:
   # Connection
   --cloud-id TEXT                 Elastic Cloud ID  [required]
   --password TEXT                 Elastic Cloud password  [required]
-  
+
   # HNSW Index Parameters
   --m INTEGER                     HNSW M parameter  [default: 16]
   --ef-construction INTEGER       HNSW efConstruction parameter  [default: 100]
   --num-candidates INTEGER        Number of candidates for search  [default: 100]
   --element-type [float|byte]     Element type for vectors (float: 4 bytes, byte: 1 byte)  [default: float]
-  
+
   # Index Configuration
   --number-of-shards INTEGER      Number of shards  [default: 1]
   --number-of-replicas INTEGER    Number of replicas  [default: 0]
@@ -311,7 +305,7 @@ Options:
   --use-routing BOOLEAN           Whether to use routing  [default: False]
   --use-rescore BOOLEAN           Whether to use rescore  [default: False]
   --oversample-ratio FLOAT        Oversample ratio for rescore  [default: 2.0]
-  
+
   # Common Options
   --case-type [CapacityDim128|CapacityDim960|Performance768D100M|...]
                                   Case type
@@ -527,6 +521,47 @@ To list the options for Lindorm, execute `vectordbbench lindormhnsw --help`, The
   --ef-search INTEGER             hnsw ef-search  [required]
 ```
 
+### Run PolarDB from command line
+
+PolarDB supports the following index types: faiss_hnsw_flat, faiss_hnsw_pq, and faiss_hnsw_sq.
+
+**Example: Run faiss_hnsw_flat benchmark**
+
+```shell
+vectordbbench polardbhnswflat \
+  --case-type Performance768D1M \
+  --username <db_user> \
+  --password '<db_password>' \
+  --host <db_host> \
+  --port 3306 \
+  --m 16 \
+  --ef-construction 256 \
+  --ef-search 256 \
+  --insert-workers 64 \
+  --num-concurrency '10,20,40,60,80' \
+  --concurrency-duration 60 \
+  --task-label <task_label> \
+  --db-label <db_label> \
+  --skip-search-serial \
+  --post-load-index
+```
+
+To list the options for PolarDB, execute `vectordbbench polardbhnswflat --help`. The following are some PolarDB-specific command-line options.
+
+```text
+  --username TEXT                  Username  [required]
+  --password TEXT                  Password
+  --host TEXT                      Db host  [default: 127.0.0.1]
+  --port INTEGER                   Db Port  [default: 3306]
+  --database TEXT                  Database name  [default: vectordbbench]
+  --m INTEGER                      M parameter (max_degree) in HNSW
+  --ef-construction INTEGER        ef_construction parameter in HNSW
+  --ef-search INTEGER              polar_vector_index_hnsw_ef_search session variable
+  --insert-workers INTEGER         Number of concurrent threads for data insertion
+  --post-load-index / --inline-index
+                                   Create index after load or inline at table creation
+```
+
 #### Using a configuration file.
 
 The vectordbbench command can optionally read some or all the options from a yaml formatted configuration file.
 
@@ -26,5 +26,6 @@ pymilvus
 clickhouse_connect
 pyvespa
 mysql-connector-python
+PyMySQL
 packaging
-hdrhistogram>=0.10.1
+hdrhistogram>=0.10.1
@@ -39,9 +39,9 @@ dependencies = [
     "environs",
     "pydantic<v2",
     "scikit-learn",
-    "pymilvus", # with pandas, numpy, ujson
-    "ujson",
+    "pymilvus", # with pandas, numpy
     "hdrhistogram>=0.10.1",
+    "ujson",
 ]
 dynamic = ["version"]
 
@@ -51,37 +51,7 @@ test = [
     "ruff",
     "pytest",
 ]
-restful = [ "flask" ]
-
-all = [
-    "grpcio==1.53.0", # for qdrant-client and pymilvus
-    "grpcio-tools==1.53.0", # for qdrant-client and pymilvus
-    "qdrant-client",
-    "pinecone",
-    "weaviate-client",
-    "elasticsearch",
-    "sqlalchemy",
-    "redis",
-    "chromadb",
-    "pgvector",
-    "psycopg",
-    "psycopg-binary",
-    "pgvecto_rs[psycopg3]>=0.2.2",
-    "opensearch-dsl",
-    "opensearch-py",
-    "memorydb",
-    "alibabacloud_ha3engine_vector",
-    "mariadb",
-    "PyMySQL",
-    "clickhouse-connect",
-    "pyvespa",
-    "lancedb",
-    "mysql-connector-python",
-    "turbopuffer[fast]",
-    'zvec',
-    "endee==0.1.10", # compatible with pydantic<2
-]
-
+restful         = [ "flask" ]
 qdrant          = [ "qdrant-client" ]
 pinecone        = [ "pinecone" ]
 weaviate        = [ "weaviate-client" ]
@@ -106,6 +76,7 @@ vespa           = [ "pyvespa" ]
 lancedb         = [ "lancedb" ]
 oceanbase       = [ "mysql-connector-python" ]
 alisql          = [ "mysql-connector-python" ]
+polardb         = [ "PyMySQL" ]
 doris           = [ "doris-vector-search" ]
 turbopuffer     = [ "turbopuffer" ]
 zvec            = [ "zvec" ]
@@ -156,7 +127,7 @@ lint.ignore = [
     "INP001", # TODO
     "TID252", # TODO
     "N801", "N802", "N815",
-    "S101", "S108", "S603", "S311",
+    "S101", "S108", "S603", "S311", "S608",
     "PLR2004",
     "RUF017",
     "C416",
 
@@ -1,4 +1,5 @@
 [pytest]
 
-filterwarnings = 
+filterwarnings =
     ignore::UserWarning
+    ignore::DeprecationWarning
@@ -1,5 +1,7 @@
 import time
 import logging
+
+import ujson
 from vectordb_bench.interface import BenchMarkRunner
 from vectordb_bench.models import (
     DB, IndexType, CaseType, TaskConfig, CaseConfig,
@@ -55,6 +57,5 @@ def test_performance_case_no_error(self):
         d = t.json(exclude={'db_config': {'password', 'api_key'}})
         log.info(f"{d}")
 
-        import ujson
         loads = ujson.loads(d)
         log.info(f"{loads}")
@@ -0,0 +1,159 @@
+"""Tests for ConcurrentInsertRunner against a running Milvus instance.
+
+Includes:
+  - Correctness tests (threading & async backends)
+  - Parameterized benchmark: serial vs concurrent across (batch_size, workers) matrix
+
+NUM_PER_BATCH is set via os.environ before each run. Since runners execute
+task() in a spawn subprocess that re-imports config, the env var takes effect.
+
+Requires:
+  - Milvus running at localhost:19530
+  - Network access to download OpenAI 50K dataset
+
+Usage:
+  pytest tests/test_concurrent_runner.py -v -s     # correctness tests only
+  python tests/test_concurrent_runner.py             # full benchmark matrix
+"""
+
+# ruff: noqa: T201
+
+from __future__ import annotations
+
+import logging
+import os
+import time
+
+from vectordb_bench.backend.clients import DB
+from vectordb_bench.backend.clients.milvus.config import FLATConfig
+from vectordb_bench.backend.dataset import Dataset, DatasetSource
+from vectordb_bench.backend.runner.concurrent_runner import ConcurrentInsertRunner, ExecutorBackend
+from vectordb_bench.backend.runner.serial_runner import SerialInsertRunner
+
+# Fetch the "vectordb_bench" logger and set its level to INFO.
+log = logging.getLogger("vectordb_bench")
+log.setLevel(logging.INFO)
+
+# Size passed to Dataset.OPENAI.manager() and the row count each insert test asserts on.
+DATASET_SIZE = 50_000
+
+
+# ── Shared helpers ──────────────────────────────────────────────────────
+
+
+def get_milvus_db(collection_name: str):
+    """Build a Milvus client bound to ``collection_name``.
+
+    The client is created through ``DB.Milvus.init_cls`` with ``dim=1536``, the
+    local ``http://localhost:19530`` URI with empty credentials, a
+    ``FLATConfig`` using the COSINE metric, and ``drop_old=True``.
+    """
+    milvus_factory = DB.Milvus.init_cls
+    connection = {"uri": "http://localhost:19530", "user": "", "password": ""}
+    index_config = FLATConfig(metric_type="COSINE")
+    return milvus_factory(
+        dim=1536,
+        db_config=connection,
+        db_case_config=index_config,
+        collection_name=collection_name,
+        drop_old=True,
+    )
+
+
+def prepare_dataset():
+    """Return the OpenAI dataset manager for ``DATASET_SIZE`` after calling ``prepare``.
+
+    ``prepare`` is invoked with ``DatasetSource.AliyunOSS`` as its source.
+    """
+    manager = Dataset.OPENAI.manager(DATASET_SIZE)
+    manager.prepare(DatasetSource.AliyunOSS)
+    return manager
+
+
+def set_batch_size(batch_size: int) -> None:
+    """Export ``batch_size`` as the ``NUM_PER_BATCH`` environment variable."""
+    os.environ.update(NUM_PER_BATCH=str(batch_size))
+
+
+def timed_run(runner: SerialInsertRunner | ConcurrentInsertRunner) -> tuple[int, float]:
+    """Call ``runner.run()`` and return ``(count, elapsed_seconds)``.
+
+    Elapsed time is measured with ``time.perf_counter`` around the single
+    ``run()`` call.
+    """
+    began = time.perf_counter()
+    inserted = runner.run()
+    elapsed = time.perf_counter() - began
+    return inserted, elapsed
+
+
+# ── Correctness tests (pytest) ──────────────────────────────────────────
+
+
+def test_concurrent_insert_threading():
+    """The THREADING backend with 4 workers must report ``DATASET_SIZE`` from ``run()``."""
+    milvus = get_milvus_db("test_conc_threading")
+    dataset = prepare_dataset()
+    inserted = ConcurrentInsertRunner(
+        db=milvus,
+        dataset=dataset,
+        normalize=False,
+        max_workers=4,
+        backend=ExecutorBackend.THREADING,
+    ).run()
+    assert inserted == DATASET_SIZE, f"Expected {DATASET_SIZE}, got {inserted}"
+
+
+def test_concurrent_insert_async():
+    """The ASYNC backend with 4 workers must report ``DATASET_SIZE`` from ``run()``."""
+    milvus = get_milvus_db("test_conc_async")
+    dataset = prepare_dataset()
+    inserted = ConcurrentInsertRunner(
+        db=milvus,
+        dataset=dataset,
+        normalize=False,
+        max_workers=4,
+        backend=ExecutorBackend.ASYNC,
+    ).run()
+    assert inserted == DATASET_SIZE, f"Expected {DATASET_SIZE}, got {inserted}"
+
+
+# ── Parameterized benchmark ────────────────────────────────────────────
+
+
+def run_serial(batch_size: int) -> tuple[int, float]:
+    """Time one ``SerialInsertRunner`` pass with ``NUM_PER_BATCH`` set to ``batch_size``.
+
+    Returns the ``(count, elapsed_seconds)`` pair produced by ``timed_run``.
+    """
+    set_batch_size(batch_size)
+    target_db = get_milvus_db(f"bench_serial_b{batch_size}")
+    dataset = prepare_dataset()
+    serial_runner = SerialInsertRunner(db=target_db, dataset=dataset, normalize=False)
+    return timed_run(serial_runner)
+
+
+def run_concurrent(batch_size: int, workers: int) -> tuple[int, float]:
+    """Time one threaded ``ConcurrentInsertRunner`` pass.
+
+    ``NUM_PER_BATCH`` is set to ``batch_size`` first and ``workers`` is passed
+    as ``max_workers``. Returns the ``(count, elapsed_seconds)`` pair produced
+    by ``timed_run``.
+    """
+    set_batch_size(batch_size)
+    target_db = get_milvus_db(f"bench_conc_b{batch_size}_w{workers}")
+    dataset = prepare_dataset()
+    concurrent_runner = ConcurrentInsertRunner(
+        db=target_db,
+        dataset=dataset,
+        normalize=False,
+        max_workers=workers,
+        backend=ExecutorBackend.THREADING,
+    )
+    return timed_run(concurrent_runner)
+
+
+def bench_matrix():
+    """Print a serial-vs-concurrent insert timing table.
+
+    For each batch size the serial runner is timed once and the threaded
+    concurrent runner once per worker count. Every row shows the batch size,
+    ``DATASET_SIZE // batch_size``, the durations in seconds and the
+    ``serial / concurrent`` speedup per worker count.
+
+    ``NUM_PER_BATCH`` is set back to 100 when the matrix ends, including when
+    one of the runs raises.
+    """
+    batch_sizes = [100, 500, 1000, 5000]
+    worker_counts = [1, 2, 4, 8]
+
+    conc_headers = [f"conc({w}w)" for w in worker_counts]
+    speedup_headers = [f"speedup({w}w)" for w in worker_counts]
+    header = f"{'Batch':>6} {'#Bat':>5} {'serial':>8}"
+    header += "".join(f" {h:>10}" for h in conc_headers)
+    header += "".join(f" {h:>12}" for h in speedup_headers)
+    print(f"\n{header}")
+    # Size the rule from the header itself so it always spans the full table;
+    # a hand-computed width previously left it shorter than the rows.
+    print("-" * len(header))
+
+    try:
+        for bs in batch_sizes:
+            n_batches = DATASET_SIZE // bs
+            _, dur_s = run_serial(bs)
+            # Only the duration (second element) of each concurrent run is reported.
+            conc_durs = [run_concurrent(bs, w)[1] for w in worker_counts]
+
+            row = f"{bs:>6} {n_batches:>5} {dur_s:>7.2f}s"
+            row += "".join(f" {dur_c:>9.2f}s" for dur_c in conc_durs)
+            row += "".join(f" {dur_s / dur_c:>11.2f}x" for dur_c in conc_durs)
+            print(row)
+    finally:
+        # restore default, even when a run fails part-way through the matrix
+        set_batch_size(100)
+
+
+# Executing this file as a script runs the full benchmark matrix.
+if __name__ == "__main__":
+    bench_matrix()