This is an automated email from the ASF dual-hosted git repository.
lzljs3620320 pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/paimon.git
The following commit(s) were added to refs/heads/master by this push:
new 610ab4a8d9 [hotfix] Remove useless codes for faiss and lucene
610ab4a8d9 is described below
commit 610ab4a8d9527193611e409bf62318dc23a409a7
Author: JingsongLi <[email protected]>
AuthorDate: Mon Mar 2 15:36:58 2026 +0800
[hotfix] Remove useless codes for faiss and lucene
---
.gitignore | 1 -
.../pypaimon/common/options/core_options.py | 111 ---------------------
paimon-python/pypaimon/index/index_file_meta.py | 2 +-
3 files changed, 1 insertion(+), 113 deletions(-)
diff --git a/.gitignore b/.gitignore
index ef892fae40..8b1d01ba8e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -9,7 +9,6 @@
*.iml
*.ipr
*.iws
-paimon-lucene/.idea/
paimon-python/.idea/
# VS Code
.vscode/
diff --git a/paimon-python/pypaimon/common/options/core_options.py b/paimon-python/pypaimon/common/options/core_options.py
index 103956d60e..33384316cf 100644
--- a/paimon-python/pypaimon/common/options/core_options.py
+++ b/paimon-python/pypaimon/common/options/core_options.py
@@ -350,84 +350,6 @@ class CoreOptions:
)
)
- # FAISS Vector Index options
- VECTOR_DIM: ConfigOption[int] = (
- ConfigOptions.key("vector.dim")
- .int_type()
- .default_value(128)
- .with_description("The dimension of the vector.")
- )
-
- VECTOR_METRIC: ConfigOption[str] = (
- ConfigOptions.key("vector.metric")
- .string_type()
- .default_value("L2")
- .with_description("The similarity metric for vector search (L2, INNER_PRODUCT).")
- )
-
- VECTOR_INDEX_TYPE: ConfigOption[str] = (
- ConfigOptions.key("vector.index-type")
- .string_type()
- .default_value("IVF_SQ8")
- .with_description("The type of FAISS index (FLAT, HNSW, IVF, IVF_PQ, IVF_SQ8).")
- )
-
- VECTOR_M: ConfigOption[int] = (
- ConfigOptions.key("vector.m")
- .int_type()
- .default_value(32)
- .with_description("Maximum connections per element in HNSW index.")
- )
-
- VECTOR_EF_CONSTRUCTION: ConfigOption[int] = (
- ConfigOptions.key("vector.ef-construction")
- .int_type()
- .default_value(40)
- .with_description("Size of dynamic candidate list during HNSW construction.")
- )
-
- VECTOR_EF_SEARCH: ConfigOption[int] = (
- ConfigOptions.key("vector.ef-search")
- .int_type()
- .default_value(16)
- .with_description("Size of dynamic candidate list during HNSW search.")
- )
-
- VECTOR_NLIST: ConfigOption[int] = (
- ConfigOptions.key("vector.nlist")
- .int_type()
- .default_value(100)
- .with_description("Number of inverted lists (clusters) for IVF index.")
- )
-
- VECTOR_NPROBE: ConfigOption[int] = (
- ConfigOptions.key("vector.nprobe")
- .int_type()
- .default_value(64)
- .with_description("Number of clusters to visit during IVF search.")
- )
-
- VECTOR_SIZE_PER_INDEX: ConfigOption[int] = (
- ConfigOptions.key("vector.size-per-index")
- .int_type()
- .default_value(2000000)
- .with_description("Size of vectors stored in each vector index file.")
- )
-
- VECTOR_SEARCH_FACTOR: ConfigOption[int] = (
- ConfigOptions.key("vector.search-factor")
- .int_type()
- .default_value(10)
- .with_description("Multiplier for search limit when filtering is applied.")
- )
-
- VECTOR_NORMALIZE: ConfigOption[bool] = (
- ConfigOptions.key("vector.normalize")
- .boolean_type()
- .default_value(False)
- .with_description("Whether to L2 normalize vectors for cosine similarity.")
- )
-
READ_BATCH_SIZE: ConfigOption[int] = (
ConfigOptions.key("read.batch-size")
.int_type()
@@ -591,38 +513,5 @@ class CoreOptions:
def global_index_thread_num(self) -> Optional[int]:
return self.options.get(CoreOptions.GLOBAL_INDEX_THREAD_NUM)
- def vector_dim(self, default=None):
- return self.options.get(CoreOptions.VECTOR_DIM, default)
-
- def vector_metric(self, default=None):
- return self.options.get(CoreOptions.VECTOR_METRIC, default)
-
- def vector_index_type(self, default=None):
- return self.options.get(CoreOptions.VECTOR_INDEX_TYPE, default)
-
- def vector_m(self, default=None):
- return self.options.get(CoreOptions.VECTOR_M, default)
-
- def vector_ef_construction(self, default=None):
- return self.options.get(CoreOptions.VECTOR_EF_CONSTRUCTION, default)
-
- def vector_ef_search(self, default=None):
- return self.options.get(CoreOptions.VECTOR_EF_SEARCH, default)
-
- def vector_nlist(self, default=None):
- return self.options.get(CoreOptions.VECTOR_NLIST, default)
-
- def vector_nprobe(self, default=None):
- return self.options.get(CoreOptions.VECTOR_NPROBE, default)
-
- def vector_size_per_index(self, default=None):
- return self.options.get(CoreOptions.VECTOR_SIZE_PER_INDEX, default)
-
- def vector_search_factor(self, default=None):
- return self.options.get(CoreOptions.VECTOR_SEARCH_FACTOR, default)
-
- def vector_normalize(self, default=None):
- return self.options.get(CoreOptions.VECTOR_NORMALIZE, default)
-
def read_batch_size(self, default=None) -> int:
return self.options.get(CoreOptions.READ_BATCH_SIZE, default or 1024)
diff --git a/paimon-python/pypaimon/index/index_file_meta.py b/paimon-python/pypaimon/index/index_file_meta.py
index 6726780a58..5ee6af521b 100644
--- a/paimon-python/pypaimon/index/index_file_meta.py
+++ b/paimon-python/pypaimon/index/index_file_meta.py
@@ -40,7 +40,7 @@ class IndexFileMeta:
dv_ranges: Optional[Dict[str, DeletionVectorMeta]] = field(default=None)
# External path for the index file (optional)
external_path: Optional[str] = None
- # For global index (e.g., FAISS vector index)
+ # For global index
global_index_meta: Optional[GlobalIndexMeta] = None
def __eq__(self, other):