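Rename Lucene vector index classes with a "Lucene" prefix and change the indexer identifier to "lucene-vector-knn"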

jerry-024 · jerry-024 · commit d68e04838f0e · 2025-12-11T18:13:34.000+08:00
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneByteVectorIndex.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneByteVectorIndex.java
@@ -22,12 +22,12 @@
 import org.apache.lucene.index.IndexableField;
 import org.apache.lucene.index.VectorSimilarityFunction;
 
-/** Vector index for byte vector. */
-public class ByteVectorIndex extends VectorIndex<byte[]> {
+/** Lucene vector index for byte vector. */
+public class LuceneByteVectorIndex extends LuceneVectorIndex<byte[]> {
     private final long rowId;
     private final byte[] vector;
 
-    public ByteVectorIndex(long rowId, byte[] vector) {
+    public LuceneByteVectorIndex(long rowId, byte[] vector) {
         this.rowId = rowId;
         this.vector = vector;
     }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneFloatVectorIndex.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneFloatVectorIndex.java
@@ -22,12 +22,12 @@
 import org.apache.lucene.index.IndexableField;
 import org.apache.lucene.index.VectorSimilarityFunction;
 
-/** Vector index for float vector. */
-public class FloatVectorIndex extends VectorIndex<float[]> {
+/** Lucene vector index for float vector. */
+public class LuceneFloatVectorIndex extends LuceneVectorIndex<float[]> {
     private final long rowId;
     private final float[] vector;
 
-    public FloatVectorIndex(long rowId, float[] vector) {
+    public LuceneFloatVectorIndex(long rowId, float[] vector) {
         this.rowId = rowId;
         this.vector = vector;
     }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneIndexMMapDirectory.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneIndexMMapDirectory.java
@@ -34,15 +34,15 @@
 import java.nio.file.Path;
 import java.util.UUID;
 
-/** A wrapper of MMapDirectory for vector index. */
-public class IndexMMapDirectory implements AutoCloseable {
+/** A wrapper of Lucene MMapDirectory for vector index. */
+public class LuceneIndexMMapDirectory implements AutoCloseable {
 
     private static final int VERSION = 1;
 
     private final Path path;
     private final MMapDirectory mmapDirectory;
 
-    public IndexMMapDirectory() throws IOException {
+    public LuceneIndexMMapDirectory() throws IOException {
         this.path = Files.createTempDirectory("paimon-lucene-" + UUID.randomUUID());
         this.mmapDirectory = new MMapDirectory(path);
     }
@@ -93,8 +93,8 @@ public void serialize(OutputStream out) throws IOException {
         }
     }
 
-    public static IndexMMapDirectory deserialize(SeekableInputStream in) throws IOException {
-        IndexMMapDirectory indexMMapDirectory = new IndexMMapDirectory();
+    public static LuceneIndexMMapDirectory deserialize(SeekableInputStream in) throws IOException {
+        LuceneIndexMMapDirectory luceneIndexMMapDirectory = new LuceneIndexMMapDirectory();
         try {
             DataInputStream dataInputStream = new DataInputStream(in);
             int version = dataInputStream.readInt();
@@ -110,7 +110,9 @@ public static IndexMMapDirectory deserialize(SeekableInputStream in) throws IOEx
                 String fileName = new String(nameBytes, StandardCharsets.UTF_8);
                 long fileLength = dataInputStream.readLong();
                 try (IndexOutput output =
-                        indexMMapDirectory.directory().createOutput(fileName, IOContext.READONCE)) {
+                        luceneIndexMMapDirectory
+                                .directory()
+                                .createOutput(fileName, IOContext.READONCE)) {
                     long remaining = fileLength;
                     while (remaining > 0) {
                         int toRead = (int) Math.min(buffer.length, remaining);
@@ -120,10 +122,10 @@ public static IndexMMapDirectory deserialize(SeekableInputStream in) throws IOEx
                     }
                 }
             }
-            return indexMMapDirectory;
+            return luceneIndexMMapDirectory;
         } catch (Exception e) {
             try {
-                indexMMapDirectory.close();
+                luceneIndexMMapDirectory.close();
             } catch (Exception ignored) {
             }
             if (e instanceof IOException) {
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexReader.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexReader.java
@@ -50,13 +50,13 @@
  * <p>This implementation uses Lucene's native KnnFloatVectorQuery with HNSW graph for efficient
  * approximate nearest neighbor search.
  */
-public class VectorGlobalIndexReader implements GlobalIndexReader {
+public class LuceneVectorGlobalIndexReader implements GlobalIndexReader {
 
     private final List<IndexSearcher> searchers;
-    private final List<IndexMMapDirectory> directories;
+    private final List<LuceneIndexMMapDirectory> directories;
     private final List<GlobalIndexIOMeta> ioMetas;
 
-    public VectorGlobalIndexReader(
+    public LuceneVectorGlobalIndexReader(
             GlobalIndexFileReader fileReader, List<GlobalIndexIOMeta> ioMetas) throws IOException {
         this.ioMetas = ioMetas;
         this.searchers = new ArrayList<>();
@@ -72,12 +72,14 @@ public VectorGlobalIndexReader(
      * @return global index result containing row IDs
      */
     public GlobalIndexResult search(float[] query, int k) {
-        KnnFloatVectorQuery knnQuery = new KnnFloatVectorQuery(VectorIndex.VECTOR_FIELD, query, k);
+        KnnFloatVectorQuery knnQuery =
+                new KnnFloatVectorQuery(LuceneVectorIndex.VECTOR_FIELD, query, k);
         return search(knnQuery, k);
     }
 
     public GlobalIndexResult search(byte[] query, int k) {
-        KnnByteVectorQuery knnQuery = new KnnByteVectorQuery(VectorIndex.VECTOR_FIELD, query, k);
+        KnnByteVectorQuery knnQuery =
+                new KnnByteVectorQuery(LuceneVectorIndex.VECTOR_FIELD, query, k);
         return search(knnQuery, k);
     }
 
@@ -100,7 +102,7 @@ public void close() throws IOException {
         searchers.clear();
 
         // Close directories
-        for (IndexMMapDirectory directory : directories) {
+        for (LuceneIndexMMapDirectory directory : directories) {
             try {
                 directory.close();
             } catch (Throwable t) {
@@ -132,10 +134,11 @@ private GlobalIndexResult search(Query query, int k) {
             try {
                 TopDocs topDocs = searcher.search(query, k);
                 StoredFields storedFields = searcher.storedFields();
-                Set<String> fieldsToLoad = Set.of(VectorIndex.ROW_ID_FIELD);
+                Set<String> fieldsToLoad = Set.of(LuceneVectorIndex.ROW_ID_FIELD);
                 for (org.apache.lucene.search.ScoreDoc scoreDoc : topDocs.scoreDocs) {
                     Document doc = storedFields.document(scoreDoc.doc, fieldsToLoad);
-                    long rowId = doc.getField(VectorIndex.ROW_ID_FIELD).numericValue().longValue();
+                    long rowId =
+                            doc.getField(LuceneVectorIndex.ROW_ID_FIELD).numericValue().longValue();
                     if (topK.size() < k) {
                         topK.offer(new ScoredRow(rowId, scoreDoc.score));
                     } else {
@@ -171,11 +174,11 @@ private void loadIndices(GlobalIndexFileReader fileReader, List<GlobalIndexIOMet
             throws IOException {
         for (GlobalIndexIOMeta meta : files) {
             try (SeekableInputStream in = fileReader.getInputStream(meta.fileName())) {
-                IndexMMapDirectory directory = null;
+                LuceneIndexMMapDirectory directory = null;
                 IndexReader reader = null;
                 boolean success = false;
                 try {
-                    directory = IndexMMapDirectory.deserialize(in);
+                    directory = LuceneIndexMMapDirectory.deserialize(in);
                     reader = DirectoryReader.open(directory.directory());
                     IndexSearcher searcher = new IndexSearcher(reader);
                     directories.add(directory);
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexWriter.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexWriter.java
@@ -44,33 +44,33 @@
  * <p>This implementation uses Lucene's native KnnFloatVectorField with HNSW algorithm for efficient
  * approximate nearest neighbor search.
  */
-public class VectorGlobalIndexWriter implements GlobalIndexWriter {
+public class LuceneVectorGlobalIndexWriter implements GlobalIndexWriter {
 
     private final GlobalIndexFileWriter fileWriter;
-    private final VectorIndexOptions vectorOptions;
+    private final LuceneVectorIndexOptions vectorOptions;
     private final VectorSimilarityFunction similarityFunction;
     private final int sizePerIndex;
-    private final VectorIndexFactory vectorIndexFactory;
+    private final LuceneVectorIndexFactory vectorIndexFactory;
 
     private long count = 0;
-    private final List<VectorIndex> vectorIndices;
+    private final List<LuceneVectorIndex> vectorIndices;
     private final List<ResultEntry> results;
 
-    public VectorGlobalIndexWriter(
+    public LuceneVectorGlobalIndexWriter(
             GlobalIndexFileWriter fileWriter, DataType fieldType, Options options) {
-        this.vectorIndexFactory = VectorIndexFactory.init(fieldType);
+        this.vectorIndexFactory = LuceneVectorIndexFactory.init(fieldType);
         this.fileWriter = fileWriter;
         this.vectorIndices = new ArrayList<>();
         this.results = new ArrayList<>();
-        this.vectorOptions = new VectorIndexOptions(options);
+        this.vectorOptions = new LuceneVectorIndexOptions(options);
         this.similarityFunction = vectorOptions.metric().vectorSimilarityFunction();
         this.sizePerIndex = vectorOptions.sizePerIndex();
     }
 
     @Override
     public void write(Object key) {
         count++;
-        VectorIndex index = vectorIndexFactory.create(count, key);
+        LuceneVectorIndex index = vectorIndexFactory.create(count, key);
         index.checkDimension(vectorOptions.dimension());
         vectorIndices.add(index);
         if (vectorIndices.size() >= sizePerIndex) {
@@ -96,7 +96,7 @@ public List<ResultEntry> finish() {
     }
 
     private void flush() throws IOException {
-        String fileName = fileWriter.newFileName(VectorGlobalIndexerFactory.IDENTIFIER);
+        String fileName = fileWriter.newFileName(LuceneVectorGlobalIndexerFactory.IDENTIFIER);
         try (OutputStream out = new BufferedOutputStream(fileWriter.newOutputStream(fileName))) {
             buildIndex(
                     vectorIndices,
@@ -112,24 +112,25 @@ private void flush() throws IOException {
     }
 
     private void buildIndex(
-            List<VectorIndex> batchVectors,
+            List<LuceneVectorIndex> batchVectors,
             int m,
             int efConstruction,
             int writeBufferSize,
             OutputStream out) {
 
         IndexWriterConfig config = getIndexWriterConfig(m, efConstruction, writeBufferSize);
-        try (IndexMMapDirectory indexMMapDirectory = new IndexMMapDirectory()) {
-            try (IndexWriter writer = new IndexWriter(indexMMapDirectory.directory(), config)) {
-                for (VectorIndex vectorIndex : batchVectors) {
+        try (LuceneIndexMMapDirectory luceneIndexMMapDirectory = new LuceneIndexMMapDirectory()) {
+            try (IndexWriter writer =
+                    new IndexWriter(luceneIndexMMapDirectory.directory(), config)) {
+                for (LuceneVectorIndex luceneVectorIndex : batchVectors) {
                     Document doc = new Document();
-                    doc.add(vectorIndex.indexableField(similarityFunction));
-                    doc.add(vectorIndex.rowIdStoredField());
+                    doc.add(luceneVectorIndex.indexableField(similarityFunction));
+                    doc.add(luceneVectorIndex.rowIdStoredField());
                     writer.addDocument(doc);
                 }
                 writer.commit();
             }
-            indexMMapDirectory.serialize(out);
+            luceneIndexMMapDirectory.serialize(out);
         } catch (Exception e) {
             throw new RuntimeException(e);
         }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexer.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexer.java
@@ -30,25 +30,25 @@
 import java.io.IOException;
 import java.util.List;
 
-/** Vector global indexer. */
-public class VectorGlobalIndexer implements GlobalIndexer {
+/** Lucene vector global indexer. */
+public class LuceneVectorGlobalIndexer implements GlobalIndexer {
 
     private final DataType fieldType;
     private final Options options;
 
-    public VectorGlobalIndexer(DataType fieldType, Options options) {
+    public LuceneVectorGlobalIndexer(DataType fieldType, Options options) {
         this.fieldType = fieldType;
         this.options = options;
     }
 
     @Override
     public GlobalIndexWriter createWriter(GlobalIndexFileWriter fileWriter) throws IOException {
-        return new VectorGlobalIndexWriter(fileWriter, fieldType, options);
+        return new LuceneVectorGlobalIndexWriter(fileWriter, fieldType, options);
     }
 
     @Override
     public GlobalIndexReader createReader(
             GlobalIndexFileReader fileReader, List<GlobalIndexIOMeta> files) throws IOException {
-        return new VectorGlobalIndexReader(fileReader, files);
+        return new LuceneVectorGlobalIndexReader(fileReader, files);
     }
 }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexerFactory.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexerFactory.java
@@ -23,10 +23,10 @@
 import org.apache.paimon.options.Options;
 import org.apache.paimon.types.DataType;
 
-/** Factory for creating lucene hnsw vector global indexers. */
-public class VectorGlobalIndexerFactory implements GlobalIndexerFactory {
+/** Factory for creating Lucene vector global indexers. */
+public class LuceneVectorGlobalIndexerFactory implements GlobalIndexerFactory {
 
-    public static final String IDENTIFIER = "lucene-hnsw";
+    public static final String IDENTIFIER = "lucene-vector-knn";
 
     @Override
     public String identifier() {
@@ -35,6 +35,6 @@ public String identifier() {
 
     @Override
     public GlobalIndexer create(DataType type, Options options) {
-        return new VectorGlobalIndexer(type, options);
+        return new LuceneVectorGlobalIndexer(type, options);
     }
 }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndex.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndex.java
@@ -22,8 +22,8 @@
 import org.apache.lucene.index.IndexableField;
 import org.apache.lucene.index.VectorSimilarityFunction;
 
-/** Vector index interface. */
-public abstract class VectorIndex<T> {
+/** Abstract base class for Lucene vector indexes. */
+public abstract class LuceneVectorIndex<T> {
 
     public static final String VECTOR_FIELD = "vector";
     public static final String ROW_ID_FIELD = "id";
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndexFactory.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndexFactory.java
@@ -23,36 +23,36 @@
 import org.apache.paimon.types.FloatType;
 import org.apache.paimon.types.TinyIntType;
 
-/** Factory for creating vector index instances based on data type. */
-public abstract class VectorIndexFactory {
+/** Factory for creating Lucene vector index instances based on data type. */
+public abstract class LuceneVectorIndexFactory {
 
-    public static VectorIndexFactory init(DataType dataType) {
+    public static LuceneVectorIndexFactory init(DataType dataType) {
         if (dataType instanceof ArrayType
                 && ((ArrayType) dataType).getElementType() instanceof FloatType) {
-            return new FloatVectorIndexFactory();
+            return new LuceneFloatVectorIndexFactory();
         } else if (dataType instanceof ArrayType
                 && ((ArrayType) dataType).getElementType() instanceof TinyIntType) {
-            return new ByteVectorIndexFactory();
+            return new LuceneByteVectorIndexFactory();
         } else {
             throw new IllegalArgumentException("Unsupported data type: " + dataType);
         }
     }
 
-    public abstract VectorIndex create(long rowId, Object vector);
+    public abstract LuceneVectorIndex create(long rowId, Object vector);
 
-    /** Factory for creating FloatVectorIndex instances. */
-    public static class FloatVectorIndexFactory extends VectorIndexFactory {
+    /** Factory for creating LuceneFloatVectorIndex instances. */
+    public static class LuceneFloatVectorIndexFactory extends LuceneVectorIndexFactory {
         @Override
-        public VectorIndex create(long rowId, Object vector) {
-            return new FloatVectorIndex(rowId, (float[]) vector);
+        public LuceneVectorIndex create(long rowId, Object vector) {
+            return new LuceneFloatVectorIndex(rowId, (float[]) vector);
         }
     }
 
-    /** Factory for creating FloatVectorIndex instances. */
-    public static class ByteVectorIndexFactory extends VectorIndexFactory {
+    /** Factory for creating LuceneByteVectorIndex instances. */
+    public static class LuceneByteVectorIndexFactory extends LuceneVectorIndexFactory {
         @Override
-        public VectorIndex create(long rowId, Object vector) {
-            return new ByteVectorIndex(rowId, (byte[]) vector);
+        public LuceneVectorIndex create(long rowId, Object vector) {
+            return new LuceneByteVectorIndex(rowId, (byte[]) vector);
         }
     }
 }
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndexOptions.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorIndexOptions.java
diff --git a/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorMetric.java b/paimon-lucene/src/main/java/org/apache/paimon/lucene/index/LuceneVectorMetric.java
diff --git a/paimon-lucene/src/main/resources/META-INF/services/org.apache.paimon.globalindex.GlobalIndexerFactory b/paimon-lucene/src/main/resources/META-INF/services/org.apache.paimon.globalindex.GlobalIndexerFactory
diff --git a/paimon-lucene/src/test/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexTest.java b/paimon-lucene/src/test/java/org/apache/paimon/lucene/index/LuceneVectorGlobalIndexTest.java