
SOLR-17780: Add support for scalar quantized dense vectors #3385


Open · wants to merge 4 commits into base: main
23 changes: 11 additions & 12 deletions solr/core/src/java/org/apache/solr/core/SchemaCodecFactory.java
@@ -28,19 +28,24 @@
import org.apache.lucene.codecs.PostingsFormat;
import org.apache.lucene.codecs.lucene912.Lucene912Codec;
import org.apache.lucene.codecs.lucene912.Lucene912Codec.Mode;
import org.apache.lucene.codecs.lucene99.Lucene99HnswScalarQuantizedVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99ScalarQuantizedVectorsFormat;
import org.apache.lucene.index.SegmentReadState;
import org.apache.lucene.index.SegmentWriteState;
import org.apache.solr.common.SolrException;
import org.apache.solr.common.SolrException.ErrorCode;
import org.apache.solr.common.util.NamedList;
import org.apache.solr.schema.DenseVectorField;
import org.apache.solr.schema.FieldType;
import org.apache.solr.schema.ScalarQuantizedDenseVectorField;
import org.apache.solr.schema.SchemaField;
import org.apache.solr.util.plugin.SolrCoreAware;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import static org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat.DEFAULT_NUM_MERGE_WORKER;

/**
* Per-field CodecFactory implementation, extends Lucene's and returns postings format
* implementations according to the schema configuration. <br>
@@ -126,19 +131,13 @@ public DocValuesFormat getDocValuesFormatForField(String field) {
public KnnVectorsFormat getKnnVectorsFormatForField(String field) {
final SchemaField schemaField = core.getLatestSchema().getFieldOrNull(field);
FieldType fieldType = (schemaField == null ? null : schemaField.getType());
if (fieldType instanceof DenseVectorField vectorType) {
String knnAlgorithm = vectorType.getKnnAlgorithm();
if (DenseVectorField.HNSW_ALGORITHM.equals(knnAlgorithm)) {
int maxConn = vectorType.getHnswMaxConn();
int beamWidth = vectorType.getHnswBeamWidth();
var delegate = new Lucene99HnswVectorsFormat(maxConn, beamWidth);
return new SolrDelegatingKnnVectorsFormat(delegate, vectorType.getDimension());
} else {
throw new SolrException(
ErrorCode.SERVER_ERROR, knnAlgorithm + " KNN algorithm is not supported");
}
if (fieldType instanceof DenseVectorField) {
final DenseVectorField vectorField = (DenseVectorField) fieldType;
return new SolrDelegatingKnnVectorsFormat(vectorField.buildKnnVectorsFormat(),
vectorField.getDimension());
} else {
throw new SolrException(ErrorCode.SERVER_ERROR, "field is not a supported KNN vector type");
}
return super.getKnnVectorsFormatForField(field);
}
};
}
solr/core/src/java/org/apache/solr/schema/DenseVectorField.java

@@ -26,6 +26,7 @@
import java.util.Locale;
import java.util.Map;
import org.apache.lucene.codecs.KnnVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat;
import org.apache.lucene.document.FieldType;
import org.apache.lucene.document.KnnByteVectorField;
import org.apache.lucene.document.KnnFloatVectorField;
@@ -64,6 +65,7 @@
public class DenseVectorField extends FloatPointField {
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
public static final String HNSW_ALGORITHM = "hnsw";
public static final String FLAT_ALGORITHM = "flat";
Review comment (Contributor):

'VECTOR_STORAGE_ALGORITHM' maybe?
Is it used somewhere?

Review comment (Contributor):

reading it more, we are mixing up the 'knn' algorithm (only HNSW supported right now) with the 'vector storage' (flat, scalarQuantised, and binaryQuantised)
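
To make the distinction the comment draws concrete, the two axes could be modelled separately. This is a hypothetical sketch, not code from the PR; the class, enum, and method names are invented here:

```java
// Hypothetical sketch (names invented, not part of the PR): the knn/graph
// algorithm and the vector storage format are independent choices that the
// schema could model separately instead of overloading one 'knnAlgorithm' knob.
public class VectorFormatAxes {
    public enum KnnAlgorithm { HNSW }
    public enum VectorStorage { FLAT, SCALAR_QUANTIZED, BINARY_QUANTIZED }

    // A field configuration would then carry one value from each axis.
    public static String describe(KnnAlgorithm algo, VectorStorage storage) {
        return algo + " graph over " + storage + " storage";
    }
}
```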

public static final String DEFAULT_KNN_ALGORITHM = HNSW_ALGORITHM;
static final String KNN_VECTOR_DIMENSION = "vectorDimension";
static final String KNN_ALGORITHM = "knnAlgorithm";
@@ -346,6 +348,10 @@ public DenseVectorParser getVectorBuilder(
}
}

public KnnVectorsFormat buildKnnVectorsFormat() {
return new Lucene99HnswVectorsFormat(hnswMaxConn, hnswBeamWidth);
}

@Override
public UninvertingReader.Type getUninversionType(SchemaField sf) {
return null;
solr/core/src/java/org/apache/solr/schema/ScalarQuantizedDenseVectorField.java (new file)

@@ -0,0 +1,128 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.solr.schema;

import org.apache.lucene.codecs.KnnVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99HnswScalarQuantizedVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99ScalarQuantizedVectorsFormat;
import org.apache.lucene.index.VectorEncoding;
import org.apache.lucene.index.VectorSimilarityFunction;
import org.apache.solr.common.SolrException;

import java.util.Map;

import static java.util.Optional.ofNullable;
import static org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat.DEFAULT_NUM_MERGE_WORKER;

public class ScalarQuantizedDenseVectorField extends DenseVectorField {
public static final String BITS = "bits";
public static final String CONFIDENCE_INTERVAL = "confidenceInterval";
public static final String DYNAMIC_CONFIDENCE_INTERVAL = "dynamicConfidenceInterval";
public static final String COMPRESS = "compress"; // can only be enabled when bits = 4 per Lucene codec spec
Review comment (Contributor):

these first four lines are param names, if I'm not mistaken.

Maybe we can call them '_PARAM', e.g. 'BITS_PARAM'.

Or add a comment line at the beginning that clearly groups them as param names.
It's minor, but it would increase code readability.

Review comment (Contributor):

to be fair, checking the original DenseVectorField, the same renaming could help there as well I suspect


private static final int DEFAULT_BITS = 7; // use signed byte as default when unspecified
private static final Float DEFAULT_CONFIDENCE_INTERVAL = null; // use dimension scaled confidence interval

/**
* Number of bits to use for storage
* Must be 4 (half-byte) or 7 (signed-byte) per Lucene codec spec
*/
private int bits;

/**
* Confidence interval to use for scalar quantization
* Default is calculated as `1-1/(vector_dimensions + 1)`
*/
private Float confidenceInterval;

/**
* When enabled, in conjunction with 4 bit size, will pair values into single bytes for 50% reduction in memory usage
* (comes at the cost of some decode speed penalty)
*/
private boolean compress;

public ScalarQuantizedDenseVectorField(int dimension,
VectorSimilarityFunction similarityFunction,
VectorEncoding vectorEncoding,
int bits,
Float confidenceInterval,
boolean compress) {
super(dimension, similarityFunction, vectorEncoding);
this.bits = bits;
this.confidenceInterval = confidenceInterval;
this.compress = compress;
}

@Override
public void init(IndexSchema schema, Map<String, String> args) {
super.init(schema, args);

this.bits = ofNullable(args.remove(BITS))
.map(Integer::parseInt)
.orElse(DEFAULT_BITS);

this.compress = ofNullable(args.remove(COMPRESS))
.map(Boolean::parseBoolean)
.orElse(false);

this.confidenceInterval = ofNullable(args.remove(CONFIDENCE_INTERVAL))
.map(Float::parseFloat)
.orElse(DEFAULT_CONFIDENCE_INTERVAL);

if (ofNullable(args.remove(DYNAMIC_CONFIDENCE_INTERVAL))
.map(Boolean::parseBoolean)
.orElse(false)) {
this.confidenceInterval = Lucene99ScalarQuantizedVectorsFormat.DYNAMIC_CONFIDENCE_INTERVAL;
}
}

@Override
public KnnVectorsFormat buildKnnVectorsFormat() {
final String knnAlgorithm = getKnnAlgorithm();
if (KNN_ALGORITHM.equals(knnAlgorithm)) {
Review comment (Contributor):

mmmm not sure about this part:

The only knn algorithm supported right now is 'HNSW'.
While for vector storage, there's flat (what's currently supported), scalar quantised, and binary quantised.
Effectively, in Lucene, HNSW vector formats define how to build and read the HNSW graph (where each vector ID is a node).
Vector storage formats define how to store the vectors themselves.

The vector storage format is directly (and only) used by the graph format parent (I had in my to-do list to re-organise the package to easily differentiate graph from storage formats).

Lucene99HnswVectorsFormat uses Lucene99FlatVectorsFormat.
• Stores, for each field, the vector metadata (.vemf) and vector data (.vec).
• It has a dedicated writer and reader, dependent on the vector encoding (BYTE or FLOAT32).
• It has its own scorer (that just uses the supplied similarity).

Lucene99HnswScalarQuantizedVectorsFormat uses Lucene99ScalarQuantizedVectorsFormat (for scalar quantisation).
• Lossy compression from float32 to a number of bits (4 or 7)
• Raw disk usage increases (both raw and quantized vectors are stored).
• Off-heap memory decreases as quantised vectors are loaded.
• Search is faster.
• It has a dedicated writer and reader, dependent on the bits to use for quantisation.

Given that, I suspect with this contribution we want to differentiate between:
Lucene99HnswVectorsFormat and Lucene99HnswScalarQuantizedVectorsFormat (without manipulating directly the vector storage).

-> the if/then/else should be changed, I suspect. I don't understand it as it is right now, as we are mixing a graph format (Lucene99HnswScalarQuantizedVectorsFormat, which already uses the scalar quantised storage format) and a vector storage format (Lucene99ScalarQuantizedVectorsFormat)
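
The quantisation behaviour described in the comment above can be illustrated with a small, self-contained sketch. This is a conceptual illustration only, not Lucene's actual implementation (the real codec derives min/max from the configured confidence interval over observed values and stores correction terms); all names here are invented:

```java
// Conceptual sketch of 7-bit scalar quantization: map floats in [min, max]
// onto 0..127 and back. Shows only the lossy float32 -> small-int -> float32
// round trip; Lucene's real codec is considerably more involved.
public class ScalarQuantizationSketch {

    // Default confidence interval when none is configured, per the field's
    // javadoc: 1 - 1/(vector_dimensions + 1).
    static float defaultConfidenceInterval(int dimensions) {
        return 1f - 1f / (dimensions + 1);
    }

    // Quantize a float in [min, max] to a 7-bit value (0..127), clamping
    // out-of-range inputs.
    static byte quantize(float v, float min, float max) {
        float clamped = Math.max(min, Math.min(max, v));
        return (byte) Math.round((clamped - min) * 127f / (max - min));
    }

    // Reconstruct an approximation of the original float (lossy).
    static float dequantize(byte q, float min, float max) {
        return min + q * (max - min) / 127f;
    }

    // With compress=true and bits=4, two 4-bit values can share one byte,
    // halving quantized storage at some decode-speed cost.
    static byte packNibbles(int hi, int lo) {
        return (byte) ((hi << 4) | (lo & 0x0F));
    }
}
```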

Review comment (Contributor):

From an initial review, the ScalarQuantizedDenseVectorField should always return the Lucene99HnswScalarQuantizedVectorsFormat.

The traditional DenseVectorField should always return Lucene99HnswVectorsFormat.
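
The suggestion above amounts to letting each field type own its format choice through the buildKnnVectorsFormat() override, with no knnAlgorithm string comparison in the subclass. Here is a minimal stand-in sketch; the stub types are invented here so the example is self-contained, whereas the real code would return the Lucene format classes:

```java
// Minimal sketch of the selection the reviewer suggests, using stand-in types
// instead of the real Lucene/Solr classes: the base field always builds the
// plain HNSW format, the quantized subclass always builds the
// HNSW + scalar-quantized format.
public class FormatSelectionSketch {
    interface KnnVectorsFormatStub { String name(); }

    static class DenseVectorFieldStub {
        KnnVectorsFormatStub buildKnnVectorsFormat() {
            return () -> "Lucene99HnswVectorsFormat";
        }
    }

    static class ScalarQuantizedDenseVectorFieldStub extends DenseVectorFieldStub {
        @Override
        KnnVectorsFormatStub buildKnnVectorsFormat() {
            return () -> "Lucene99HnswScalarQuantizedVectorsFormat";
        }
    }
}
```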

return new Lucene99HnswScalarQuantizedVectorsFormat(
getHnswMaxConn(),
getHnswBeamWidth(),
DEFAULT_NUM_MERGE_WORKER,
getBits(),
useCompression(),
getConfidenceInterval(),
null
);
} else if (FLAT_ALGORITHM.equals(knnAlgorithm)) {
return new Lucene99ScalarQuantizedVectorsFormat(
getConfidenceInterval(),
getBits(),
useCompression());
} else {
throw new SolrException(SolrException.ErrorCode.SERVER_ERROR, String.format("Unrecognized KNN algorithm: %s", knnAlgorithm));
}
}

public int getBits() {
return bits;
}

public boolean useCompression() {
return compress;
}

public Float getConfidenceInterval() {
return confidenceInterval;
}

}