SOLR-17780: Add support for scalar quantized dense vectors #3385

Open · wants to merge 4 commits into main · Changes from 2 commits
36 changes: 33 additions & 3 deletions solr/core/src/java/org/apache/solr/core/SchemaCodecFactory.java
@@ -28,19 +28,24 @@
import org.apache.lucene.codecs.PostingsFormat;
import org.apache.lucene.codecs.lucene912.Lucene912Codec;
import org.apache.lucene.codecs.lucene912.Lucene912Codec.Mode;
import org.apache.lucene.codecs.lucene99.Lucene99HnswScalarQuantizedVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat;
import org.apache.lucene.codecs.lucene99.Lucene99ScalarQuantizedVectorsFormat;
import org.apache.lucene.index.SegmentReadState;
import org.apache.lucene.index.SegmentWriteState;
import org.apache.solr.common.SolrException;
import org.apache.solr.common.SolrException.ErrorCode;
import org.apache.solr.common.util.NamedList;
import org.apache.solr.schema.DenseVectorField;
import org.apache.solr.schema.FieldType;
import org.apache.solr.schema.ScalarQuantizedDenseVectorField;
import org.apache.solr.schema.SchemaField;
import org.apache.solr.util.plugin.SolrCoreAware;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import static org.apache.lucene.codecs.lucene99.Lucene99HnswVectorsFormat.DEFAULT_NUM_MERGE_WORKER;

/**
* Per-field CodecFactory implementation, extends Lucene's and returns postings format
* implementations according to the schema configuration. <br>
@@ -126,16 +131,41 @@ public DocValuesFormat getDocValuesFormatForField(String field) {
public KnnVectorsFormat getKnnVectorsFormatForField(String field) {
final SchemaField schemaField = core.getLatestSchema().getFieldOrNull(field);
FieldType fieldType = (schemaField == null ? null : schemaField.getType());
if (fieldType instanceof DenseVectorField vectorType) {
KnnVectorsFormat delegate;
Contributor: The instanceof checks can be a code smell. I look at all this and wonder: wouldn't it make sense for a method DenseVectorField.buildKnnVectorsFormat() to exist? Or just a getter, if it's built in the field type's init()... which would also mean no need to have each of those fields (e.g. no bits, ...) with their getters either.

Author: Reworked it. Let me know if this is along the lines of what you were thinking.

Contributor: Much better. Did you consider init() also creating the codec, to thus avoid the need for the corresponding fields, getters, and setters?

Author: I'm not quite sure I follow. Do you mean the ScalarQuantizedDenseVectorField init() or the SchemaCodecFactory init()?

Contributor: ScalarQuantizedDenseVectorField.init() (and its superclass, DenseVectorField) creating a KnnVectorsFormat that later can simply be returned.

Author: That's probably true. However, it does look like the getters are used in the DenseVectorField tests, since KnnVectorsFormat doesn't expose the internal setting values. Personally I think it's OK to leave it patterned as-is; having getters affords some level of flexibility and transparency.

But I can make this change if you feel strongly about it.

if (fieldType instanceof ScalarQuantizedDenseVectorField scalarQuantizedVectorType) {
final String knnAlgorithm = scalarQuantizedVectorType.getKnnAlgorithm();
switch (knnAlgorithm) {
case DenseVectorField.FLAT_ALGORITHM:
delegate = new Lucene99ScalarQuantizedVectorsFormat(
scalarQuantizedVectorType.getConfidenceInterval(),
scalarQuantizedVectorType.getBits(),
scalarQuantizedVectorType.useCompression());
break;
case DenseVectorField.HNSW_ALGORITHM:
int maxConn = scalarQuantizedVectorType.getHnswMaxConn();
int beamWidth = scalarQuantizedVectorType.getHnswBeamWidth();
delegate = new Lucene99HnswScalarQuantizedVectorsFormat(maxConn,
beamWidth,
DEFAULT_NUM_MERGE_WORKER,
scalarQuantizedVectorType.getBits(),
scalarQuantizedVectorType.useCompression(),
scalarQuantizedVectorType.getConfidenceInterval(),
null);
break;
default:
throw new SolrException(ErrorCode.SERVER_ERROR, knnAlgorithm + " KNN algorithm is not supported");
}
return new SolrDelegatingKnnVectorsFormat(delegate, scalarQuantizedVectorType.getDimension());
} else if (fieldType instanceof DenseVectorField vectorType) {
String knnAlgorithm = vectorType.getKnnAlgorithm();
if (DenseVectorField.HNSW_ALGORITHM.equals(knnAlgorithm)) {
int maxConn = vectorType.getHnswMaxConn();
int beamWidth = vectorType.getHnswBeamWidth();
delegate = new Lucene99HnswVectorsFormat(maxConn, beamWidth);
return new SolrDelegatingKnnVectorsFormat(delegate, vectorType.getDimension());
} else {
throw new SolrException(
ErrorCode.SERVER_ERROR, knnAlgorithm + " KNN algorithm is not supported");
}
}
return super.getKnnVectorsFormatForField(field);
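The refactor suggested in the review thread above (moving format construction into the field type) could be sketched roughly as follows. All types here are simplified stand-ins for the Solr/Lucene classes, and `buildKnnVectorsFormat()` is the hypothetical method named in the review, not code from the patch:

```java
// Sketch of the suggested refactor: each field type builds its own vectors
// format, so SchemaCodecFactory can replace the instanceof chain with one
// polymorphic call. KnnFormatSketch is a stand-in for Lucene's
// KnnVectorsFormat; names are illustrative only.
interface KnnFormatSketch {
    String name();
}

class DenseVectorFieldSketch {
    protected final int hnswMaxConn;
    protected final int hnswBeamWidth;

    DenseVectorFieldSketch(int hnswMaxConn, int hnswBeamWidth) {
        this.hnswMaxConn = hnswMaxConn;
        this.hnswBeamWidth = hnswBeamWidth;
    }

    // Base type returns the plain HNSW format.
    KnnFormatSketch buildKnnVectorsFormat() {
        return () -> "hnsw(maxConn=" + hnswMaxConn + ", beamWidth=" + hnswBeamWidth + ")";
    }
}

class ScalarQuantizedDenseVectorFieldSketch extends DenseVectorFieldSketch {
    private final int bits;

    ScalarQuantizedDenseVectorFieldSketch(int maxConn, int beamWidth, int bits) {
        super(maxConn, beamWidth);
        this.bits = bits;
    }

    // Subclass overrides to return the quantized variant; the factory never
    // needs to know which concrete field type it holds.
    @Override
    KnnFormatSketch buildKnnVectorsFormat() {
        return () -> "hnsw-scalar-quantized(bits=" + bits + ")";
    }
}
```

With this shape, the factory body collapses to a single `fieldType.buildKnnVectorsFormat()` call, which is the readability gain the reviewer was after.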
@@ -64,6 +64,7 @@
public class DenseVectorField extends FloatPointField {
private static final Logger log = LoggerFactory.getLogger(MethodHandles.lookup().lookupClass());
public static final String HNSW_ALGORITHM = "hnsw";
public static final String FLAT_ALGORITHM = "flat";
Contributor: 'VECTOR_STORAGE_ALGORITHM' maybe? Is it used somewhere?

Contributor: Reading it more, we are mixing up the 'knn' algorithm (only HNSW supported right now) with the 'vector storage' (flat, scalarQuantised, and binaryQuantised).

public static final String DEFAULT_KNN_ALGORITHM = HNSW_ALGORITHM;
static final String KNN_VECTOR_DIMENSION = "vectorDimension";
static final String KNN_ALGORITHM = "knnAlgorithm";
@@ -0,0 +1,107 @@
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.solr.schema;

import org.apache.lucene.codecs.lucene99.Lucene99ScalarQuantizedVectorsFormat;
import org.apache.lucene.index.VectorEncoding;
import org.apache.lucene.index.VectorSimilarityFunction;

import java.util.Map;

import static java.util.Optional.ofNullable;

public class ScalarQuantizedDenseVectorField extends DenseVectorField {
public static final String BITS = "bits";
public static final String CONFIDENCE_INTERVAL = "confidenceInterval";
public static final String DYNAMIC_CONFIDENCE_INTERVAL = "dynamicConfidenceInterval";
public static final String COMPRESS = "compress"; // can only be enabled when bits = 4 per Lucene codec spec
Contributor: These first four lines are param names, if I'm not mistaken. Maybe we can call them '_PARAM', e.g. 'BITS_PARAM'. Or add a comment line at the beginning that clearly groups them as param names. It's minor, but it can increase code readability.

Contributor: To be fair, checking the original DenseVectorField, the same renaming could help there as well, I suspect.

private static final int DEFAULT_BITS = 7; // use signed byte as default when unspecified
private static final Float DEFAULT_CONFIDENCE_INTERVAL = null; // use dimension scaled confidence interval

/**
* Number of bits to use for storage
* Must be 4 (half-byte) or 7 (signed-byte) per Lucene codec spec
*/
private int bits;

/**
* Confidence interval to use for scalar quantization
* Default is calculated as `1-1/(vector_dimensions + 1)`
*/
private Float confidenceInterval;

/**
* When enabled, in conjunction with 4 bit size, will pair values into single bytes for 50% reduction in memory usage
* (comes at the cost of some decode speed penalty)
*/
private boolean compress;
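The 50% figure above follows from packing two 4-bit quantized values (0–15) into a single byte. A minimal standalone sketch of that packing, purely to illustrate the idea (Lucene's codec does the real packing internally):

```java
// Sketch of 4-bit ("half-byte") packing: two quantized values share one
// byte, halving storage versus one byte per value. The small bit-twiddling
// cost on read is the decode-speed penalty mentioned above.
final class NibblePacking {
    // low occupies bits 0-3, high occupies bits 4-7
    static byte pack(int low, int high) {
        return (byte) ((low & 0x0F) | ((high & 0x0F) << 4));
    }

    static int unpackLow(byte b)  { return b & 0x0F; }

    static int unpackHigh(byte b) { return (b >> 4) & 0x0F; }
}
```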

public ScalarQuantizedDenseVectorField(int dimension,
VectorSimilarityFunction similarityFunction,
VectorEncoding vectorEncoding,
int bits,
Float confidenceInterval,
boolean compress) {
super(dimension, similarityFunction, vectorEncoding);
this.bits = bits;
this.confidenceInterval = confidenceInterval;
this.compress = compress;
}

@Override
public void init(IndexSchema schema, Map<String, String> args) {
super.init(schema, args);

this.bits = ofNullable(args.get(BITS))
.map(Integer::parseInt)
.orElse(DEFAULT_BITS);
args.remove(BITS);

this.compress = ofNullable(args.get(COMPRESS))
.map(Boolean::parseBoolean)
.orElse(false);
args.remove(COMPRESS);

boolean useDynamicConfidenceInterval = ofNullable(args.get(DYNAMIC_CONFIDENCE_INTERVAL))
.map(Boolean::parseBoolean)
.orElse(false);
args.remove(DYNAMIC_CONFIDENCE_INTERVAL);

if (useDynamicConfidenceInterval) {
this.confidenceInterval = Lucene99ScalarQuantizedVectorsFormat.DYNAMIC_CONFIDENCE_INTERVAL;
}

this.confidenceInterval = ofNullable(args.get(CONFIDENCE_INTERVAL))
Contributor: This overwrites the confidenceInterval set when useDynamicConfidenceInterval == true above.

Author: Good catch. I was hoping to make any explicit confidence interval override the dynamic behavior; however, with both the absence of the arg and the default being null, I think I will flip the behavior (use dynamic if specified, otherwise the confidence interval if specified, otherwise the default confidence interval if neither is provided).

Contributor: Okay, but then let's check if both are set and throw an exception.

Author: If neither is set, it should default to the default behavior (scaled confidence interval), which per the Lucene spec means passing a null confidence interval.

.map(Float::parseFloat)
.orElse(DEFAULT_CONFIDENCE_INTERVAL);
args.remove(CONFIDENCE_INTERVAL);
}
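The resolution the review thread converges on (explicit interval and dynamic mode are mutually exclusive; neither set means null, letting Lucene scale by dimension) can be sketched as a standalone helper. The `DYNAMIC` sentinel and the helper itself are illustrative stand-ins, not code from the patch:

```java
import java.util.Map;

// Sketch of the confidence-interval resolution discussed in review:
// an explicit confidenceInterval and dynamicConfidenceInterval=true are
// mutually exclusive; with neither set, null is passed through so Lucene
// falls back to its dimension-scaled default.
final class ConfidenceIntervalResolver {
    // Placeholder sentinel standing in for
    // Lucene99ScalarQuantizedVectorsFormat.DYNAMIC_CONFIDENCE_INTERVAL.
    static final float DYNAMIC = 0f;

    static Float resolve(Map<String, String> args) {
        boolean dynamic =
            Boolean.parseBoolean(args.getOrDefault("dynamicConfidenceInterval", "false"));
        String explicit = args.get("confidenceInterval");
        if (dynamic && explicit != null) {
            throw new IllegalArgumentException(
                "confidenceInterval and dynamicConfidenceInterval are mutually exclusive");
        }
        if (dynamic) {
            return DYNAMIC;
        }
        return explicit == null ? null : Float.parseFloat(explicit);
    }
}
```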

public int getBits() {
return bits;
}

public boolean useCompression() {
return compress;
}

public Float getConfidenceInterval() {
return confidenceInterval;
}

}
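For context, a field type using the parameters this class parses might be declared in a schema roughly as follows. The fieldType name and values are illustrative only; the class and parameter names assume this patch as written:

```xml
<!-- Illustrative only: parameter names taken from this patch.
     compress is only valid with bits="4" per the Lucene codec spec. -->
<fieldType name="knn_vector_sq" class="solr.ScalarQuantizedDenseVectorField"
           vectorDimension="768" similarityFunction="cosine"
           knnAlgorithm="hnsw"
           bits="4" compress="true"
           confidenceInterval="0.9"/>
```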