-
Notifications
You must be signed in to change notification settings - Fork 985
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Support for SimpleVectorStore with metadata filter expressions
Signed-off-by: Jemin Huh <hjm1980@gmail.com>
- Loading branch information
1 parent
cd871ea
commit d5cd6e7
Showing
4 changed files
with
610 additions
and
5 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
147 changes: 147 additions & 0 deletions
147
...framework/ai/vectorstore/filter/converter/SimpleVectorStoreFilterExpressionConverter.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,147 @@ | ||
/* | ||
* Copyright 2023-2024 the original author or authors. | ||
* | ||
* Licensed under the Apache License, Version 2.0 (the "License"); | ||
* you may not use this file except in compliance with the License. | ||
* You may obtain a copy of the License at | ||
* | ||
* https://www.apache.org/licenses/LICENSE-2.0 | ||
* | ||
* Unless required by applicable law or agreed to in writing, software | ||
* distributed under the License is distributed on an "AS IS" BASIS, | ||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
* See the License for the specific language governing permissions and | ||
* limitations under the License. | ||
*/ | ||
|
||
package org.springframework.ai.vectorstore.filter.converter; | ||
|
||
import org.springframework.ai.vectorstore.filter.Filter; | ||
import org.springframework.ai.vectorstore.filter.Filter.Expression; | ||
|
||
import java.text.ParseException; | ||
import java.text.SimpleDateFormat; | ||
import java.util.Date; | ||
import java.util.List; | ||
import java.util.TimeZone; | ||
import java.util.regex.Pattern; | ||
|
||
/** | ||
* Converts {@link Expression} into SpEL metadata filter expression format. | ||
* (https://docs.spring.io/spring-framework/reference/core/expressions.html) | ||
* | ||
* @author Jemin Huh | ||
*/ | ||
public class SimpleVectorStoreFilterExpressionConverter extends AbstractFilterExpressionConverter { | ||
|
||
private static final Pattern DATE_FORMAT_PATTERN = Pattern.compile("\\d{4}-\\d{2}-\\d{2}T\\d{2}:\\d{2}:\\d{2}Z"); | ||
|
||
private final SimpleDateFormat dateFormat; | ||
|
||
public SimpleVectorStoreFilterExpressionConverter() { | ||
this.dateFormat = new SimpleDateFormat("yyyy-MM-dd'T'HH:mm:ss'Z'"); | ||
this.dateFormat.setTimeZone(TimeZone.getTimeZone("UTC")); | ||
} | ||
|
||
@Override | ||
protected void doExpression(Filter.Expression expression, StringBuilder context) { | ||
this.convertOperand(expression.left(), context); | ||
context.append(getOperationSymbol(expression)); | ||
this.convertOperand(expression.right(), context); | ||
} | ||
|
||
private String getOperationSymbol(Filter.Expression exp) { | ||
return switch (exp.type()) { | ||
case AND -> " and "; | ||
case OR -> " or "; | ||
case EQ -> " == "; | ||
case LT -> " < "; | ||
case LTE -> " <= "; | ||
case GT -> " > "; | ||
case GTE -> " >= "; | ||
case NE -> " != "; | ||
case IN -> " in "; | ||
case NIN -> " not in "; | ||
default -> throw new RuntimeException("Not supported expression type: " + exp.type()); | ||
}; | ||
} | ||
|
||
@Override | ||
protected void doKey(Filter.Key key, StringBuilder context) { | ||
var identifier = hasOuterQuotes(key.key()) ? removeOuterQuotes(key.key()) : key.key(); | ||
context.append("#metadata['").append(identifier).append("']"); | ||
} | ||
|
||
@Override | ||
protected void doValue(Filter.Value filterValue, StringBuilder context) { | ||
if (filterValue.value() instanceof List<?> list) { | ||
var formattedList = new StringBuilder("{"); | ||
int c = 0; | ||
for (Object v : list) { | ||
this.doSingleValue(v, formattedList); | ||
if (c++ < list.size() - 1) { | ||
this.doAddValueRangeSpitter(filterValue, formattedList); | ||
} | ||
} | ||
formattedList.append("}"); | ||
|
||
if (context.lastIndexOf("in ") == -1) { | ||
context.append(formattedList); | ||
} | ||
else { | ||
appendSpELContains(formattedList, context); | ||
} | ||
} | ||
else { | ||
this.doSingleValue(filterValue.value(), context); | ||
} | ||
} | ||
|
||
private void appendSpELContains(StringBuilder formattedList, StringBuilder context) { | ||
int metadataStart = context.lastIndexOf("#metadata"); | ||
if (metadataStart == -1) | ||
throw new RuntimeException("Wrong SpEL expression: " + context); | ||
|
||
int metadataEnd = context.indexOf(" ", metadataStart); | ||
String metadata = context.substring(metadataStart, metadataEnd); | ||
context.setLength(context.lastIndexOf("in ")); | ||
context.delete(metadataStart, metadataEnd + 1); | ||
context.append(formattedList).append(".contains(").append(metadata).append(")"); | ||
} | ||
|
||
@Override | ||
protected void doSingleValue(Object value, StringBuilder context) { | ||
if (value instanceof Date date) { | ||
context.append("'"); | ||
context.append(this.dateFormat.format(date)); | ||
context.append("'"); | ||
} | ||
else if (value instanceof String text) { | ||
context.append("'"); | ||
if (DATE_FORMAT_PATTERN.matcher(text).matches()) { | ||
try { | ||
Date date = this.dateFormat.parse(text); | ||
context.append(this.dateFormat.format(date)); | ||
} | ||
catch (ParseException e) { | ||
throw new IllegalArgumentException("Invalid date type:" + text, e); | ||
} | ||
} | ||
else { | ||
context.append(text); | ||
} | ||
context.append("'"); | ||
} | ||
else { | ||
context.append(value); | ||
} | ||
} | ||
|
||
@Override | ||
protected void doGroup(Filter.Group group, StringBuilder context) { | ||
context.append("("); | ||
super.doGroup(group, context); | ||
context.append(")"); | ||
} | ||
|
||
} |
Oops, something went wrong.