Skip to content

Commit

Permalink
ES|QL: Fix RLIKE folding with (unsupported) case insensitive pattern (e…
Browse files Browse the repository at this point in the history
  • Loading branch information
luigidellaquila authored and nik9000 committed Dec 26, 2024
1 parent 7908f55 commit 549eea7
Show file tree
Hide file tree
Showing 12 changed files with 66 additions and 45 deletions.
5 changes: 5 additions & 0 deletions docs/changelog/118454.yaml
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
pr: 118454
summary: Fix RLIKE folding with (unsupported) case insensitive pattern
area: ES|QL
type: bug
issues: []
Original file line number Diff line number Diff line change
Expand Up @@ -8,12 +8,11 @@

import org.elasticsearch.common.io.stream.StreamOutput;
import org.elasticsearch.xpack.esql.core.expression.Expression;
import org.elasticsearch.xpack.esql.core.tree.NodeInfo;
import org.elasticsearch.xpack.esql.core.tree.Source;

import java.io.IOException;

public class RLike extends RegexMatch<RLikePattern> {
public abstract class RLike extends RegexMatch<RLikePattern> {

public RLike(Source source, Expression value, RLikePattern pattern) {
super(source, value, pattern, false);
Expand All @@ -33,13 +32,4 @@ public String getWriteableName() {
throw new UnsupportedOperationException();
}

@Override
protected NodeInfo<RLike> info() {
return NodeInfo.create(this, RLike::new, field(), pattern(), caseInsensitive());
}

@Override
protected RLike replaceChild(Expression newChild) {
return new RLike(source(), newChild, pattern(), caseInsensitive());
}
}
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,6 @@

package org.elasticsearch.xpack.esql.core.expression.predicate.regex;

import org.apache.lucene.util.BytesRef;
import org.elasticsearch.xpack.esql.core.expression.Expression;
import org.elasticsearch.xpack.esql.core.expression.Nullability;
import org.elasticsearch.xpack.esql.core.expression.function.scalar.UnaryScalarFunction;
Expand Down Expand Up @@ -64,11 +63,7 @@ public boolean foldable() {

@Override
public Boolean fold() {
Object val = field().fold();
if (val instanceof BytesRef br) {
val = br.utf8ToString();
}
return RegexOperation.match(val, pattern().asJavaRegex());
throw new UnsupportedOperationException();
}

@Override
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -8,12 +8,11 @@

import org.elasticsearch.common.io.stream.StreamOutput;
import org.elasticsearch.xpack.esql.core.expression.Expression;
import org.elasticsearch.xpack.esql.core.tree.NodeInfo;
import org.elasticsearch.xpack.esql.core.tree.Source;

import java.io.IOException;

public class WildcardLike extends RegexMatch<WildcardPattern> {
public abstract class WildcardLike extends RegexMatch<WildcardPattern> {

public WildcardLike(Source source, Expression left, WildcardPattern pattern) {
this(source, left, pattern, false);
Expand All @@ -33,14 +32,4 @@ public String getWriteableName() {
throw new UnsupportedOperationException();
}

@Override
protected NodeInfo<WildcardLike> info() {
return NodeInfo.create(this, WildcardLike::new, field(), pattern(), caseInsensitive());
}

@Override
protected WildcardLike replaceChild(Expression newLeft) {
return new WildcardLike(source(), newLeft, pattern(), caseInsensitive());
}

}
Original file line number Diff line number Diff line change
Expand Up @@ -11,8 +11,6 @@
import org.elasticsearch.xpack.esql.core.expression.FieldAttribute;
import org.elasticsearch.xpack.esql.core.expression.Literal;
import org.elasticsearch.xpack.esql.core.expression.predicate.Range;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLike;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLikePattern;
import org.elasticsearch.xpack.esql.core.tree.Source;
import org.elasticsearch.xpack.esql.core.type.DataType;
import org.elasticsearch.xpack.esql.core.type.EsField;
Expand Down Expand Up @@ -46,10 +44,6 @@ public static Range rangeOf(Expression value, Expression lower, boolean includeL
return new Range(EMPTY, value, lower, includeLower, upper, includeUpper, randomZone());
}

public static RLike rlike(Expression left, String exp) {
return new RLike(EMPTY, left, new RLikePattern(exp));
}

public static FieldAttribute fieldAttribute() {
return fieldAttribute(randomAlphaOfLength(10), randomFrom(DataType.types()));
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -580,3 +580,39 @@ Mokhtar |Bernatsky |38992 |BM
Parto |Bamford |61805 |BP
Premal |Baek |52833 |BP
;


caseInsensitiveRegex
from employees | where first_name RLIKE "(?i)geor.*" | keep first_name
;

first_name:keyword
;


caseInsensitiveRegex2
from employees | where first_name RLIKE "(?i)Geor.*" | keep first_name
;

first_name:keyword
;


caseInsensitiveRegexFold
required_capability: fixed_regex_fold
row foo = "Bar" | where foo rlike "(?i)ba.*"
;

foo:keyword
;


caseInsensitiveRegexFold2
required_capability: fixed_regex_fold
row foo = "Bar" | where foo rlike "(?i)Ba.*"
;

foo:keyword
;


Original file line number Diff line number Diff line change
Expand Up @@ -407,7 +407,12 @@ public enum Cap {
/**
* Fix pushdown of LIMIT past MV_EXPAND
*/
ADD_LIMIT_INSIDE_MV_EXPAND;
ADD_LIMIT_INSIDE_MV_EXPAND,

/**
* Fix for regex folding with case-insensitive pattern https://github.com/elastic/elasticsearch/issues/118371
*/
FIXED_REGEX_FOLD;

private final boolean enabled;

Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -79,7 +79,7 @@ public String getWriteableName() {
}

@Override
protected NodeInfo<org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLike> info() {
protected NodeInfo<RLike> info() {
return NodeInfo.create(this, RLike::new, field(), pattern(), caseInsensitive());
}

Expand All @@ -93,6 +93,11 @@ protected TypeResolution resolveType() {
return isString(field(), sourceText(), DEFAULT);
}

@Override
public Boolean fold() {
return (Boolean) EvaluatorMapper.super.fold();
}

@Override
public EvalOperator.ExpressionEvaluator.Factory toEvaluator(ToEvaluator toEvaluator) {
return AutomataMatch.toEvaluator(source(), toEvaluator.apply(field()), pattern().createAutomaton());
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -99,6 +99,11 @@ protected TypeResolution resolveType() {
return isString(field(), sourceText(), DEFAULT);
}

@Override
public Boolean fold() {
return (Boolean) EvaluatorMapper.super.fold();
}

@Override
public EvalOperator.ExpressionEvaluator.Factory toEvaluator(ToEvaluator toEvaluator) {
return AutomataMatch.toEvaluator(
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -17,13 +17,11 @@
import org.elasticsearch.xpack.esql.core.expression.predicate.logical.And;
import org.elasticsearch.xpack.esql.core.expression.predicate.logical.Not;
import org.elasticsearch.xpack.esql.core.expression.predicate.logical.Or;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.Like;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.LikePattern;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLike;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLikePattern;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.WildcardLike;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.WildcardPattern;
import org.elasticsearch.xpack.esql.core.type.DataType;
import org.elasticsearch.xpack.esql.expression.function.scalar.string.RLike;
import org.elasticsearch.xpack.esql.expression.function.scalar.string.WildcardLike;
import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Add;
import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Div;
import org.elasticsearch.xpack.esql.expression.predicate.operator.arithmetic.Mod;
Expand Down Expand Up @@ -101,7 +99,6 @@ public void testConstantNot() {
}

public void testConstantFoldingLikes() {
assertEquals(TRUE, new ConstantFolding().rule(new Like(EMPTY, of("test_emp"), new LikePattern("test%", (char) 0))).canonical());
assertEquals(TRUE, new ConstantFolding().rule(new WildcardLike(EMPTY, of("test_emp"), new WildcardPattern("test*"))).canonical());
assertEquals(TRUE, new ConstantFolding().rule(new RLike(EMPTY, of("test_emp"), new RLikePattern("test.emp"))).canonical());
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -199,7 +199,7 @@ public void testPushDownFilterOnAliasInEval() {

public void testPushDownLikeRlikeFilter() {
EsRelation relation = relation();
org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLike conditionA = rlike(getFieldAttribute("a"), "foo");
RLike conditionA = rlike(getFieldAttribute("a"), "foo");
WildcardLike conditionB = wildcardLike(getFieldAttribute("b"), "bar");

Filter fa = new Filter(EMPTY, relation, conditionA);
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -13,11 +13,11 @@
import org.elasticsearch.xpack.esql.core.expression.predicate.nulls.IsNotNull;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.Like;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.LikePattern;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLike;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.RLikePattern;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.WildcardLike;
import org.elasticsearch.xpack.esql.core.expression.predicate.regex.WildcardPattern;
import org.elasticsearch.xpack.esql.core.util.StringUtils;
import org.elasticsearch.xpack.esql.expression.function.scalar.string.RLike;
import org.elasticsearch.xpack.esql.expression.function.scalar.string.WildcardLike;
import org.elasticsearch.xpack.esql.expression.predicate.operator.comparison.Equals;

import static java.util.Arrays.asList;
Expand Down

0 comments on commit 549eea7

Please sign in to comment.