Skip to content

Commit

Permalink
Fix the issue that missing identifiers from ANTLR keywords (opensearc…
Browse files Browse the repository at this point in the history
…h-project#821)

Signed-off-by: Lantao Jin <[email protected]>
  • Loading branch information
LantaoJin authored Oct 29, 2024
1 parent ce50567 commit 9d2f94d
Show file tree
Hide file tree
Showing 3 changed files with 55 additions and 69 deletions.
4 changes: 0 additions & 4 deletions ppl-spark-integration/src/main/antlr4/OpenSearchPPLLexer.g4
Original file line number Diff line number Diff line change
Expand Up @@ -74,13 +74,9 @@ INDEX: 'INDEX';
D: 'D';
DESC: 'DESC';
DATASOURCES: 'DATASOURCES';
VALUE: 'VALUE';
USING: 'USING';
WITH: 'WITH';

// CLAUSE KEYWORDS
SORTBY: 'SORTBY';

// FIELD KEYWORDS
AUTO: 'AUTO';
STR: 'STR';
Expand Down
106 changes: 54 additions & 52 deletions ppl-spark-integration/src/main/antlr4/OpenSearchPPLParser.g4
Original file line number Diff line number Diff line change
Expand Up @@ -55,6 +55,35 @@ commands
| fieldsummaryCommand
;

commandName
: SEARCH
| DESCRIBE
| SHOW
| AD
| ML
| KMEANS
| WHERE
| CORRELATE
| JOIN
| FIELDS
| STATS
| EVENTSTATS
| DEDUP
| EXPLAIN
| SORT
| HEAD
| TOP
| RARE
| EVAL
| GROK
| PARSE
| PATTERNS
| LOOKUP
| RENAME
| FILLNULL
| FIELDSUMMARY
;

searchCommand
: (SEARCH)? fromClause # searchFrom
| (SEARCH)? fromClause logicalExpression # searchFromFilter
Expand Down Expand Up @@ -360,14 +389,6 @@ statsFunctionName
| STDDEV_POP
;

takeAggFunction
: TAKE LT_PRTHS fieldExpression (COMMA size = integerLiteral)? RT_PRTHS
;

percentileAggFunction
: PERCENTILE LESS value = integerLiteral GREATER LT_PRTHS aggField = fieldExpression RT_PRTHS
;

// expressions
expression
: logicalExpression
Expand Down Expand Up @@ -999,46 +1020,37 @@ keywordsCanBeId
| mathematicalFunctionName
| positionFunctionName
| cryptographicFunctionName
// commands
| SEARCH
| DESCRIBE
| SHOW
| FROM
| WHERE
| CORRELATE
| FIELDS
| RENAME
| STATS
| DEDUP
| SORT
| EVAL
| HEAD
| TOP
| RARE
| PARSE
| METHOD
| REGEX
| PUNCT
| GROK
| PATTERN
| PATTERNS
| NEW_FIELD
| KMEANS
| AD
| ML
| EXPLAIN
| singleFieldRelevanceFunctionName
| multiFieldRelevanceFunctionName
| commandName
| comparisonOperator
| explainMode
| correlationType
// commands assist keywords
| IN
| SOURCE
| INDEX
| DESC
| DATASOURCES
// CLAUSEKEYWORDS
| SORTBY
// FIELDKEYWORDSAUTO
| AUTO
| STR
| IP
| NUM
| FROM
| PATTERN
| NEW_FIELD
| SCOPE
| MAPPING
| WITH
| USING
| CAST
| GET_FORMAT
| EXTRACT
| INTERVAL
| PLUS
| MINUS
| INCLUDEFIELDS
| NULLS
// ARGUMENT KEYWORDS
| KEEPEMPTY
| CONSECUTIVE
Expand All @@ -1061,27 +1073,21 @@ keywordsCanBeId
| TRAINING_DATA_SIZE
| ANOMALY_SCORE_THRESHOLD
// AGGREGATIONS
| AVG
| COUNT
| statsFunctionName
| DISTINCT_COUNT
| PERCENTILE
| PERCENTILE_APPROX
| ESTDC
| ESTDC_ERROR
| MAX
| MEAN
| MEDIAN
| MIN
| MODE
| RANGE
| STDEV
| STDEVP
| SUM
| SUMSQ
| VAR_SAMP
| VAR_POP
| STDDEV_SAMP
| STDDEV_POP
| PERCENTILE
| PERCENTILE_APPROX
| TAKE
| FIRST
| LAST
Expand All @@ -1099,10 +1105,6 @@ keywordsCanBeId
| SPARKLINE
| C
| DC
// FIELD SUMMARY
| FIELDSUMMARY
| INCLUDEFIELDS
| NULLS
// JOIN TYPE
| OUTER
| INNER
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -22,7 +22,6 @@
import org.opensearch.sql.ast.expression.DataType;
import org.opensearch.sql.ast.expression.EqualTo;
import org.opensearch.sql.ast.expression.Field;
import org.opensearch.sql.ast.expression.FieldList;
import org.opensearch.sql.ast.expression.Function;
import org.opensearch.sql.ast.expression.In;
import org.opensearch.sql.ast.expression.subquery.ExistsSubquery;
Expand All @@ -42,7 +41,6 @@
import org.opensearch.sql.ast.expression.UnresolvedExpression;
import org.opensearch.sql.ast.expression.When;
import org.opensearch.sql.ast.expression.Xor;
import org.opensearch.sql.ast.tree.UnresolvedPlan;
import org.opensearch.sql.common.utils.StringUtils;
import org.opensearch.sql.ppl.utils.ArgumentFactory;

Expand All @@ -54,8 +52,6 @@
import java.util.stream.IntStream;
import java.util.stream.Stream;

import static org.opensearch.flint.spark.ppl.OpenSearchPPLParser.INCLUDEFIELDS;
import static org.opensearch.flint.spark.ppl.OpenSearchPPLParser.NULLS;
import static org.opensearch.sql.expression.function.BuiltinFunctionName.EQUAL;
import static org.opensearch.sql.expression.function.BuiltinFunctionName.IS_NOT_NULL;
import static org.opensearch.sql.expression.function.BuiltinFunctionName.IS_NULL;
Expand All @@ -81,7 +77,7 @@ public void setAstBuilder(AstBuilder astBuilder) {
/**
* The function name mapping between fronted and core engine.
*/
private static Map<String, String> FUNCTION_NAME_MAPPING =
private static final Map<String, String> FUNCTION_NAME_MAPPING =
new ImmutableMap.Builder<String, String>()
.put("isnull", IS_NULL.getName().getFunctionName())
.put("isnotnull", IS_NOT_NULL.getName().getFunctionName())
Expand Down Expand Up @@ -217,14 +213,6 @@ public UnresolvedExpression visitDistinctCountFunctionCall(OpenSearchPPLParser.D
return new AggregateFunction("count", visit(ctx.valueExpression()), true);
}

@Override
public UnresolvedExpression visitPercentileAggFunction(OpenSearchPPLParser.PercentileAggFunctionContext ctx) {
return new AggregateFunction(
ctx.PERCENTILE().getText(),
visit(ctx.aggField),
Collections.singletonList(new Argument("rank", (Literal) visit(ctx.value))));
}

@Override
public UnresolvedExpression visitPercentileFunctionCall(OpenSearchPPLParser.PercentileFunctionCallContext ctx) {
return new AggregateFunction(
Expand Down

0 comments on commit 9d2f94d

Please sign in to comment.