QueryBuilder: Support : in field values
Prior to this change, "field:foo:bar" is parsed as "field:foo", silently discarding the ":bar". Worse, "field:foo:bar baz:quux" is _also_ parsed as "field:foo", discarding not just part of the first term but the entire second term. Fix this by treating "SINGLE_WORD ':' fieldValue" as a valid definition of a field value, and add tests. This solution seems inelegant in general; it seems like we should be able to concatenate the tokens together into a single AST node at the Antlr level. Also, it doesn't work in all cases: it fails to parse field values ending in ':' I'm far from an Antlr expert and there may be a better/easier way to do this. But this change is still strictly better than it was before, and it sets an example of how to write tests for parser functionality. Change-Id: If275623b3244b02f81114fb2997ba16ee1492a4f
This commit is contained in:
@@ -120,13 +120,24 @@ conditionNot
|
|||||||
;
|
;
|
||||||
conditionBase
|
conditionBase
|
||||||
: '('! conditionOr ')'!
|
: '('! conditionOr ')'!
|
||||||
| (FIELD_NAME ':') => FIELD_NAME^ ':'! fieldValue
|
| (FIELD_NAME COLON) => FIELD_NAME^ COLON! fieldValue
|
||||||
| fieldValue -> ^(DEFAULT_FIELD fieldValue)
|
| fieldValue -> ^(DEFAULT_FIELD fieldValue)
|
||||||
;
|
;
|
||||||
|
|
||||||
fieldValue
|
fieldValue
|
||||||
// Rewrite by invoking SINGLE_WORD fragment lexer rule, passing the field name as an argument.
|
// Rewrite by invoking SINGLE_WORD fragment lexer rule, passing the field name as an argument.
|
||||||
: n=FIELD_NAME -> SINGLE_WORD[n]
|
: n=FIELD_NAME -> SINGLE_WORD[n]
|
||||||
|
|
||||||
|
// Allow field values to contain a colon. We can't do this at the lexer level, because we need to
|
||||||
|
// emit a separate token for the field name. If we were to allow ':' in SINGLE_WORD, then
|
||||||
|
// everything would just lex as DEFAULT_FIELD.
|
||||||
|
//
|
||||||
|
// Field values with a colon may be lexed either as <field>:<rest> or <word>:<rest>, depending on
|
||||||
|
// whether the part before the colon looks like a field name.
|
||||||
|
// TODO(dborowitz): Field values ending in colon still don't work.
|
||||||
|
| (FIELD_NAME COLON) => n=FIELD_NAME COLON fieldValue -> SINGLE_WORD[n] COLON fieldValue
|
||||||
|
| (SINGLE_WORD COLON) => SINGLE_WORD COLON fieldValue
|
||||||
|
|
||||||
| SINGLE_WORD
|
| SINGLE_WORD
|
||||||
| EXACT_PHRASE
|
| EXACT_PHRASE
|
||||||
;
|
;
|
||||||
@@ -135,6 +146,8 @@ AND: 'AND' ;
|
|||||||
OR: 'OR' ;
|
OR: 'OR' ;
|
||||||
NOT: 'NOT' ;
|
NOT: 'NOT' ;
|
||||||
|
|
||||||
|
COLON: ':' ;
|
||||||
|
|
||||||
WS
|
WS
|
||||||
: ( ' ' | '\r' | '\t' | '\n' ) { $channel=HIDDEN; }
|
: ( ' ' | '\r' | '\t' | '\n' ) { $channel=HIDDEN; }
|
||||||
;
|
;
|
||||||
@@ -173,7 +186,7 @@ fragment NON_WORD
|
|||||||
// '-' permit
|
// '-' permit
|
||||||
// '.' permit
|
// '.' permit
|
||||||
// '/' permit
|
// '/' permit
|
||||||
| ':'
|
| COLON
|
||||||
| ';'
|
| ';'
|
||||||
// '<' permit
|
// '<' permit
|
||||||
// '=' permit
|
// '=' permit
|
||||||
|
@@ -18,6 +18,7 @@ import static com.google.gerrit.index.query.Predicate.and;
|
|||||||
import static com.google.gerrit.index.query.Predicate.not;
|
import static com.google.gerrit.index.query.Predicate.not;
|
||||||
import static com.google.gerrit.index.query.Predicate.or;
|
import static com.google.gerrit.index.query.Predicate.or;
|
||||||
import static com.google.gerrit.index.query.QueryParser.AND;
|
import static com.google.gerrit.index.query.QueryParser.AND;
|
||||||
|
import static com.google.gerrit.index.query.QueryParser.COLON;
|
||||||
import static com.google.gerrit.index.query.QueryParser.DEFAULT_FIELD;
|
import static com.google.gerrit.index.query.QueryParser.DEFAULT_FIELD;
|
||||||
import static com.google.gerrit.index.query.QueryParser.EXACT_PHRASE;
|
import static com.google.gerrit.index.query.QueryParser.EXACT_PHRASE;
|
||||||
import static com.google.gerrit.index.query.QueryParser.FIELD_NAME;
|
import static com.google.gerrit.index.query.QueryParser.FIELD_NAME;
|
||||||
@@ -217,24 +218,41 @@ public abstract class QueryBuilder<T> {
|
|||||||
return defaultField(onlyChildOf(r));
|
return defaultField(onlyChildOf(r));
|
||||||
|
|
||||||
case FIELD_NAME:
|
case FIELD_NAME:
|
||||||
return operator(r.getText(), onlyChildOf(r));
|
return operator(r.getText(), concatenateChildText(r));
|
||||||
|
|
||||||
default:
|
default:
|
||||||
throw error("Unsupported operator: " + r);
|
throw error("Unsupported operator: " + r);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
private Predicate<T> operator(String name, Tree val) throws QueryParseException {
|
private static String concatenateChildText(Tree r) throws QueryParseException {
|
||||||
switch (val.getType()) {
|
if (r.getChildCount() == 0) {
|
||||||
case SINGLE_WORD:
|
throw error("Expected children under: " + r);
|
||||||
case EXACT_PHRASE:
|
}
|
||||||
if (val.getChildCount() != 0) {
|
if (r.getChildCount() == 1) {
|
||||||
throw error("Expected no children under: " + val);
|
return getFieldValue(r.getChild(0));
|
||||||
}
|
}
|
||||||
return operator(name, val.getText());
|
StringBuilder sb = new StringBuilder();
|
||||||
|
for (int i = 0; i < r.getChildCount(); i++) {
|
||||||
|
sb.append(getFieldValue(r.getChild(i)));
|
||||||
|
}
|
||||||
|
return sb.toString();
|
||||||
|
}
|
||||||
|
|
||||||
|
private static String getFieldValue(Tree r) throws QueryParseException {
|
||||||
|
if (r.getChildCount() != 0) {
|
||||||
|
throw error("Expected no children under: " + r);
|
||||||
|
}
|
||||||
|
switch (r.getType()) {
|
||||||
|
case SINGLE_WORD:
|
||||||
|
case COLON:
|
||||||
|
case EXACT_PHRASE:
|
||||||
|
return r.getText();
|
||||||
default:
|
default:
|
||||||
throw error("Unsupported node in operator " + name + ": " + val);
|
throw error(
|
||||||
|
String.format(
|
||||||
|
"Unsupported %s node in operator %s: %s",
|
||||||
|
QueryParser.tokenNames[r.getType()], r.getParent(), r));
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@@ -75,6 +75,41 @@ public class QueryBuilderTest extends GerritBaseTests {
|
|||||||
.isEqualTo("line 1:2 no viable alternative at input '('");
|
.isEqualTo("line 1:2 no viable alternative at input '('");
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeFieldNameColonValue() throws Exception {
|
||||||
|
assertThat(parse("a:foo:bar")).isEqualTo(new TestPredicate("a", "foo:bar"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeWordColonValue() throws Exception {
|
||||||
|
assertThat(parse("a:*:bar")).isEqualTo(new TestPredicate("a", "*:bar"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueWithMultipleColons() throws Exception {
|
||||||
|
assertThat(parse("a:*:*:*")).isEqualTo(new TestPredicate("a", "*:*:*"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void exactPhraseWithQuotes() throws Exception {
|
||||||
|
assertThat(parse("a:\"foo bar\"")).isEqualTo(new TestPredicate("a", "foo bar"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void exactPhraseWithQuotesAndColon() throws Exception {
|
||||||
|
assertThat(parse("a:\"foo:bar\"")).isEqualTo(new TestPredicate("a", "foo:bar"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void exactPhraseWithBraces() throws Exception {
|
||||||
|
assertThat(parse("a:{foo bar}")).isEqualTo(new TestPredicate("a", "foo bar"));
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void exactPhraseWithBracesAndColon() throws Exception {
|
||||||
|
assertThat(parse("a:{foo:bar}")).isEqualTo(new TestPredicate("a", "foo:bar"));
|
||||||
|
}
|
||||||
|
|
||||||
private static Predicate<Object> parse(String query) throws Exception {
|
private static Predicate<Object> parse(String query) throws Exception {
|
||||||
return new TestQueryBuilder().parse(query);
|
return new TestQueryBuilder().parse(query);
|
||||||
}
|
}
|
||||||
|
@@ -14,6 +14,9 @@
|
|||||||
|
|
||||||
package com.google.gerrit.index.query;
|
package com.google.gerrit.index.query;
|
||||||
|
|
||||||
|
import static com.google.common.truth.Truth.assert_;
|
||||||
|
import static com.google.gerrit.index.query.QueryParser.AND;
|
||||||
|
import static com.google.gerrit.index.query.QueryParser.COLON;
|
||||||
import static com.google.gerrit.index.query.QueryParser.FIELD_NAME;
|
import static com.google.gerrit.index.query.QueryParser.FIELD_NAME;
|
||||||
import static com.google.gerrit.index.query.QueryParser.SINGLE_WORD;
|
import static com.google.gerrit.index.query.QueryParser.SINGLE_WORD;
|
||||||
import static com.google.gerrit.index.query.QueryParser.parse;
|
import static com.google.gerrit.index.query.QueryParser.parse;
|
||||||
@@ -34,4 +37,163 @@ public class QueryParserTest extends GerritBaseTests {
|
|||||||
assertThat(r).child(0).hasText("tools/gerrit");
|
assertThat(r).child(0).hasText("tools/gerrit");
|
||||||
assertThat(r).child(0).hasNoChildren();
|
assertThat(r).child(0).hasNoChildren();
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeFieldNameColon() throws Exception {
|
||||||
|
// This should work, but doesn't due to a known issue.
|
||||||
|
assertParseFails("project:foo:");
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeFieldNameColonValue() throws Exception {
|
||||||
|
Tree r = parse("project:foo:bar");
|
||||||
|
assertThat(r).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).hasText("project");
|
||||||
|
assertThat(r).hasChildCount(3);
|
||||||
|
assertThat(r).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).hasText("foo");
|
||||||
|
assertThat(r).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(1).hasText(":");
|
||||||
|
assertThat(r).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(2).hasText("bar");
|
||||||
|
assertThat(r).child(2).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeWordColonValue() throws Exception {
|
||||||
|
Tree r = parse("project:x*y:a*b");
|
||||||
|
assertThat(r).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).hasText("project");
|
||||||
|
assertThat(r).hasChildCount(3);
|
||||||
|
assertThat(r).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).hasText("x*y");
|
||||||
|
assertThat(r).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(1).hasText(":");
|
||||||
|
assertThat(r).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(2).hasText("a*b");
|
||||||
|
assertThat(r).child(2).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueThatLooksLikeWordColon() throws Exception {
|
||||||
|
// This should work, but doesn't due to a known issue.
|
||||||
|
assertParseFails("project:x*y:");
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueWithMultipleColons() throws Exception {
|
||||||
|
Tree r = parse("project:*:*:*");
|
||||||
|
assertThat(r).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).hasText("project");
|
||||||
|
assertThat(r).hasChildCount(5);
|
||||||
|
assertThat(r).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).hasText("*");
|
||||||
|
assertThat(r).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(1).hasText(":");
|
||||||
|
assertThat(r).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(2).hasText("*");
|
||||||
|
assertThat(r).child(2).hasNoChildren();
|
||||||
|
assertThat(r).child(3).hasType(COLON);
|
||||||
|
assertThat(r).child(3).hasText(":");
|
||||||
|
assertThat(r).child(3).hasNoChildren();
|
||||||
|
assertThat(r).child(4).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(4).hasText("*");
|
||||||
|
assertThat(r).child(4).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueWithColonFollowedByAnotherField() throws Exception {
|
||||||
|
Tree r = parse("project:foo:bar file:baz");
|
||||||
|
assertThat(r).hasType(AND);
|
||||||
|
assertThat(r).hasChildCount(2);
|
||||||
|
|
||||||
|
assertThat(r).child(0).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(0).hasText("project");
|
||||||
|
assertThat(r).child(0).hasChildCount(3);
|
||||||
|
assertThat(r).child(0).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(0).hasText("foo");
|
||||||
|
assertThat(r).child(0).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(0).child(1).hasText(":");
|
||||||
|
assertThat(r).child(0).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(2).hasText("bar");
|
||||||
|
assertThat(r).child(0).child(2).hasNoChildren();
|
||||||
|
|
||||||
|
assertThat(r).child(1).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(1).hasText("file");
|
||||||
|
assertThat(r).child(1).hasChildCount(1);
|
||||||
|
assertThat(r).child(1).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(1).child(0).hasText("baz");
|
||||||
|
assertThat(r).child(1).child(0).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueWithColonFollowedByOpenParen() throws Exception {
|
||||||
|
Tree r = parse("project:foo:bar (file:baz)");
|
||||||
|
assertThat(r).hasType(AND);
|
||||||
|
assertThat(r).hasChildCount(2);
|
||||||
|
|
||||||
|
assertThat(r).child(0).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(0).hasText("project");
|
||||||
|
assertThat(r).child(0).hasChildCount(3);
|
||||||
|
assertThat(r).child(0).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(0).hasText("foo");
|
||||||
|
assertThat(r).child(0).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(0).child(1).hasText(":");
|
||||||
|
assertThat(r).child(0).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(2).hasText("bar");
|
||||||
|
assertThat(r).child(0).child(2).hasNoChildren();
|
||||||
|
|
||||||
|
assertThat(r).child(1).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(1).hasText("file");
|
||||||
|
assertThat(r).child(1).hasChildCount(1);
|
||||||
|
assertThat(r).child(1).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(1).child(0).hasText("baz");
|
||||||
|
assertThat(r).child(1).child(0).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
@Test
|
||||||
|
public void fieldNameAndValueWithColonFollowedByCloseParen() throws Exception {
|
||||||
|
Tree r = parse("(project:foo:bar) file:baz");
|
||||||
|
assertThat(r).hasType(AND);
|
||||||
|
assertThat(r).hasChildCount(2);
|
||||||
|
|
||||||
|
assertThat(r).child(0).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(0).hasText("project");
|
||||||
|
assertThat(r).child(0).hasChildCount(3);
|
||||||
|
assertThat(r).child(0).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(0).hasText("foo");
|
||||||
|
assertThat(r).child(0).child(0).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(1).hasType(COLON);
|
||||||
|
assertThat(r).child(0).child(1).hasText(":");
|
||||||
|
assertThat(r).child(0).child(1).hasNoChildren();
|
||||||
|
assertThat(r).child(0).child(2).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(0).child(2).hasText("bar");
|
||||||
|
assertThat(r).child(0).child(2).hasNoChildren();
|
||||||
|
|
||||||
|
assertThat(r).child(1).hasType(FIELD_NAME);
|
||||||
|
assertThat(r).child(1).hasText("file");
|
||||||
|
assertThat(r).child(1).hasChildCount(1);
|
||||||
|
assertThat(r).child(1).child(0).hasType(SINGLE_WORD);
|
||||||
|
assertThat(r).child(1).child(0).hasText("baz");
|
||||||
|
assertThat(r).child(1).child(0).hasNoChildren();
|
||||||
|
}
|
||||||
|
|
||||||
|
private static void assertParseFails(String query) {
|
||||||
|
try {
|
||||||
|
parse(query);
|
||||||
|
assert_().fail("expected parse to fail: %s", query);
|
||||||
|
} catch (QueryParseException e) {
|
||||||
|
// Expected.
|
||||||
|
}
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
Reference in New Issue
Block a user