elastic · matriv · Jan 31, 2019 · Jan 26, 2019 · Jan 30, 2019 · Jan 30, 2019
diff --git a/docs/reference/sql/functions/aggs.asciidoc b/docs/reference/sql/functions/aggs.asciidoc
@@ -113,6 +113,129 @@ Returns the total number of _distinct non-null_ values in input values.
 include-tagged::{sql-specs}/docs.csv-spec[aggCountDistinct]
 --------------------------------------------------
 
+[[sql-functions-aggs-first]]
+===== `FIRST/FIRST_VALUE`
+
+.Synopsis:
+[source, sql]
+--------------------------------------------------
+FIRST(field_name<1>, sort_by_field_name<2>)
+--------------------------------------------------
+
+*Input*:
+
+<1> a field name
+<2> a field name; optional
+
+*Output*: same type as the input
+
+.Description:
+
+When only one argument is provided, it returns the first **non-NULL** value across input values in the field
+`field_name`. It returns **NULL** only if all values in `field_name` are **NULL**. When a second argument
+is provided, it returns the first **non-NULL** value across input values in the field `field_name`, ordered
+ascending by the **non-NULL** values of `sort_by_field_name`. For example:
+
+[cols="<,<"]
+|===
+s|a|b
+| 100 | 1
+| 200 | 1
+| 1 | 2
+| 2 | 2
+| 10 | null
+| 20 | null
+
+|===
+
+[source, sql]
+-------------------------
+SELECT FIRST(a, b) FROM t
+-------------------------
+
+will result in:
+[cols="<"]
+|===
+s|FIRST(a, b)
+| 100
+|===
+
+
+["source","sql",subs="attributes,macros"]
+-----------------------------------------------------------
+include-tagged::{sql-specs}/docs.csv-spec[firstWithOneArg]
+-----------------------------------------------------------
+
+["source","sql",subs="attributes,macros"]
+-----------------------------------------------------------
+include-tagged::{sql-specs}/docs.csv-spec[firstWithTwoArgs]
+-----------------------------------------------------------
+
+[NOTE]
+`FIRST` cannot be used to create a filter in a `HAVING` clause of a `GROUP BY` query.
+
+[[sql-functions-aggs-last]]
+===== `LAST/LAST_VALUE`
+
+.Synopsis:
+[source, sql]
+--------------------------------------------------
+LAST(field_name<1>, sort_by_field_name<2>)
+--------------------------------------------------
+
+*Input*:
+
+<1> a field name
+<2> a field name; optional
+
+*Output*: same type as the input
+
+.Description:
+
+It's the inverse of <<sql-functions-aggs-first>>. When only one argument is provided, it returns the
+last **non-NULL** value across input values in the field `field_name`. It returns **NULL** only if
+all values in `field_name` are **NULL**. When a second argument is provided, it returns the last
+**non-NULL** value across input values in the field `field_name`, ordered descending by the **non-NULL**
+values of `sort_by_field_name`. For example:
+
+[cols="<,<"]
+|===
+s|a|b
+| 10 | 1
+| 20 | 1
+| 1 | 2
+| 2 | 2
+| 100 | null
+| 200 | null
+|===
+
+[source, sql]
+------------------------
+SELECT LAST(a, b) FROM t
+------------------------
+
+will result in:
+[cols="<"]
+|===
+s|LAST(a, b)
+| 2
+|===
+
+
+["source","sql",subs="attributes,macros"]
+-----------------------------------------------------------
+include-tagged::{sql-specs}/docs.csv-spec[lastWithOneArg]
+-----------------------------------------------------------
+
+["source","sql",subs="attributes,macros"]
+-----------------------------------------------------------
+include-tagged::{sql-specs}/docs.csv-spec[lastWithTwoArgs]
+-----------------------------------------------------------
+
+[NOTE]
+`LAST` cannot be used to create a filter in a `HAVING` clause of a `GROUP BY` query.
+
+
 [[sql-functions-aggs-max]]
 ===== `MAX`
 
@@ -161,6 +284,9 @@ Returns the minimum value across input values in the field `field_name`.
 include-tagged::{sql-specs}/docs.csv-spec[aggMin]
 --------------------------------------------------
 
+[NOTE]
+`MIN` on a field of type <<text, `text`>> or <<keyword, `keyword`>> is translated into <<sql-functions-aggs-first>>.
+
 [[sql-functions-aggs-sum]]
 ===== `SUM`
 

diff --git a/x-pack/plugin/sql/qa/src/main/java/org/elasticsearch/xpack/sql/qa/cli/ShowTestCase.java b/x-pack/plugin/sql/qa/src/main/java/org/elasticsearch/xpack/sql/qa/cli/ShowTestCase.java
@@ -31,6 +31,10 @@ public void testShowFunctions() throws IOException {
         assertThat(readLine(), containsString(HEADER_SEPARATOR));
         assertThat(readLine(), RegexMatcher.matches("\\s*AVG\\s*\\|\\s*AGGREGATE\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*COUNT\\s*\\|\\s*AGGREGATE\\s*"));
+        assertThat(readLine(), RegexMatcher.matches("\\s*FIRST\\s*\\|\\s*AGGREGATE\\s*"));
+        assertThat(readLine(), RegexMatcher.matches("\\s*FIRST_VALUE\\s*\\|\\s*AGGREGATE\\s*"));
+        assertThat(readLine(), RegexMatcher.matches("\\s*LAST\\s*\\|\\s*AGGREGATE\\s*"));
+        assertThat(readLine(), RegexMatcher.matches("\\s*LAST_VALUE\\s*\\|\\s*AGGREGATE\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*MAX\\s*\\|\\s*AGGREGATE\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*MIN\\s*\\|\\s*AGGREGATE\\s*"));
         String line = readLine();
@@ -58,6 +62,8 @@ public void testShowFunctions() throws IOException {
     public void testShowFunctionsLikePrefix() throws IOException {
         assertThat(command("SHOW FUNCTIONS LIKE 'L%'"), RegexMatcher.matches("\\s*name\\s*\\|\\s*type\\s*"));
         assertThat(readLine(), containsString(HEADER_SEPARATOR));
+        assertThat(readLine(), RegexMatcher.matches("\\s*LAST\\s*\\|\\s*AGGREGATE\\s*"));
+        assertThat(readLine(), RegexMatcher.matches("\\s*LAST_VALUE\\s*\\|\\s*AGGREGATE\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*LEAST\\s*\\|\\s*CONDITIONAL\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*LOG\\s*\\|\\s*SCALAR\\s*"));
         assertThat(readLine(), RegexMatcher.matches("\\s*LOG10\\s*\\|\\s*SCALAR\\s*"));

diff --git a/x-pack/plugin/sql/qa/src/main/resources/agg.csv-spec b/x-pack/plugin/sql/qa/src/main/resources/agg.csv-spec
@@ -373,3 +373,36 @@ SELECT COUNT(ALL last_name)=COUNT(ALL first_name) AS areEqual, COUNT(ALL first_n
 ---------------+---------------+---------------
 false          |90             |100
 ;
+
+topHitsWithOneArgAndGroupBy
+schema::gender:s|first:s|last:s
+SELECT gender, FIRST(first_name) as first, LAST(first_name) as last FROM test_emp GROUP BY gender ORDER BY gender;
+
+    gender     |   first       |   last
+---------------+---------------+------------
+null           |   Berni       |   Patricio
+F              |   Alejandro   |   Xinglin
+M              |   Amabile     |   Zvonko
+;
+
+topHitsWithTwoArgsAndGroupBy
+schema::gender:s|first:s|last:s
+SELECT gender, FIRST(first_name, birth_date) as first, LAST(first_name, birth_date) as last FROM test_emp GROUP BY gender ORDER BY gender;
+
+    gender     |   first       |   last
+---------------+---------------+-----------------
+null           |   Lillian     |   Eberhardt
+F              |   Sumant      |   Valdiodio
+M              |   Remzi       |   Hilari
+;
+
+topHitsOnDatetime
+schema::gender:s|first:i|last:i
+SELECT gender, month(first(birth_date, languages)) first, month(last(birth_date, languages)) last FROM test_emp GROUP BY gender ORDER BY gender;
+
+    gender     |   first       |   last
+---------------+---------------+---------------
+null           |   1           |   10
+F              |   4           |   6
+M              |   1           |   4
+;
diff --git a/x-pack/plugin/sql/qa/src/main/resources/command.csv-spec b/x-pack/plugin/sql/qa/src/main/resources/command.csv-spec
@@ -8,8 +8,12 @@ SHOW FUNCTIONS;
 
     name:s       |    type:s
 AVG              |AGGREGATE      
-COUNT            |AGGREGATE      
-MAX              |AGGREGATE      
+COUNT            |AGGREGATE
+FIRST            |AGGREGATE
+FIRST_VALUE      |AGGREGATE
+LAST             |AGGREGATE
+LAST_VALUE       |AGGREGATE
+MAX              |AGGREGATE
 MIN              |AGGREGATE      
 SUM              |AGGREGATE      
 KURTOSIS         |AGGREGATE      

diff --git a/x-pack/plugin/sql/qa/src/main/resources/docs.csv-spec b/x-pack/plugin/sql/qa/src/main/resources/docs.csv-spec
@@ -185,7 +185,11 @@ SHOW FUNCTIONS;
       name       |     type      
 -----------------+---------------
 AVG              |AGGREGATE      
-COUNT            |AGGREGATE      
+COUNT            |AGGREGATE
+FIRST            |AGGREGATE
+FIRST_VALUE      |AGGREGATE
+LAST             |AGGREGATE
+LAST_VALUE       |AGGREGATE
 MAX              |AGGREGATE      
 MIN              |AGGREGATE      
 SUM              |AGGREGATE      
@@ -699,6 +703,8 @@ SELECT MIN(salary) AS min, MAX(salary) AS max FROM emp HAVING min > 25000;
 // end::groupByHavingImplicitNoMatch
 //;
 
+
+
 ///////////////////////////////
 //
 // Grouping
@@ -998,6 +1004,55 @@ SELECT COUNT(DISTINCT hire_date) unique_hires, COUNT(hire_date) AS hires FROM em
 // end::aggCountDistinct
 ;
 
+firstWithOneArg
+schema::FIRST(first_name):s
+// tag::firstWithOneArg
+SELECT FIRST(first_name) FROM emp;
+
+FIRST(first_name)
+-----------------
+Alejandro
+
+// end::firstWithOneArg
+;
+
+firstWithTwoArgs
+schema::FIRST(first_name, birth_date):s
+// tag::firstWithTwoArgs
+SELECT FIRST(first_name, birth_date) FROM emp;
+
+FIRST(first_name, birth_date)
+-----------------------------
+Remzi
+
+// end::firstWithTwoArgs
+;
+
+lastWithOneArg
+schema::LAST(first_name):s
+// tag::lastWithOneArg
+SELECT LAST(first_name) FROM emp;
+
+LAST(first_name)
+----------------
+Zvonko
+
+// end::lastWithOneArg
+;
+
+
+lastWithTwoArgs
+schema::LAST(first_name, birth_date):s
+// tag::lastWithTwoArgs
+SELECT LAST(first_name, birth_date) FROM emp;
+
+LAST(first_name, birth_date)
+----------------------------
+Hilari
+
+// end::lastWithTwoArgs
+;
+
 aggMax
 // tag::aggMax
 SELECT MAX(salary) AS max FROM emp;

diff --git a/x-pack/plugin/sql/src/main/java/org/elasticsearch/xpack/sql/analysis/analyzer/Verifier.java b/x-pack/plugin/sql/src/main/java/org/elasticsearch/xpack/sql/analysis/analyzer/Verifier.java
@@ -19,6 +19,7 @@
 import org.elasticsearch.xpack.sql.expression.function.Functions;
 import org.elasticsearch.xpack.sql.expression.function.Score;
 import org.elasticsearch.xpack.sql.expression.function.aggregate.AggregateFunctionAttribute;
+import org.elasticsearch.xpack.sql.expression.function.aggregate.TopHits;
 import org.elasticsearch.xpack.sql.expression.function.grouping.GroupingFunctionAttribute;
 import org.elasticsearch.xpack.sql.expression.function.scalar.ScalarFunction;
 import org.elasticsearch.xpack.sql.expression.predicate.conditional.ConditionalFunction;
@@ -366,16 +367,26 @@ private static boolean checkGroupByHaving(LogicalPlan p, Set<Failure> localFailu
             if (f.child() instanceof Aggregate) {
                 Aggregate a = (Aggregate) f.child();
 
-                Map<Expression, Node<?>> missing = new LinkedHashMap<>();
+                Set<Expression> missing = new LinkedHashSet<>();
+                Set<Expression> unsupported = new LinkedHashSet<>();
                 Expression condition = f.condition();
                 // variation of checkGroupMatch customized for HAVING, which requires just aggregations
-                condition.collectFirstChildren(c -> checkGroupByHavingHasOnlyAggs(c, condition, missing, functions));
+                condition.collectFirstChildren(c -> checkGroupByHavingHasOnlyAggs(c, missing, unsupported, functions));
 
                 if (!missing.isEmpty()) {
                     String plural = missing.size() > 1 ? "s" : StringUtils.EMPTY;
                     localFailures.add(
                             fail(condition, "Cannot use HAVING filter on non-aggregate" + plural + " %s; use WHERE instead",
-                            Expressions.names(missing.keySet())));
+                            Expressions.names(missing)));
+                    groupingFailures.add(a);
+                    return false;
+                }
+
+                if (!unsupported.isEmpty()) {
+                    String plural = unsupported.size() > 1 ? "s" : StringUtils.EMPTY;
+                    localFailures.add(
+                        fail(condition, "HAVING filter is unsupported for function" + plural + " %s",
+                            Expressions.names(unsupported)));
                     groupingFailures.add(a);
                     return false;
                 }
@@ -385,8 +396,8 @@ private static boolean checkGroupByHaving(LogicalPlan p, Set<Failure> localFailu
     }
 
 
-    private static boolean checkGroupByHavingHasOnlyAggs(Expression e, Node<?> source,
-            Map<Expression, Node<?>> missing, Map<String, Function> functions) {
+    private static boolean checkGroupByHavingHasOnlyAggs(Expression e, Set<Expression> missing,
+                                                         Set<Expression> unsupported, Map<String, Function> functions) {
 
         // resolve FunctionAttribute to backing functions
         if (e instanceof FunctionAttribute) {
@@ -407,13 +418,17 @@ private static boolean checkGroupByHavingHasOnlyAggs(Expression e, Node<?> sourc
 
             // unwrap function to find the base
             for (Expression arg : sf.arguments()) {
-                arg.collectFirstChildren(c -> checkGroupByHavingHasOnlyAggs(c, source, missing, functions));
+                arg.collectFirstChildren(c -> checkGroupByHavingHasOnlyAggs(c, missing, unsupported, functions));
             }
             return true;
 
         } else if (e instanceof Score) {
-            // Score can't be used for having
-            missing.put(e, source);
+            // Score can't be used in having
+            unsupported.add(e);
+            return true;
+        } else if (e instanceof TopHits) {
+            // First and last cannot be used in having
+            unsupported.add(e);
             return true;
         }
 
@@ -428,7 +443,7 @@ private static boolean checkGroupByHavingHasOnlyAggs(Expression e, Node<?> sourc
 
         // left without leaves which have to match; that's a failure since everything should be based on an agg
         if (e instanceof Attribute) {
-            missing.put(e, source);
+            missing.add(e);
             return true;
         }
 

diff --git a/x-pack/plugin/sql/src/main/java/org/elasticsearch/xpack/sql/execution/search/Querier.java b/x-pack/plugin/sql/src/main/java/org/elasticsearch/xpack/sql/execution/search/Querier.java
@@ -32,6 +32,7 @@
 import org.elasticsearch.xpack.sql.execution.search.extractor.FieldHitExtractor;
 import org.elasticsearch.xpack.sql.execution.search.extractor.HitExtractor;
 import org.elasticsearch.xpack.sql.execution.search.extractor.MetricAggExtractor;
+import org.elasticsearch.xpack.sql.execution.search.extractor.TopHitsAggExtractor;
 import org.elasticsearch.xpack.sql.expression.gen.pipeline.AggExtractorInput;
 import org.elasticsearch.xpack.sql.expression.gen.pipeline.AggPathInput;
 import org.elasticsearch.xpack.sql.expression.gen.pipeline.HitExtractorInput;
@@ -45,6 +46,7 @@
 import org.elasticsearch.xpack.sql.querydsl.container.QueryContainer;
 import org.elasticsearch.xpack.sql.querydsl.container.ScriptFieldRef;
 import org.elasticsearch.xpack.sql.querydsl.container.SearchHitFieldRef;
+import org.elasticsearch.xpack.sql.querydsl.container.TopHitsAggRef;
 import org.elasticsearch.xpack.sql.session.Configuration;
 import org.elasticsearch.xpack.sql.session.Rows;
 import org.elasticsearch.xpack.sql.session.SchemaRowSet;
@@ -276,6 +278,11 @@ private BucketExtractor createExtractor(FieldExtraction ref, BucketExtractor tot
                 return new MetricAggExtractor(r.name(), r.property(), r.innerKey());
             }
 
+            if (ref instanceof TopHitsAggRef) {
+                TopHitsAggRef r = (TopHitsAggRef) ref;
+                return new TopHitsAggExtractor(r.name(), r.fieldDataType());
+            }
+
             if (ref == GlobalCountRef.INSTANCE) {
                 return totalCount;
             }