SQLTransformer
SQLTransformer
SELECT a, a + b AS ab FROM __THIS__
SELECT a, SQRT(b) AS bsqrt FROM __THIS__ where a > 5
SELECT a, b, SUM(c) AS csum FROM __THIS__ GROUP BY a, b
SELECT a, a + b AS ab FROM __THIS__
SELECT a, SQRT(b) AS bsqrt FROM __THIS__ where a > 5
SELECT a, b, SUM(c) AS csum FROM __THIS__ GROUP BY a, b

id | v1 | v2
----|-----|-----
0 | 1.0 | 3.0
2 | 2.0 | 5.0

import org.apache.spark.ml.feature.SQLTransformer
// Two sample rows, exposed as a DataFrame with columns id, v1 and v2.
val rows = Seq((0, 1.0, 3.0), (2, 2.0, 5.0))
val df = spark.createDataFrame(rows).toDF("id", "v1", "v2")

// The statement keeps every existing column and appends
// v3 = v1 + v2 and v4 = v1 * v2; it selects from the __THIS__ placeholder.
val statement = "SELECT *, (v1 + v2) AS v3, (v1 * v2) AS v4 FROM __THIS__"
val sqlTrans = new SQLTransformer().setStatement(statement)

// Apply the transformer to df and print the resulting rows.
sqlTrans.transform(df).show()
/*
+---+---+---+---+----+
| id| v1| v2| v3| v4|
+---+---+---+---+----+
| 0|1.0|3.0|4.0| 3.0|
| 2|2.0|5.0|7.0|10.0|
+---+---+---+---+----+
*/

Last updated