使用 join 算子连接两个数据集时程序报错,
报错信息如下:
Exception in thread "main" org.apache.spark.sql.AnalysisException: cannot resolve '`name`' given input columns: [_corrupt_record]; line 1 pos 40;
'Project ['name, 'age]
+- 'Filter 'name IN (mzk,root,admin)
   +- SubqueryAlias student_info
      +- LogicalRDD [_corrupt_record#25]
完整的代码如下:
package com.mzk.sql
import org.apache.spark.sql.SparkSession
import org.apache.spark.sql.types.StructType
import org.apache.spark.sql.types.StringType
import org.apache.spark.sql.types.StructField
import org.apache.spark.sql.types.IntegerType
import org.apache.spark.sql.Row
object JSONDataSource {
def main(args: Array[String]): Unit = {
//创建SparkSession、SparkContext、sqlContext
val spark = SparkSession.builder().appName("JSONDataSource").master("local").getOrCreate()
val sc = spark.sparkContext
val sql = spark.sqlContext