
Spark SQL: Querying a JSON Data Source

2015-11-05 09:40
The following Scala program loads a JSON file into a DataFrame through SQLContext, registers it as a temporary table, and queries it with SQL.

package com.spark.sql

import org.apache.spark.SparkConf
import org.apache.spark.SparkContext
import org.apache.spark.sql.SQLContext

object JSONDataSource {
  def main(args: Array[String]): Unit = {
    val conf = new SparkConf()
      .setAppName("JSONDataSource")
      .setMaster("local")
    val sc = new SparkContext(conf)
    val sqlContext = new SQLContext(sc)
    // Load the JSON file (one JSON object per line) as a DataFrame
    val studentScoresDF = sqlContext.read.json("E:\\spark-1.4.1-bin-hadoop2.4\\examples\\src\\main\\resources\\people.json")
    // Register the DataFrame as a temporary table so it can be queried with SQL,
    // then select the name and age of students aged 19 or older
    studentScoresDF.registerTempTable("student_scores")
    val goodStudentScoresDF = sqlContext.sql("select name, age from student_scores where age >= 19")
    // Collect just the names to the driver and print them
    val goodStudentNames = goodStudentScoresDF.rdd.map { row => row(0) }.collect()
    goodStudentNames.foreach { name => println("-----name----->" + name) }
    // Collect (name, age) pairs; row(1) is the age column
    val goodStudentNamesAges = goodStudentScoresDF.rdd.map { row => (row(0), row(1)) }.collect()
    goodStudentNamesAges.foreach { pair => println("-----name and age----->" + pair) }
  }
}
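For reference, the people.json file shipped under examples/src/main/resources in the Spark distribution contains one JSON object per line:

{"name":"Michael"}
{"name":"Andy", "age":30}
{"name":"Justin", "age":19}

With that input, the query returns Andy (30) and Justin (19); Michael is filtered out because his age is null, so the program prints those two names followed by the two (name, age) pairs.

The same query can also be expressed with the DataFrame API instead of SQL. A minimal sketch, assuming the studentScoresDF from the program above (column expressions like studentScoresDF("age") work in Spark 1.4.1 without extra imports):

// Equivalent to: select name, age from student_scores where age >= 19
val goodStudentsDF = studentScoresDF
  .filter(studentScoresDF("age") >= 19)
  .select("name", "age")
// Print the result as a formatted table on the driver
goodStudentsDF.show()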