spark-shell客户端连接hive

1.拷贝hive-site.xml到spark/conf下,拷贝mysql-connector-java-xxx-bin.jar到hive/lib下

2.开启hive元数据服务:hive --service metastore

3.开启hadoop服务:sh $HADOOP_HOME/sbin/start-all.sh

4.开启spark服务:sh $SPARK_HOME/sbin/start-all.sh

5.进入spark-shell:$SPARK_HOME/bin/spark-shell

6.scala操作hive(spark-sql)

scala>val conf=new SparkConf().setAppName("SparkHive").setMaster("local")   //可忽略,已经自动创建了
            
scala>val sc=new SparkContext(conf)  //在spark-shell中应跳过:sc已经自动创建,同一JVM中重复创建SparkContext会报错
            
scala>val sqlContext = new org.apache.spark.sql.hive.HiveContext(sc)
        
scala>sqlContext.sql("create table src(orderNo int, date string,orderType int,price int,id int) row format delimited fields terminated by ' ' ") 

//这里需要注意数据的间隔符:建表语句中 fields terminated by 指定的分隔符(此处为空格)必须与数据文件中实际使用的分隔符一致,否则查询出的字段会是NULL

scala>sqlContext.sql("LOAD DATA INPATH '/user/spark/src.txt' INTO TABLE src ")  //不带LOCAL时路径为HDFS路径,加载后源文件会被移动到表目录下

scala>sqlContext.sql(" SELECT * FROM src").collect().foreach(println)

scala>sc.stop()

猜你喜欢

转载自blog.csdn.net/weixin_43840194/article/details/89476512