大数据Spark “蘑菇云”行动第88课:Hive脚本、常用命令、having查询及变种实战
HiveScript.sql的脚本内容
-- HiveScript.sql: list the databases, switch to `default`, list its tables,
-- then select every row of the employee table.
show databases;
use default;
show tables;
-- Table name aligned with the `employee` table that the other commands in
-- these notes query (NOTE(review): confirm the actual table name).
select * from employee;
-- Commands typed at the Hive interactive prompt must be terminated with ';'.
-- `!<command>` runs an OS shell command from inside the Hive CLI;
-- `dfs <args>` runs a Hadoop dfs command from inside the Hive CLI.
hive> !pwd;
hive> ! /bin/echo "Hive on spark!";
hive> dfs -ls /;
# Run HiveQL straight from the OS shell: -e passes the query string and
# -S (capital S) selects silent mode. Option letters are case-sensitive and
# lowercase -s is not a documented hive option.
# The first command appends the query output to /usr/local/test.log.
# hive -S -e "select * from employee" >> /usr/local/test.log
# hive -e "select * from employee"
# Print the Hive settings and keep only the lines mentioning "warehouse".
hive -S -e "set" | grep warehouse
-- Show the column layout of the employee table.
desc employee;
-- Names taken from the per-name salary totals, written as a nested query.
-- The inner aggregate needs GROUP BY name because name is selected next to
-- sum(salary), and Hive requires an alias on a subquery in the FROM clause.
select name
from (
    select name, sum(salary) as salarytotal
    from employee
    group by name
) subquery;
employeeforhaving表增加一个字段gender（性别），取值为男、女：
-- Create employeeforhaving as a delimited text table: fields are separated
-- by tabs and each record ends with a newline.
create table employeeforhaving (
    userid  int,
    name    string,
    address string,
    salary  double,
    gender  string
)
ROW FORMAT DELIMITED
    FIELDS TERMINATED BY '\t'
    LINES TERMINATED BY '\n';
-- Load a file from the local filesystem into employeeforhaving.
-- '/..../' is presumably a placeholder — replace it with the real directory.
load data local inpath '/..../employee.txt' into table employeeforhaving;
-- Genders whose total salary exceeds 30000, written as a nested query:
-- the inner query sums salary per gender, the outer query filters the totals.
select gender
from (
    select gender, sum(salary) as salarytotal
    from employeeforhaving
    group by gender
) subquery
where subquery.salarytotal > 30000;
-- Per-gender salary totals, keeping only the groups whose total exceeds
-- 30000. HAVING filters after grouping, so it can test the aggregate directly.
SELECT gender, SUM(salary)
FROM employeeforhaving
GROUP BY gender
HAVING SUM(salary) > 30000;
