智警杯&大数据技能竞赛sql分析脚本汇总

####特殊:
# Enable Hive's automatic local mode (hive.exec.mode.local.auto).
set hive.exec.mode.local.auto=true;

# Speed up Hive by switching the execution engine to Tez.
# NOTE(review): presumably requires Tez to be available on the cluster - confirm.
set hive.execution.engine=tez;

# Enlarge map/reduce memory (preferably leave these unset).
# The JVM heap sizes (-Xmx) are set below the matching *.memory.mb values.
set mapreduce.map.memory.mb=10150; 
set mapreduce.map.java.opts=-Xmx6144m;
set mapreduce.reduce.memory.mb=10150; 
set mapreduce.reduce.java.opts=-Xmx8120m;

# Inspect files on HDFS: list the directory, then print file contents.
# NOTE(review): -cat is given the directory path itself here; presumably the
# path of a concrete file under it is meant to be appended - confirm.
hadoop fs -ls '/college2020/'
hadoop fs -cat '/college2020/'

####student

#hadoop fs -mkdir '/college2020/'

#cmd
# Switch to /root and open student.csv in vi.
cd /root
vi student.csv

#复制进student.csv
(此处粘贴 student.csv 的数据内容:每行两个字段,以英文逗号分隔,对应下文 student 表的 num,name)

#hadoop
# Make sure the target HDFS directory exists before uploading
# (-p: create parents as needed, no error if it already exists),
# then copy the local CSV into it.
hadoop fs -mkdir -p '/college2020/'
hadoop fs -put '/root/student.csv' '/college2020/'

#hive
# Create the student database and table, then load the local CSV into it.
# IF NOT EXISTS keeps these statements re-runnable; the load uses OVERWRITE,
# so re-running replaces the table's rows instead of appending duplicates.
create database if not exists student;
use student;
create table if not exists student (
    num  int,
    name string
)
row format delimited
fields terminated by ',';
load data local inpath '/root/student.csv' overwrite into table student;

#select * from student;

####爬取弹幕

# Copy (drag) comment.csv into /root/ first.

#hadoop
# Make sure the target HDFS directory exists before uploading
# (-p: create parents as needed, no error if it already exists),
# then copy the local CSV into it.
hadoop fs -mkdir -p '/college2020/'
hadoop fs -put '/root/comment.csv' '/college2020/'

#hive
# Create the qingjiao database and the comment table, then load the local CSV.
# IF NOT EXISTS keeps these statements re-runnable; the load uses OVERWRITE,
# so re-running replaces the table's rows instead of appending duplicates.
# `time` is backtick-quoted because TIME is a reserved keyword in newer Hive
# releases; the column name itself is unchanged.
create database if not exists qingjiao;
use qingjiao;
create table if not exists comment (
    text     string,
    color    string,
    size     string,
    position string,
    `time`   string
)
row format delimited
fields terminated by ',';
load data local inpath '/root/comment.csv' overwrite into table comment;

#51 Count the danmaku (bullet comments)
# Writes the row count of the comment table to /college2020/51/.
# The field delimiter is a tab ('\t'); it was previously the literal letter 't'.
insert overwrite directory "/college2020/51/"
row format delimited fields terminated by '\t'
select count(*) from comment;

#52 Look up the color of a given danmaku
# Writes the color of every comment whose text is 'haoran' to /college2020/52.
# The field delimiter is a single tab ('\t'); the stray trailing space inside
# the delimiter literal was removed.
insert overwrite directory "/college2020/52"
row format delimited fields terminated by '\t'
select color from comment where text='haoran';

#53 查询弹幕颜色top6
#最大
insert overwrite directory "/college2020/53" row format delimited fields terminated by '\t'
评论 10
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包

打赏作者

TurkeyMan

你的鼓励将是我创作的最大动力

¥1 ¥2 ¥4 ¥6 ¥10 ¥20
扫码支付:¥1
获取中
扫码支付

您的余额不足,请更换扫码支付或充值

打赏作者

实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值