3、数据加载工作流所用hive脚本:
-- Staging setup for the web-log warehouse: makes sure the dw_weblog database
-- exists, rebuilds the raw log table, and loads the preprocessed output into it.
create database if not exists dw_weblog;
use dw_weblog;

-- The table is dropped and recreated on every run, so rerunning the script
-- starts from an empty table definition.
drop table if exists t_orgin_weblog;

-- Raw staging table. Every column is declared as string, so no type conversion
-- happens at load time.
-- NOTE(review): the field delimiter literal was garbled in the original script.
-- It is restored here as \001 (Ctrl-A, the default Hive field delimiter) -
-- confirm that the job writing /weblog/preout uses the same separator.
create table t_orgin_weblog (
    valid           string,
    remote_addr     string,
    remote_user     string,
    time_local      string,
    request         string,
    status          string,
    body_bytes_sent string,
    http_referer    string,
    http_user_agent string
)
row format delimited
fields terminated by '\001';

-- Without the LOCAL keyword the path is resolved on the cluster file system and
-- the files are moved (not copied) into the table location. OVERWRITE replaces
-- whatever the table held before.
load data inpath '/weblog/preout' overwrite into table t_orgin_weblog;