--抽取refer_url到中间表 "t_ods_tmp_referurl"
--将来访url拆分为 host、path、query、query_id 四个字段
--在对来访数据进行抽取时,需要用到一个URL解析函数,可以直接使用Hive内置的UDTF:parse_url_tuple()
-- Rebuild the intermediate table t_ods_tmp_referurl from the raw weblog table.
-- Every source row is kept and extended with four columns parsed from
-- http_referer by the built-in UDTF parse_url_tuple:
--   host, path, query, and query_id (the value of the "id" query parameter).
-- Double-quote characters are removed from http_referer before it is parsed.
-- NOTE(review): the source table is taken to be ods_weblog_origin, the name
-- used in the interactive session that actually launched a job — confirm.
DROP TABLE IF EXISTS t_ods_tmp_referurl;
CREATE TABLE t_ods_tmp_referurl AS
SELECT
    a.*,
    b.*
FROM ods_weblog_origin a
LATERAL VIEW parse_url_tuple(
    regexp_replace(http_referer, "\"", ""),
    'HOST', 'PATH', 'QUERY', 'QUERY:id'
) b AS host, path, query, query_id;
出错:
0: jdbc:hive2://node-1:10000> create table t_ods_tmp_referurl as
0: jdbc:hive2://node-1:10000> SELECT a.*,b.*
0: jdbc:hive2://node-1:10000> FROM ods_weblog_origin a
0: jdbc:hive2://node-1:10000> LATERAL VIEW parse_url_tuple(regexp_replace(http_referer, "\"", ""), 'HOST', 'PATH','QUERY', 'QUERY:id') b as host, path, query, query_id;
INFO : Number of reduce tasks is set to 0 since there's no reduce operator
执行后一直停留在上面这条日志处,没有后续输出。请教这是什么原因?