欢迎投稿

今日深度:

hive UDF,

hive UDF,


use mwd;


--prepare data, c_ip 为左补足0转换后值




-- ETL: spv data
create temporary function row_sequence as 'com.mwd.hive.udf.RowSequence';
create temporary function parse_agent as 'com.mwd.hive.udf.HdfsRegexParseUdf';
create temporary function uri_to_map as 'com.mwd.hive.udf.GenericUDFUriToMap';


insert into table wdlog_ready_spv PARTITION (import_time='20131111') select row_sequence(), cur_date, concat_ws(' ', cur_date, cur_time), cs_uri_query, printf('%s%s%s%s', lpad(split(c_ip,'\\\.')[0],3,'0'), lpad(split(c_ip,'\\\.')[1],3,'0'), lpad(split(c_ip,'\\\.')[2],3,'0'), lpad(split(c_ip,'\\\.')[3],3,'0')), agent, if(instr(cs_uri_query, '&\\;') > 0, uri_to_map(cs_uri_query,'&\\;', '=','/user/searchdata','/user/mediadata'), uri_to_map(cs_uri_query, '&', '=','/user/searchdata','/user/mediadata')),  parse_agent(agent,'/user/reg_data') from wdlog where import_time='20131111' and cs_uri_query is not null;


drop temporary function parse_agent;
drop temporary function uri_to_map;
drop temporary function row_sequence;

www.htsjk.Com true http://www.htsjk.com/hive/41728.html NewsArticle hive UDF, use mwd;--prepare data, c_ip 为左补足0转换后值-- ETL: spv datacreate temporary function row_sequence as 'com.mwd.hive.udf.RowSequence';create temporary function parse_agent as 'com.mwd.hive.udf.HdfsRegexParseUdf';create...
相关文章
    暂无相关文章
评论暂时关闭