hive UDF

来源:互联网 发布:人工智能机器人在哪做 编辑:程序博客网 时间:2024/05/17 15:19
use mwd;

-- Prepare data (ETL: spv data).
-- Loads the 20131111 partition of wdlog_ready_spv from the matching partition
-- of wdlog, skipping rows whose cs_uri_query is null.
--
-- Each statement and each comment sits on its own line on purpose: a "--"
-- comment runs to the end of the line, so collapsing this script onto a
-- single line comments out every statement after the first comment marker.

-- Register the custom UDFs needed by the insert below.
create temporary function row_sequence as 'com.mwd.hive.udf.RowSequence';
create temporary function parse_agent as 'com.mwd.hive.udf.HdfsRegexParseUdf';
create temporary function uri_to_map as 'com.mwd.hive.udf.GenericUDFUriToMap';

-- Select list, in order (the target column names are not visible here, so
-- the expressions are matched to wdlog_ready_spv columns by position):
--   1. row_sequence()  - presumably a per-row sequence number (TODO confirm
--                        against the RowSequence UDF)
--   2. cur_date
--   3. cur_date and cur_time joined with a single space
--   4. cs_uri_query, unchanged
--   5. c_ip converted to a left-zero-padded value: the address is split on
--      literal dots and each of the first four parts is left-padded with 0
--      to three characters, then the parts are concatenated with no
--      separator (for example 10.2.3.45 becomes 010002003045)
--   6. agent, unchanged
--   7. cs_uri_query parsed by uri_to_map with = as the key/value separator.
--      The pair delimiter is the first string literal when instr() finds it
--      in the query string, otherwise a plain ampersand. The semicolon in
--      that literal is backslash-escaped, presumably so the Hive CLI does
--      not treat it as a statement terminator (TODO confirm). The two
--      /user/... arguments look like HDFS paths read by the UDF (TODO
--      confirm their meaning against GenericUDFUriToMap).
--   8. agent parsed by parse_agent, presumably using regex rules stored
--      under /user/reg_data (TODO confirm against HdfsRegexParseUdf)
insert into table wdlog_ready_spv partition (import_time='20131111')
select
    row_sequence(),
    cur_date,
    concat_ws(' ', cur_date, cur_time),
    cs_uri_query,
    printf(
        '%s%s%s%s',
        lpad(split(c_ip,'\\\.')[0],3,'0'),
        lpad(split(c_ip,'\\\.')[1],3,'0'),
        lpad(split(c_ip,'\\\.')[2],3,'0'),
        lpad(split(c_ip,'\\\.')[3],3,'0')
    ),
    agent,
    if(
        instr(cs_uri_query, '&\\;') > 0,
        uri_to_map(cs_uri_query,'&\\;', '=','/user/searchdata','/user/mediadata'),
        uri_to_map(cs_uri_query, '&', '=','/user/searchdata','/user/mediadata')
    ),
    parse_agent(agent,'/user/reg_data')
from wdlog
where import_time='20131111'
    and cs_uri_query is not null;

-- Unregister the temporary functions now that the load is done.
drop temporary function parse_agent;
drop temporary function uri_to_map;
drop temporary function row_sequence;

0 0
原创粉丝点击