Saving all output to "!!{outputDirectory}!!/serde_regex.q.raw". Enter "record" with no arguments to stop it. >>> !run !!{qFileDirectory}!!/serde_regex.q >>> EXPLAIN CREATE TABLE serde_regex( host STRING, identity STRING, user STRING, time STRING, request STRING, status STRING, size STRING, referer STRING, agent STRING) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.RegexSerDe' WITH SERDEPROPERTIES ( "input.regex" = "([^ ]*) ([^ ]*) ([^ ]*) (-|\\[[^\\]]*\\]) ([^ \"]*|\"[^\"]*\") (-|[0-9]*) (-|[0-9]*)(?: ([^ \"]*|\"[^\"]*\") ([^ \"]*|\"[^\"]*\"))?" ) STORED AS TEXTFILE; 'Explain' 'ABSTRACT SYNTAX TREE:' ' (TOK_CREATETABLE (TOK_TABNAME serde_regex) TOK_LIKETABLE (TOK_TABCOLLIST (TOK_TABCOL host TOK_STRING) (TOK_TABCOL identity TOK_STRING) (TOK_TABCOL user TOK_STRING) (TOK_TABCOL time TOK_STRING) (TOK_TABCOL request TOK_STRING) (TOK_TABCOL status TOK_STRING) (TOK_TABCOL size TOK_STRING) (TOK_TABCOL referer TOK_STRING) (TOK_TABCOL agent TOK_STRING)) (TOK_TABLESERIALIZER (TOK_SERDENAME 'org.apache.hadoop.hive.serde2.RegexSerDe' (TOK_TABLEPROPERTIES (TOK_TABLEPROPLIST (TOK_TABLEPROPERTY "input.regex" "([^ ]*) ([^ ]*) ([^ ]*) (-|\\[[^\\]]*\\]) ([^ \"]*|\"[^\"]*\") (-|[0-9]*) (-|[0-9]*)(?: ([^ \"]*|\"[^\"]*\") ([^ \"]*|\"[^\"]*\"))?"))))) TOK_TBLTEXTFILE)' '' 'STAGE DEPENDENCIES:' ' Stage-0 is a root stage' '' 'STAGE PLANS:' ' Stage: Stage-0' ' Create Table Operator:' ' Create Table' ' columns: host string, identity string, user string, time string, request string, status string, size string, referer string, agent string' ' if not exists: false' ' input format: org.apache.hadoop.mapred.TextInputFormat' ' # buckets: -1' ' output format: org.apache.hadoop.hive.ql.io.IgnoreKeyTextOutputFormat' ' serde name: org.apache.hadoop.hive.serde2.RegexSerDe' ' serde properties:' ' input.regex ([^ ]*) ([^ ]*) ([^ ]*) (-|\[[^\]]*\]) ([^ "]*|"[^"]*") (-|[0-9]*) (-|[0-9]*)(?: ([^ "]*|"[^"]*") ([^ "]*|"[^"]*"))?' ' name: serde_regex' ' isExternal: false' '' '' 22 rows selected >>> >>> CREATE TABLE serde_regex( host STRING, identity STRING, user STRING, time STRING, request STRING, status STRING, size STRING, referer STRING, agent STRING) ROW FORMAT SERDE 'org.apache.hadoop.hive.serde2.RegexSerDe' WITH SERDEPROPERTIES ( "input.regex" = "([^ ]*) ([^ ]*) ([^ ]*) (-|\\[[^\\]]*\\]) ([^ \"]*|\"[^\"]*\") (-|[0-9]*) (-|[0-9]*)(?: ([^ \"]*|\"[^\"]*\") ([^ \"]*|\"[^\"]*\"))?" ) STORED AS TEXTFILE; No rows affected >>> >>> LOAD DATA LOCAL INPATH "../data/files/apache.access.log" INTO TABLE serde_regex; No rows affected >>> LOAD DATA LOCAL INPATH "../data/files/apache.access.2.log" INTO TABLE serde_regex; No rows affected >>> >>> SELECT * FROM serde_regex ORDER BY time; 'host','identity','user','time','request','status','size','referer','agent' '127.0.0.1','-','frank','[10/Oct/2000:13:55:36 -0700]','"GET /apache_pb.gif HTTP/1.0"','200','2326','','' '127.0.0.1','-','-','[26/May/2009:00:00:00 +0000]','"GET /someurl/?track=Blabla(Main) HTTP/1.1"','200','5864','-','"Mozilla/5.0 (Windows; U; Windows NT 6.0; en-US) AppleWebKit/525.19 (KHTML, like Gecko) Chrome/1.0.154.65 Safari/525.19"' 2 rows selected >>> >>> SELECT host, size, status, time from serde_regex ORDER BY time; 'host','size','status','time' '127.0.0.1','2326','200','[10/Oct/2000:13:55:36 -0700]' '127.0.0.1','5864','200','[26/May/2009:00:00:00 +0000]' 2 rows selected >>> >>> DROP TABLE serde_regex; No rows affected >>> !record