natbusa · August 29, 2015 13:57
diff --git a/wc.HiveQL.sql b/wc.HiveQL.sql
 -- Word count in Hive: stage a plain-text file in a one-column table, then
 -- tokenize every line and count how often each word occurs.
 DROP TABLE IF EXISTS doc;

 -- 1) Staging table that receives the whole file, one row per input line.
 CREATE TABLE doc (
     text STRING
 )
 ROW FORMAT DELIMITED FIELDS TERMINATED BY '\n'
 STORED AS TEXTFILE;

 -- 2) Load the plain-text file from the local file system. OVERWRITE replaces
 --    whatever the table held before.
 --    If the file is a .csv, replace '\n' with ',' in step 1 (creation of doc).
 LOAD DATA LOCAL INPATH './lorem.txt' OVERWRITE INTO TABLE doc;

 -- 3) Word count.
 --    Lines are lower-cased and split on runs of non-word characters.
 --    split() keeps the empty strings produced when a line is empty or
 --    starts/ends with a non-word character (e.g. trailing punctuation), so
 --    those empty tokens are filtered out instead of being counted as a word.
 SELECT
     word,
     COUNT(*) AS word_count
 FROM doc
 LATERAL VIEW explode(split(lower(text), '\\W+')) word_table AS word
 WHERE word != ''
 GROUP BY word;
	-- Word count in Hive: stage a plain-text file in a one-column table, then
	-- tokenize every line and count how often each word occurs.
	DROP TABLE IF EXISTS doc;

	-- 1) Staging table that receives the whole file, one row per input line.
	CREATE TABLE doc (
	    text STRING
	)
	ROW FORMAT DELIMITED FIELDS TERMINATED BY '\n'
	STORED AS TEXTFILE;

	-- 2) Load the plain-text file from the local file system. OVERWRITE replaces
	--    whatever the table held before.
	--    If the file is a .csv, replace '\n' with ',' in step 1 (creation of doc).
	LOAD DATA LOCAL INPATH './lorem.txt' OVERWRITE INTO TABLE doc;

	-- 3) Word count.
	--    Lines are lower-cased and split on runs of non-word characters.
	--    split() keeps the empty strings produced when a line is empty or
	--    starts/ends with a non-word character (e.g. trailing punctuation), so
	--    those empty tokens are filtered out instead of being counted as a word.
	SELECT
	    word,
	    COUNT(*) AS word_count
	FROM doc
	LATERAL VIEW explode(split(lower(text), '\\W+')) word_table AS word
	WHERE word != ''
	GROUP BY word;