Skip to content

Instantly share code, notes, and snippets.

@myui
Created December 15, 2016 11:30
Show Gist options
  • Save myui/5a6741e37d674b3887209ba8c752f98c to your computer and use it in GitHub Desktop.
Save myui/5a6741e37d674b3887209ba8c752f98c to your computer and use it in GitHub Desktop.
-- Source table holding one row per document.
CREATE TABLE page (
  docid    INT,     -- document identifier
  contents STRING   -- document text; tokenized by the query that fills page_exploded
);
-- Rebuild page_exploded with one (docid, word) row per token of each page.
-- tokenize_ja() is applied to page.contents and explode() turns the resulting
-- array into one row per element via the lateral view.
-- NOTE(review): tokenize_ja / normalize_unicode are presumably the Hivemall
-- UDFs and must be registered before this runs -- confirm.
INSERT OVERWRITE TABLE page_exploded
SELECT
  p.docid,
  normalize_unicode(tok.word) AS word
FROM
  page p
  LATERAL VIEW explode(tokenize_ja(p.contents)) tok AS word
WHERE
  -- The filter compares the raw token, i.e. before normalize_unicode() is applied.
  -- NOTE(review): these literals look like placeholders for a real stop-word list
  -- (and are spelled "stopward") -- confirm the intended values.
  tok.word NOT IN ('stopward1', 'stopward2');
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment