example 1

1
-- Word-count example for Hive: stage raw text lines, count the space-separated
-- tokens, then report the most frequent ones.

-- Staging table with a single STRING column named line.
CREATE TABLE rawdata (
    line STRING
);

-- Load the files under /user/hadoop/edgar/ into rawdata. Without LOCAL the path
-- is resolved on the cluster filesystem and the files are moved into the table
-- location rather than copied. Without OVERWRITE existing rows are kept.
LOAD DATA
    INPATH '/user/hadoop/edgar/'
    INTO TABLE rawdata;

-- Build wordcount(word, count): one row per distinct token with its number of
-- occurrences. SPLIT on a single space emits empty-string tokens for leading,
-- trailing, or repeated spaces, so those are filtered out before counting.
-- No ORDER BY here: table row order is not part of the contract, and a total
-- sort would push the whole result through a single reducer. Consumers sort at
-- query time, as the report below does.
CREATE TABLE wordcount AS
SELECT
    word,
    COUNT(*) AS count
FROM (
    SELECT EXPLODE(SPLIT(line, ' ')) AS word
    FROM rawdata
) words
WHERE word <> ''
GROUP BY word;

-- Report the words that occur more than 1500 times, least frequent first.
SELECT
    word,
    count
FROM wordcount
WHERE count > 1500
ORDER BY count;

Upload: pysunil

Posted on 14-Apr-2016

212 views

Category:

Documents


0 downloads

TRANSCRIPT

-- Staging table with a single STRING column named line.
CREATE TABLE rawdata (
    line STRING
);

-- Load the files under /user/hadoop/edgar/ into rawdata. Without LOCAL the path
-- is resolved on the cluster filesystem and the files are moved into the table
-- location rather than copied. Without OVERWRITE existing rows are kept.
LOAD DATA
    INPATH '/user/hadoop/edgar/'
    INTO TABLE rawdata;

-- Build wordcount(word, count): one row per distinct space-separated token of
-- rawdata.line, together with the number of times that token occurs.
-- SPLIT on a single space emits empty-string tokens for leading, trailing, or
-- repeated spaces. Those are not words, so they are filtered out before counting.
-- No ORDER BY here: table row order is not part of the contract, and a total
-- sort would push the whole result through a single reducer. Queries that need
-- an ordering should sort when they read the table.
CREATE TABLE wordcount AS
SELECT
    word,
    COUNT(*) AS count
FROM (
    SELECT EXPLODE(SPLIT(line, ' ')) AS word
    FROM rawdata
) words
WHERE word <> ''
GROUP BY word;

-- Report the words that occur more than 1500 times, least frequent first.
SELECT
    word,
    count
FROM wordcount
WHERE count > 1500
ORDER BY count;