-- HIVE: word count
-- Word count over the GH_RC rows with YEAR = 2013 and MONTH = 3.
--
-- TEXT is split into tokens, each distinct token is counted, and the tokens
-- that occur more than once are written as comma-delimited "word,count" rows
-- to the local directory 'RESULT/2013-3' (INSERT OVERWRITE replaces whatever
-- that directory already contains).
--
-- Tokenisation: a token is a maximal run of ASCII letters (either case),
-- digits, '_', '(', ')' or '-'; every other character is a delimiter.
-- The letter range must be a-zA-Z: the regex is case-sensitive, so a class
-- listing only A-Z would treat every lowercase letter as a delimiter and
-- shred ordinary words. '(' and ')' need no escaping inside a character
-- class, and '-' is literal when it is the last character of the class, so
-- the pattern does not depend on how the string literal handles backslashes.
--
-- SPLIT yields an empty string when TEXT begins with a delimiter; those are
-- not words, so they are filtered out before grouping.
INSERT OVERWRITE LOCAL DIRECTORY 'RESULT/2013-3'
ROW FORMAT DELIMITED FIELDS TERMINATED BY ','
SELECT
    WORD,
    COUNT(*) AS WORD_COUNT
FROM GH_RC
LATERAL VIEW EXPLODE(SPLIT(TEXT, '[^a-zA-Z_0-9()-]+')) TOKENS AS WORD
WHERE YEAR = 2013
  AND MONTH = 3
  AND WORD <> ''
GROUP BY WORD
HAVING COUNT(*) > 1;