-- Runs a MAP ... USING script transform over a text-backed table and
-- aggregates the rows the script emits, grouped by URL.

-- Staging table with a single STRING column, stored as plain text.
CREATE TABLE documents (contents STRING)
STORED AS TEXTFILE;

-- Fill the table from a file on the local filesystem (relative path).
LOAD DATA LOCAL INPATH '../data/files/docurl.txt'
INTO TABLE documents;

-- The inner query streams documents.contents through an external Java class
-- and names the two columns it emits (url, count). Presumably the class
-- extracts URLs from each document -- confirm against its source.
-- The outer query counts emitted rows per url; note that it does not read
-- the script's own "count" column.
SELECT
    url,
    COUNT(1)
FROM (
    FROM documents
    MAP documents.contents
    USING 'java -cp ../build/ql/test/classes org.apache.hadoop.hive.scripts.extracturl'
    AS (url, count)
) subq
GROUP BY url;

-- Clean up the staging table.
DROP TABLE documents;