Commit bd7d7d97 authored by leroyq

twt5

parent 786209bd
dataset = LOAD '/laboratory/twitter-small.txt' AS (id: long, fr: long);
dataset = LOAD '/laboratory/tw.txt' AS (id: long, fr: long);
-- TODO: check if user IDs are valid (e.g. not null) and clean the dataset
B = FILTER dataset BY (id>0);
......
......@@ -10,4 +10,4 @@ D = GROUP C BY fr;
friends = FOREACH D GENERATE group, COUNT(C);
STORE friends INTO '/twitter/results1';
STORE friends INTO '/twitter/results-e1';
dataset = LOAD '/laboratory/twitter-small.txt' AS (id: long, fr: long);
dataset = LOAD '/laboratory/tw.txt' AS (id: long, fr: long);
-- TODO: check if user IDs are valid (e.g. not null) and clean the dataset
B = FILTER dataset BY (id>0);
......
......@@ -12,4 +12,4 @@ friends = FOREACH D GENERATE group, COUNT(C) AS count;
-- Keep only the rows of `friends` whose `count` field is greater than 2.
-- The statement must end with a semicolon; without it the following STORE
-- is parsed as part of this statement and the script fails to parse.
friends2 = FILTER friends BY (count > 2);
STORE friends2 INTO '/twitter/results1';
STORE friends2 INTO '/twitter/results-e2';
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment