Version 1 (modified by jazz, 11 years ago) (diff) |
---|
2013-08-14
-- Per-country traffic report: number of requests and total bytes per country_code,
-- sorted by request count (highest first) and written to 'by_country.tsv'.

-- Pipe the notbots relation through the external ipwrapper.sh script and read its
-- output back as the nine fields named below. $GEO is a Pig parameter substituted
-- before the script runs (presumably the GeoIP database location -- confirm with
-- whoever launches this script). No field types are declared, so every field is
-- a bytearray.
with_country = STREAM notbots THROUGH `ipwrapper.sh $GEO`
    AS (country_code, country, state, city, ip, time, uri, bytes, userAgent);

-- One group per distinct country_code; records with a null country_code are
-- collected into a single null-keyed group.
geo_uri_groups = GROUP with_country BY country_code;

-- COUNT_STAR is used instead of COUNT on purpose: COUNT ignores tuples whose FIRST
-- field is null, and the first field of with_country is country_code itself. With
-- COUNT, the null-country group (e.g. if ipwrapper.sh emits an empty country_code
-- for an unresolvable address) would be reported as 0 requests while still
-- contributing to total_bytes. COUNT_STAR counts every tuple in the bag.
-- NOTE: bytes is an untyped bytearray, so SUM treats it as double; values that
-- cannot be converted become null and are skipped by SUM.
geo_uri_group_counts = FOREACH geo_uri_groups GENERATE
    group,
    COUNT_STAR(with_country) AS cnt,
    SUM(with_country.bytes) AS total_bytes;

-- Busiest countries first.
geo_uri_group_counts = ORDER geo_uri_group_counts BY cnt DESC;

STORE geo_uri_group_counts INTO 'by_country.tsv';