Pig Latin代码示例:
-- Summarize ratings by gender: for each gender value, emit the number of
-- ratings and the average rating score.
--
-- Each statement is on its own line, separate from the `--` comments: a `--`
-- comment extends to the end of the line, so a statement written after one on
-- the same line is never executed.

-- Load data: comma-delimited records with fields (userID, gender, rating).
ratings = LOAD 'ratings_data' USING PigStorage(',')
    AS (userID:int, gender:chararray, rating:int);

-- Group by gender and calculate count and avg rating score.
-- After GROUP, `group` holds the gender key and `ratings` is the bag of
-- records that share that key.
gender_ratings = GROUP ratings BY gender;
gender_rating_summary = FOREACH gender_ratings GENERATE
    group AS gender,
    COUNT(ratings) AS rating_count,
    AVG(ratings.rating) AS avg_rating_score;

-- Output results: one record per gender (gender, rating_count, avg_rating_score).
-- No USING clause is given, so Pig's default store function is used.
STORE gender_rating_summary INTO 'gender_rating_summary';