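-- 6
-- Run from the OS shell to start Pig's Grunt shell in local mode, then enter the statements below:
--   pig -x local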
-- Read the student records from students.txt. PigStorage(',') splits each
-- line on commas, and the AS clause names and types the four resulting
-- columns.
students = LOAD '/home/cloudera/Desktop/students.txt'
    USING PigStorage(',')
    AS (
        id:int,
        name:chararray,
        dept:chararray,
        marks:int
    );
-- Read the department lookup records from departments.txt. Each
-- comma-separated line becomes a (dept_code, dept_name) pair of chararrays.
departments = LOAD '/home/cloudera/Desktop/departments.txt'
    USING PigStorage(',')
    AS (
        dept_code:chararray,
        dept_name:chararray
    );
-- Selection: keep only the students whose marks are strictly greater than 70.
high_scorers = FILTER students
    BY (marks > 70);

-- Print the filtered records to the console.
DUMP high_scorers;
-- Projection: reduce every high-scoring record to its name and marks columns.
projected = FOREACH high_scorers GENERATE
    name,
    marks;

-- Print the two-column result to the console.
DUMP projected;
-- Bucket the student records by department. Each output tuple carries the
-- dept value in the `group` field plus a bag named `students` that holds
-- every record sharing that dept.
grouped_by_dept = GROUP students BY dept;
-- Print one (group, bag) tuple per department to the console.
DUMP grouped_by_dept;
-- Aggregation: for each department group, average the marks of the students
-- in that group's bag. The result has two fields, department (the grouping
-- key) and average_marks.
avg_marks = FOREACH grouped_by_dept {
    -- Bag holding only the marks column of this department's students.
    dept_marks = students.marks;
    GENERATE
        group           AS department,
        AVG(dept_marks) AS average_marks;
};

-- Print the per-department averages to the console.
DUMP avg_marks;
-- Inner join (Pig's default JOIN type): pair each student with the
-- department record whose dept_code equals the student's dept. Records with
-- no match on the other side do not appear in the result.
joined = JOIN
    students    BY dept,
    departments BY dept_code;

-- Print the joined records to the console.
DUMP joined;
-- Sort every student record by marks, highest marks first (DESC).
sorted = ORDER students BY marks DESC;
-- Print the sorted records to the console.
DUMP sorted;
Comments
Post a Comment