6

 pig -x local

-- ---------------------------------------------------------------------------
-- Input relations. Both files are read as comma-delimited text via PigStorage
-- and given an explicit schema so later statements can refer to fields by name.
-- ---------------------------------------------------------------------------
students = LOAD '/home/cloudera/Desktop/students.txt'
    USING PigStorage(',')
    AS (
        id:int,
        name:chararray,
        dept:chararray,
        marks:int
    );

departments = LOAD '/home/cloudera/Desktop/departments.txt'
    USING PigStorage(',')
    AS (
        dept_code:chararray,
        dept_name:chararray
    );

-- FILTER: keep only the student rows whose marks are strictly greater than 70.
high_scorers = FILTER students BY (marks > 70);
DUMP high_scorers;

-- FOREACH ... GENERATE: project the filtered rows down to name and marks.
projected = FOREACH high_scorers GENERATE
    name,
    marks;
DUMP projected;

-- GROUP: collect all student rows into one bag per distinct dept value.
grouped_by_dept = GROUP students BY dept;
DUMP grouped_by_dept;

-- Aggregate each group: `group` holds the dept key, and `students` is the bag
-- of rows for that key, so AVG(students.marks) is the per-department average.
avg_marks = FOREACH grouped_by_dept GENERATE
    group               AS department,
    AVG(students.marks) AS average_marks;
DUMP avg_marks;

-- JOIN: match each student to its department record (students.dept against
-- departments.dept_code). No OUTER keyword is given, so unmatched rows on
-- either side are dropped.
joined = JOIN students    BY dept,
              departments BY dept_code;
DUMP joined;

-- ORDER: list every student from highest marks to lowest.
sorted = ORDER students BY marks DESC;
DUMP sorted;









Comments

Popular posts from this blog

7

8