Professional Documents
Culture Documents
SQL Pig
SQL Pig
c = ORDER b BY column;
SQL Statement
SELECT * FROM table ORDER BY RAND()
Pig equivalent
c = GROUP b BY RANDOM();
d = FOREACH c GENERATE FLATTEN(b);
SQL Statement
SELECT users.ID, users.Location, comments.upVotes
FROM users
[INNER|LEFT|RIGHT] JOIN comments
ON users.ID=comments.UserID
Pig equivalent
-- Inner Join
A = JOIN comments BY userID, users BY userID;
-- Outer Join
A = JOIN comments BY userID [LEFT|RIGHT|FULL] OUTER, users BY
userID;
SQL Statement
SELECT * FROM tablea, tableb;
Pig equivalent
A = LOAD 'data1' AS (a1, a2, a3);
DUMP A;
(1,2,3)
(4,5,6)
B = LOAD 'data2' AS (b1, b2);
DUMP B;
(1,2)
(3,4)
(5,6)
C = CROSS A, B;
DUMP C;
(1,2,3,1,2)
(1,2,3,3,4)
(1,2,3,5,6)
(4,5,6,1,2)
(4,5,6,3,4)
(4,5,6,5,6)