Return-Path: X-Original-To: apmail-pig-commits-archive@www.apache.org Delivered-To: apmail-pig-commits-archive@www.apache.org Received: from mail.apache.org (hermes.apache.org [140.211.11.3]) by minotaur.apache.org (Postfix) with SMTP id A291C77E3 for ; Wed, 14 Sep 2011 19:04:03 +0000 (UTC) Received: (qmail 69070 invoked by uid 500); 14 Sep 2011 19:04:03 -0000 Delivered-To: apmail-pig-commits-archive@pig.apache.org Received: (qmail 69049 invoked by uid 500); 14 Sep 2011 19:04:03 -0000 Mailing-List: contact commits-help@pig.apache.org; run by ezmlm Precedence: bulk List-Help: List-Unsubscribe: List-Post: List-Id: Reply-To: dev@pig.apache.org Delivered-To: mailing list commits@pig.apache.org Received: (qmail 69041 invoked by uid 99); 14 Sep 2011 19:04:03 -0000 Received: from athena.apache.org (HELO athena.apache.org) (140.211.11.136) by apache.org (qpsmtpd/0.29) with ESMTP; Wed, 14 Sep 2011 19:04:03 +0000 X-ASF-Spam-Status: No, hits=-2000.0 required=5.0 tests=ALL_TRUSTED X-Spam-Check-By: apache.org Received: from [140.211.11.4] (HELO eris.apache.org) (140.211.11.4) by apache.org (qpsmtpd/0.29) with ESMTP; Wed, 14 Sep 2011 19:03:58 +0000 Received: from eris.apache.org (localhost [127.0.0.1]) by eris.apache.org (Postfix) with ESMTP id 03BEE2388AF0 for ; Wed, 14 Sep 2011 19:03:16 +0000 (UTC) Content-Type: text/plain; charset="utf-8" MIME-Version: 1.0 Content-Transfer-Encoding: 7bit Subject: svn commit: r1170769 [6/7] - in /pig/branches/branch-0.9: ./ test/e2e/harness/ test/e2e/harness/test/conf/ test/e2e/harness/test/tests/ test/e2e/pig/ test/e2e/pig/conf/ test/e2e/pig/deployers/ test/e2e/pig/drivers/ test/e2e/pig/macros/ test/e2e/pig/tes... Date: Wed, 14 Sep 2011 19:03:13 -0000 To: commits@pig.apache.org From: daijy@apache.org X-Mailer: svnmailer-1.0.8 Message-Id: <20110914190316.03BEE2388AF0@eris.apache.org> Modified: pig/branches/branch-0.9/test/e2e/pig/tests/turing_jython.conf URL: http://svn.apache.org/viewvc/pig/branches/branch-0.9/test/e2e/pig/tests/turing_jython.conf?rev=1170769&r1=1170768&r2=1170769&view=diff ============================================================================== --- pig/branches/branch-0.9/test/e2e/pig/tests/turing_jython.conf (original) +++ pig/branches/branch-0.9/test/e2e/pig/tests/turing_jython.conf Wed Sep 14 19:03:12 2011 @@ -27,24 +27,14 @@ our $FAILED="Pig job FAILED"; $cfg = { -#NOTE THAT currentversion returns rc=8 but should be rc=6 per Pig - 1801 -# So all of these tests are expected to fail for now - 'driver' => 'Pig' + 'driver' => 'Pig', ,'groups' => [ { 'name' => 'Jython_Checkin', 'tests' => [ { - 'num' => 1, - 'pig' => q\a = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); -store a into ':OUTPATH:';\, - 'sql' => "select name, age, gpa from studenttab10k;", - 'floatpostprocess' => 1, - 'delimiter' => ' ', - }, - { 'num' => 2, - ,'pig' => q\#!/usr/bin/python + 'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig input1=':INPATH:/singlefile/studenttab10k' @@ -69,14 +59,18 @@ if P.isSuccessful(): else: raise "Pig job FAILED" -\ - ,'sql' => "select registration, sum(contributions) -from studenttab10k as a full outer join votertab10k as b using (name, age) -where a.age < 50 and b.age < 50 -group by registration -order by 2;", - 'floatpostprocess' => 1, - 'delimiter' => ' ', +\, + 'verify_pig_script' => q\a = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + b = load ':INPATH:/singlefile/votertab10k' as (name, age, registration, contributions); + c = filter a by age < 50; + d = filter b by age < 50; + e = cogroup c by (name, age), d by (name, age) ; + f = foreach e generate flatten(c), flatten(d); + g = group f by registration; + h = foreach g generate group, SUM(f.d::contributions); + i = order h by $1; + store i into ':OUTPATH:'; +\, 'sortArgs' => ['-t', ' ', '+1', '-2'], } ] @@ -85,62 +79,8 @@ order by 2;", 'name' => 'Jython_Embedded', 'tests' => [ { -#NOT EMBEDDED - 'num' => 1 - ,'pig' => q\#!/usr/bin/python -# JYTHON COMMENT -from org.apache.pig.scripting import Pig - -P = Pig.compile("""A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); -store A into ':OUTPATH:';""") - -Q = P.bind() - -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" -\ - - ,'sql' => "select name, age, gpa+0.00 from studenttab10k;" - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - - }, { -# 15.0.3 1 invoke --embedded from java -# EMBEDDED - 'num' => 2 - ,'pig_params' => ['--embedded', 'jython'] - ,'pig' => q\ -# JYTHON COMMENT -from org.apache.pig.scripting import Pig - -P = Pig.compile("""A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); -store A into ':OUTPATH:';""") - -Q = P.bind() - -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" -\ - ,'sql' => "select name, age, gpa+0.00 from studenttab10k;" - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - - }, { - -# 15.0.1 1 invoke from pig.pl -embedded -# EMBEDDED - 'num' => 3 - ,'use-pig.pl'=> 1 + 'num' => 1, + 'ignore' => 1, # need a way not to pass --embedded to the verify script ,'pig_params' => ['--embedded', 'jython'] ,'pig' => q\ # JYTHON COMMENT @@ -158,24 +98,16 @@ if result.isSuccessful(): else: raise "Pig job FAILED" -\ - ,'sql' => "select name, age, gpa+0.00 from studenttab10k;" - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' -# 15.0.1 1 invoke from pig.pl -embedded +\, + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:';\, } ] }, { 'name' => 'Jython_CompileBindRun' ,'tests' => [ - { - # 8.1 1 compile pig script string - # 9.1 1 bind() without parameters - # 10.1 1 run a script that returns single positive result - # 12.1 1 python comments - # 14.0.4 (compile()bind().runSingle)+ - # 15.0.2 1 invoke from pig.pl with python script #!/bin/python + { # bind() with no parameters, runSingle 'num' => 1 ,'pig' => q\#!/usr/bin/python # JYTHON COMMENT @@ -194,53 +126,17 @@ if result.isSuccessful(): else: raise "Pig job FAILED" -\ - - ,'sql' => "select name, age, gpa from studenttab10k;" - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - # ,'expected_out_regex' => "Pig job PASSED" - - },{ - # 8.1 1 compile pig script string - # 9.1 1 bind() without parameters - # 10.1 1 run a script that returns single positive result - # 12.3 1 pig comments in pig script - # 14.0.9 (compile->(bind->runSingle)+)+ - - - - 'num' => 2 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig +\, - -#TEST PIG COMMENTS -P = Pig.compile(""" -A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); -store A into ':OUTPATH:';""") - -Q = P.bind() - -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" - \ - - ,'sql' => "select name, age, gpa from studenttab10k;" + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:';\, ,'floatpostprocess' => 1 ,'delimiter' => ' ' - # ,'expected_out_regex' => "Pig job PASSED" },{ # 9.2 1 bind single input parameter and no output parameters - 'num' => 3 + 'num' => 2 ,'pig' => q\#!/usr/bin/python -# 14.0.9 (compile->(bind->runSingle)+)+ from org.apache.pig.scripting import Pig @@ -258,6251 +154,289 @@ if result.isSuccessful(): else: raise "Pig job FAILED" -\ +\, - ,'sql' => "select name, age, gpa from studenttab10k;" + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:';\, ,'floatpostprocess' => 1 ,'delimiter' => ' ' # ,'expected_out_regex' => "Pig job PASSED" },{ -# 9.3 1 bind multiple input parameter and no output parameters -# 10.1 1 run a script that returns single positive result -# 14.0.9 (compile->(bind->runSingle)+)+ - 'num' => 4 +# bind parallel execution with a multiple entries + 'num' => 3 ,'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig -input1= ":INPATH:/singlefile/studenttab10k" -input2= ":INPATH:/singlefile/votertab10k" -input3= ":INPATH:/singlefile/studenttab10k" +input= ":INPATH:/singlefile/studenttab10k" +max1="50"; +output1= ":OUTPATH:.1" +max2="40.0"; +output2= ":OUTPATH:.2" +max3="30.0f"; +output3= ":OUTPATH:.3" P = Pig.compile(""" -A = load '$in1' as (name, age, gpa); -B = load '$in2' as (name, age, registration, contributions); -C = load '$in3' as (name, age, gpa); -store A into ':OUTPATH:.1'; -store B into ':OUTPATH:.2'; -store C into ':OUTPATH:.3'; +A = load '$in' as (name, age, gpa); +B= filter A by age < $max; +C = foreach B generate name; +store C into '$out'; +-- store C into put here as comment to fake multi-query """) -Q = P.bind({'in1':input1,'in2':input2, 'in3':input3}) -result = Q.runSingle() +Q = P.bind([ +{'in':input ,'max':max1 ,'out':output1 } + ,{'in':input ,'max':max2 ,'out':output2 } + ,{'in':input ,'max':max3 ,'out':output3 } + ]) -if result.isSuccessful(): - print "Pig job PASSED" +results = Q.run() +for i in [0, 1, 2]: + result = results[i] + if result.isSuccessful(): + print "Pig job PASSED" + else: + raise "Pig job FAILED" -else: - raise "Pig job FAILED" -\ +\, - ,'sql' => q\ -select name, age, gpa from studenttab10k; -select name, age, registration, contributions from votertab10k; -select name, age, gpa from studenttab10k;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' -# ,'expected_out_regex' => "Pig job PASSED" + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= filter A by age < 50; + C = foreach B generate name; + store C into ':OUTPATH:.1'; + A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= filter A by age < 40.0; + C = foreach B generate name; + store C into ':OUTPATH:.2'; + A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= filter A by age < 30.0f; + C = foreach B generate name; + store C into ':OUTPATH:.3'; +\, },{ -# 9.4 1 bind no input parameters and a single output arameter -# 10.1 1 run a script that returns single positive result -# 14.0.12 (single result =compile->result - 'num' => 5 - ,'pig' => q\#!/usr/bin/python +# 8.6 compile pig script file with no input and no output parameters +#12.2 import python modules +# + 'num' => 4 + ,'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig -input= ":INPATH:/singlefile/studenttab10k" -output = ":OUTPATH:" - -P = Pig.compile("""A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); store A into '$out';""") +#create pig script +pig_script = ":TMP:/script.pig" +pigfile = open( pig_script, 'w+') +pigfile.write(""" +A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); +store A into ':OUTPATH:'; +""") +pigfile.close() -Q = P.bind({'out':output}) +#execute pig script -result = Q.runSingle() +result = Pig.compileFromFile( pig_script ).bind().runSingle() if result.isSuccessful(): print "Pig job PASSED" - else: raise "Pig job FAILED" +\, + + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:'; \ + ,'floatpostprocess' => 1 + ,'delimiter' => ' ' + },{ +# 8.7 compile pig script file with no input and with output parameters + 'num' => 5 + ,'pig' => q\#!/usr/bin/python +from org.apache.pig.scripting import Pig - ,'sql' => q\select name, age, gpa from studenttab10k;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' -# ,'expected_out_regex' => "Pig job PASSED" +#create pig script - },{ -# 9.5 1 bind no input parameters and a multiple output parameter -# 10.1 1 run a script that returns single positive result -# 14.0.9 (compile->(bind->runSingle)+)+ - 'num' => 6 - ,'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig -output1 = ":OUTPATH:.1" -output2 = ":OUTPATH:.2" +#create pig script -P = Pig.compile(""" +pig_script = ":TMP:/script.pig" +pigfile = open( pig_script, 'w+') +pigfile.write(""" A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); -B = load ':INPATH:/singlefile/votertab10k' as (name, age, registration, contributions); -store A into '$out1'; -store B into '$out2'; +store A into '$out'; """) +pigfile.close() -Q = P.bind({'out1':output1,'out2':output2}) -result = Q.runSingle() +#execute pig script +output= ":OUTPATH:" + +result = Pig.compileFromFile(pig_script).bind({'out':output}).runSingle() if result.isSuccessful(): print "Pig job PASSED" - else: raise "Pig job FAILED" +\, + + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:'; \ + ,'floatpostprocess' => 1 + ,'delimiter' => ' ' - ,'sql' => q\select name, age, gpa from studenttab10k; -select name, age, registration, contributions from votertab10k;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' -# ,'expected_out_regex' => "Pig job PASSED" - },{ + },{ + # 11.15 1 results.getResults(alias) for null results + 'num' => 6 + ,'pig' => q\#!/usr/bin/python +from org.apache.pig.scripting import Pig +P = Pig.compile("""A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); +EMPTY= filter A by age > 9999; +store EMPTY into ':OUTPATH:'; +""") -# 9.6 1 bind multiple input parameters and a multiple output parameter -# 10.1 1 run a script that returns single positive result - 'num' => 7 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig +result = P.bind().runSingle() +\, -input1= ":INPATH:/singlefile/studenttab10k" -input2= ":INPATH:/singlefile/votertab10k" -output1 = ":OUTPATH:.1" -output2 = ":OUTPATH:.2" + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + EMPTY= filter A by age > 9999; + store EMPTY into ':OUTPATH:';\ + }, + { + # bind reading from python context + 'num' => 7 + ,'pig' => q\#!/usr/bin/python +from org.apache.pig.scripting import Pig -P = Pig.compile(""" -A = load '$in1' as (name, age, gpa); -B = load '$in2' as (name, age, registration, contributions); -store A into '$out1'; -store B into '$out2'; +P = Pig.compile("""A = load '$inpath' as (name, age, gpa); +B= filter A by age < $max; +store B into '$out'; """) -Q = P.bind({'in1':input1,'in2':input2, 'out1':output1, 'out2':output2 }) -result = Q.runSingle() +#execute pig script +inpath= ":INPATH:/singlefile/studenttab10k" +out= ":OUTPATH:" +max = 40 -if result.isSuccessful(): - print "Pig job PASSED" +result = P.bind().runSingle() +\, + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= filter A by age < 40; + store B into ':OUTPATH:';\ -else: - raise "Pig job FAILED" -\ + },{ + # bind multiple times + 'num' => 8 + ,'pig' => q\#!/usr/bin/python +from org.apache.pig.scripting import Pig - ,'sql' => q\select name, age, gpa from studenttab10k; -select name, age, registration, contributions from votertab10k;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - },{ +P = Pig.compile("""A = load '$inpath' as (name, age, gpa); +B= foreach A generate age + $i; +store B into '$out'; +-- extra store B into to force multiquery +""") +#execute pig script +inpath= ":INPATH:/singlefile/studenttab10k" +for i in [1,2,3]: + out= ":OUTPATH:." + str(i) + result = P.bind().runSingle() +\, + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= foreach A generate age + 1; + store B into ':OUTPATH:.1'; + A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= foreach A generate age + 2; + store B into ':OUTPATH:.2'; + A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + B= foreach A generate age + 3; + store B into ':OUTPATH:.3';\, -# 9.7 1 bind multiple input parameters and a multiple output parameter in any order -# 10.1 1 run a script that returns single positive result - 'num' => 8 - ,'pig' => q\#!/usr/bin/python + }, + { + # invoke .run() on a non-parallel pig script + 'num' => 9 + ,'pig' => q\#!/usr/bin/python +from org.apache.pig.scripting import Pig + +P = Pig.compile(""" +A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); +store A into ':OUTPATH:'; +""") +result = P.bind().run() +\, + 'verify_pig_script' => q\A = load ':INPATH:/singlefile/studenttab10k' as (name, age, gpa); + store A into ':OUTPATH:';\, + } + ] + },{ + 'name' => 'Jython_Diagnostics' + ,'tests' => [ + { +# 11.23 1 explain() on a complex query + 'num' => 1 + ,'ignore' => 'Expected output does not appear to be correct' + ,'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig input1= ":INPATH:/singlefile/studenttab10k" input2= ":INPATH:/singlefile/votertab10k" output1 = ":OUTPATH:.1" output2 = ":OUTPATH:.2" +maximum="20"; + +#No Schema specified P = Pig.compile(""" A = load '$in1' as (name, age, gpa); -B = load '$in2' as (name, age, registration, contributions); -store A into ':OUTPATH:.1'; -store B into ':OUTPATH:.2'; +B= filter A by age < $max; +C= foreach B generate name,age; +store C into '$out1'; +D = load '$in2' using PigStorage() as (name:chararray, age:int, registration, contributions:double); +E= filter D by age < $max; +F= foreach E generate name,age; +store F into '$out2'; """) -Q = P.bind({'in1':input1,'in2':input2 }) -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" +result = P.bind({'in1':input1, 'in2':input2, 'max':maximum, 'out1':output1, 'out2':output2 }).explain() \ - ,'sql' => q\select name, age, gpa from studenttab10k; -select name, age, registration, contributions from votertab10k;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - },{ + ,'rc'=> 0 + ,'expected_out_regex' => "Schema:.*{name:.*bytearray,age:.*bytearray}.*Type:.*Unknown" -# 9.8 bind parallel execution wit a single entry -# 10.1 run a script that returns single positive result -# 13.0.1 single pipeline that succeeds -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 9 - ,'pig' => q\#!/usr/bin/python + }, { +#11.22 1 illustrate() on a complex query + 'num' => 2 + ,'pig' => q\#!/usr/bin/python from org.apache.pig.scripting import Pig -input= ":INPATH:/singlefile/studenttab10k" -output= ":OUTPATH:" -maximum="50" +input1= ":INPATH:/singlefile/studenttab10k" +input2= ":INPATH:/singlefile/votertab10k" +output1 = ":OUTPATH:.1" +output2 = ":OUTPATH:.2" +maximum="20"; +#No Schema specified P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B = filter A by age < $max; -store B into '$out'; +A = load '$in1' as (name, age, gpa); +B= filter A by age < $max; +C= foreach B generate name,age; +store C into '$out1'; +D = load '$in2' using PigStorage() as (name:chararray, age:int, registration, contributions:double); +E= filter D by age < $max; +F= foreach E generate name,age; +store F into '$out2'; """) -Q = P.bind([ {'in':input ,'max':maximum ,'out':output} ]) - -results = Q.run() -for i in [0]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\select name, age, gpa from studenttab10k where age < 50;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED0" -# ,'rc' => 0 - - },{ -# 9.11 1 bind parallel execution with a multiple entries -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 10 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ -{'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - - },{ -# 9.13 For parallel execution, change the order of the entries, this should have no impact -# 10.2 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 11 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max3="30"; -output3= ":OUTPATH:.1" - -max1="50"; -output1= ":OUTPATH:.2" - -max2="40"; -output2= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ -{'in':input ,'max':max3 ,'out':output3} -,{'in':input ,'max':max1 ,'out':output1} -,{'in':input ,'max':max2 ,'out':output2} -]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 30; -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - - },{ - -# 9.8 1 bind input parameters that is undefined in python script -# 10.3 1 run a script that returns single negative result -#14.0.12 2 (parallel results = compile->bind->result - - 'num' => 12 - ,'ignore' => "Bugzilla()" - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" -output = ":OUTPATH:" - -P = Pig.compile("""A = load '$in' as (name, age, gpa); store A into '$out';""") - -Q = P.bind({'in':bad_input, 'out':output}) - -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" -\ - - ,'rc' => 6 - #,'expected_out_regex' => "Pig job FAILED" - #,'expected_err_regex' => "bad_input.*not defined" - ,'expected_err_regex' => "ERROR 1121" - - },{ -# 9.9 1 bind output parameters that is undefined in python script -# 10.3 1 run a script that returns single negative result - 'num' => 13 - ,'ignore' => "BUG(4249349)" - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" -output = ":OUTPATH:" - -P = Pig.compile("""A = load '$in' as (name, age, gpa); store A into '$out';""") - -Q = P.bind({'in':input, 'out':bad_output}) - -result = Q.runSingle() - -if result.isSuccessful(): - print "Pig job PASSED" - -else: - raise "Pig job FAILED" -\ - - ,'rc' => 2 - ,'expected_err_regex' => "INVALID.jar.*does not exist" - ,'expected_err_regex' => "ERROR 101" - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 14 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -results = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""").bind([ -{'in':input ,'max':max1 ,'out':output1 } -,{'in':input ,'max':max2 ,'out':output2 } -,{'in':input ,'max':max3 ,'out':output3 } -]).run() - -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).run - 'num' => 15 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ -{'in':input ,'max':max1 ,'out':output1 } -,{'in':input ,'max':max2 ,'out':output2 } -,{'in':input ,'max':max3 ,'out':output3 } -]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results - 'num' => 16 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ -{'in':input ,'max':max1 ,'out':output1 } -,{'in':input ,'max':max2 ,'out':output2 } -,{'in':input ,'max':max3 ,'out':output3 } -]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 17 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 18 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 19 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 20 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 21 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 22 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 23 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 24 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results - 'num' => 25 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results - 'num' => 26 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 27 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 28 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 29 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 30 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 31 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results - 'num' => 32 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 33 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 34 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 35 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 36 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 37 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 38 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 39 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 40 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 41 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 42 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 43 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 44 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 45 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 46 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 47 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 48 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 49 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 50 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 51 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 52 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: - result = results[i] - if result.isSuccessful(): - print "Pig job PASSED" - else: - raise "Pig job FAILED" - -\ - - ,'sql' => q\ -select name, age, gpa from studenttab10k where age < 50; -select name, age, gpa from studenttab10k where age < 40; -select name, age, gpa from studenttab10k where age < 30;\ - ,'floatpostprocess' => 1 - ,'delimiter' => ' ' - -# ,'expected_out_regex' => "Pig job PASSED1" -# ,'expected_out_regex' => "Pig job PASSED2" -# ,'expected_out_regex' => "Pig job PASSED3" -# ,'rc' => 0 - },{ -# 9.10 1 bind single inpput parameters with a parallel execution of scripts -# 10.2 1 run successful script that returns a list of positive result -# 13.0.4 multiple pipelines that succeed -# 13.0.5 run pipeline with multiple input and outputs -# 14.0.13 parallel results = compile.bind(parallel inputs).results -# 17.0.3 parallel execution : execute several data pipelines for the this pig script - 'num' => 53 - ,'pig' => q\#!/usr/bin/python -from org.apache.pig.scripting import Pig - -input= ":INPATH:/singlefile/studenttab10k" - -max1="50"; -output1= ":OUTPATH:.1" - -max2="40"; -output2= ":OUTPATH:.2" - -max3="30"; -output3= ":OUTPATH:.3" - - -P = Pig.compile(""" -A = load '$in' as (name, age, gpa); -B= filter A by age < $max; -store B into '$out'; -""") - -Q = P.bind([ - {'in':input ,'max':max1 ,'out':output1 } - ,{'in':input ,'max':max2 ,'out':output2 } - ,{'in':input ,'max':max3 ,'out':output3 } - ]) - -results = Q.run() -for i in [0, 1, 2]: [... 4464 lines stripped ...]