When I pass the following file pattern:
/user/tholden/dedupe/2013/05/0[89]/part-*.avro
to my Pangool MapReduce job using TupleMRBuilder.addInput(Path, InputFormat, TupleMapper), the job works fine.
13/10/03 12:19:52 INFO mapred.JobClient: Cleaning up the staging area hdfs://hadoop1.mitre.org:8020/tmp/hadoop/mapred/staging/tholden/.staging/job_201309130701_61526
Exception in thread "main" java.lang.ArrayIndexOutOfBoundsException: 1
at com.datasalt.pangool.tuplemr.mapred.lib.input.PangoolMultipleInputs.getInputFormatMap(PangoolMultipleInputs.java:121)
at com.datasalt.pangool.tuplemr.mapred.lib.input.DelegatingInputFormat.getSplits(DelegatingInputFormat.java:52)
at org.apache.hadoop.mapred.JobClient.writeNewSplits(JobClient.java:998)
at org.apache.hadoop.mapred.JobClient.writeSplits(JobClient.java:1015)
at org.apache.hadoop.mapred.JobClient.access$600(JobClient.java:174)
at org.apache.hadoop.mapred.JobClient$2.run(JobClient.java:928)
at org.apache.hadoop.mapred.JobClient$2.run(JobClient.java:881)
at java.security.AccessController.doPrivileged(Native Method)
at javax.security.auth.Subject.doAs(Subject.java:396)
at org.apache.hadoop.security.UserGroupInformation.doAs(UserGroupInformation.java:1278)
at org.apache.hadoop.mapred.JobClient.submitJobInternal(JobClient.java:881)
at org.apache.hadoop.mapreduce.Job.submit(Job.java:526)
at org.apache.hadoop.mapreduce.Job.waitForCompletion(Job.java:556)
at org.mitre.ttv.CompareToolBase.run(CompareToolBase.java:108)
at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:65)
at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:79)
at org.mitre.ttv.CompareADSBtoTTTool.main(CompareADSBtoTTTool.java:25)
at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:39)
at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:25)
at java.lang.reflect.Method.invoke(Method.java:597)
at org.apache.hadoop.util.RunJar.main(RunJar.java:197)