> hadoop jar /home/hadoop/my-job-0.2.0-standalone.jar clojure.main s3://my-bucket/path/to/file.csv ~/out
Exception in thread "main" java.io.FileNotFoundException: s3://my-bucket/path/to/file.csv (No such file or directory)
    at java.io.FileInputStream.open(Native Method)
    at java.io.FileInputStream.<init>(FileInputStream.java:146)
    at java.io.FileInputStream.<init>(FileInputStream.java:101)
    at clojure.lang.Compiler.loadFile(Compiler.java:7314)
    at clojure.main$load_script.invokeStatic(main.clj:275)
    at clojure.main$load_script.invoke(main.clj:268)
    at clojure.main$script_opt.invokeStatic(main.clj:337)
    at clojure.main$script_opt.invoke(main.clj:330)
    at clojure.main$main.invokeStatic(main.clj:421)
    at clojure.main$main.doInvoke(main.clj:384)
    at clojure.lang.RestFn.invoke(RestFn.java:421)
    at clojure.lang.Var.invoke(Var.java:383)
    at clojure.lang.AFn.applyToHelper(AFn.java:156)
    at clojure.lang.Var.applyTo(Var.java:700)
    at clojure.main.main(main.java:37)
    at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
    at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:57)
    at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
    at java.lang.reflect.Method.invoke(Method.java:606)
    at org.apache.hadoop.util.RunJar.run(RunJar.java:221)
    at org.apache.hadoop.util.RunJar.main(RunJar.java:136)
IllegalArgumentException AWS Access Key ID and Secret Access Key must be specified as the username or password (respectively) of a s3n URL, or by setting the fs.s3n.awsAccessKeyId or fs.s3n.awsSecretAccessKey properties (respectively). org.apache.hadoop.fs.s3.S3Credentials.initialize (S3Credentials.java:66)
;; Leiningen project definition for refpath-count, version 0.2.0.
(defproject refpath-count "0.2.0"
  :description "FIXME: write description"
  :url "http://example.com/FIXME"
  ;; The license map is closed right after :name; left open, every following
  ;; key would be read as part of the license map and the form would not balance.
  :license {:name "Eclipse Public License"}
  :repositories {"conjars" "http://conjars.org/repo"}
  :dependencies [[org.clojure/clojure "1.8.0"]
                 [cascalog/cascalog-core "3.0.0"]
                 [cascalog/cascalog-more-taps "3.0.0"]]
  :profiles {:dev {:dependencies [[org.apache.hadoop/hadoop-core "1.2.1"]
                                  [cascalog/midje-cascalog "3.0.0"]]
                   ;; :plugins is a key inside a profile; placed directly under
                   ;; :profiles it would be treated as a profile name instead.
                   :plugins [[lein-midje "3.0.1"]]}
             ;; hadoop-core is "provided": needed to compile, but expected to
             ;; be supplied by the runtime rather than bundled in the uberjar.
             :provided {:dependencies [[org.apache.hadoop/hadoop-core "1.2.1"]]}}
  :jvm-opts ["-Xms768m" "-Xmx768m"]
  ;; No main namespace is declared for the jar; main.core is only
  ;; compiled ahead of time.
  :main nil
  :aot [main.core])
hadoop jar /home/hadoop/my-job-0.2.0-standalone.jar clojure.main s3://my-bucket/path/to/file.csv ~/out
;; Main function; the namespace holding it is the one named in project.clj.
(defn -main
  "Runs the refpath-count query.

  in   - location of the comma-delimited input, read through hfs-delimited.
  out  - location the comma-delimited result is written to; the sink is
         opened with :sinkmode :replace.
  args - any further command-line arguments; accepted but unused.

  The query emits ?refpath / ?count pairs produced by refpath-counts applied
  to the result of user-consideration-paths over the input tap (both are
  defined elsewhere; see their definitions for the exact semantics)."
  [in out & args]
  ;; To print results instead of writing them, the sink below can be
  ;; replaced with (stdout).
  (?- (hfs-delimited out :sinkmode :replace :delimiter ",")
      (<- [?refpath ?count]
          ((refpath-counts
            (user-consideration-paths
             (hfs-delimited in :delimiter ",")))
           :> ?refpath ?count))))
;; Leiningen project definition for refpath-count, version 0.2.1.
(defproject refpath-count "0.2.1"
  :description "FIXME: write description"
  :url "http://example.com/FIXME"
  ;; The license map is closed right after :name; left open, every following
  ;; key would be read as part of the license map and the form would not balance.
  :license {:name "Eclipse Public License"}
  :repositories {"conjars" "http://conjars.org/repo"}
  :dependencies [[org.clojure/clojure "1.8.0"]
                 [cascalog/cascalog-core "3.0.0"]
                 [cascalog/cascalog-more-taps "3.0.0"]]
  :profiles {:dev {:dependencies [[org.apache.hadoop/hadoop-core "1.2.1"]
                                  [cascalog/midje-cascalog "3.0.0"]]
                   ;; :plugins is a key inside a profile; placed directly under
                   ;; :profiles it would be treated as a profile name instead.
                   :plugins [[lein-midje "3.0.1"]]}
             ;; hadoop-core is "provided": needed to compile, but expected to
             ;; be supplied by the runtime rather than bundled in the uberjar.
             :provided {:dependencies [[org.apache.hadoop/hadoop-core "1.2.1"]]}
             ;; Compile every namespace ahead of time when building the uberjar.
             :uberjar {:aot :all}}
  :jvm-opts ["-Xms768m" "-Xmx768m"]
  ;; Entry-point namespace, given as a symbol (the form Leiningen documents).
  :main main.core)