Following that, the first, less ambitious invocation fails repeatedly after 15k files have been read:
$ bin/fac lda --read-dirs $mytextdir --num-topics 20 --num-iterations 100
java -Xmx6g -ea -Djava.awt.headless=true -Dfile.encoding=UTF-8 -server -classpath ./src/main/resources:./target/classes:./target/factorie_2.11-1.3-SNAPSHOT-jar-with-dependencies.jar
Reading files from directory <redacted>
1000 2000 3000 4000 5000 6000 7000 8000 9000 10000
11000 12000 13000 14000 15000Exception in thread "main" java.io.FileNotFoundException: <redacted>/2015-05-21-08503-b121d690-6f96-4d11-97c1-187554b704d2.txt (Too many open files)
at java.io.FileInputStream.open0(Native Method)
at java.io.FileInputStream.open(FileInputStream.java:195)
at java.io.FileInputStream.<init>(FileInputStream.java:138)
at cc.factorie.app.topics.lda.Document$.fromFile(Document.scala:141)
at cc.factorie.app.topics.lda.LDACmd$$anonfun$main$4$$anonfun$apply$1$$anonfun$apply$mcV$sp$2.apply(LDA.scala:333)
at cc.factorie.app.topics.lda.LDACmd$$anonfun$main$4$$anonfun$apply$1$$anonfun$apply$mcV$sp$2.apply(LDA.scala:331)
at scala.collection.TraversableLike$WithFilter$$anonfun$foreach$1.apply(TraversableLike.scala:733)
at scala.collection.IndexedSeqOptimized$class.foreach(IndexedSeqOptimized.scala:33)
at scala.collection.mutable.ArrayOps$ofRef.foreach(ArrayOps.scala:186)
at scala.collection.TraversableLike$WithFilter.foreach(TraversableLike.scala:732)
at cc.factorie.app.topics.lda.LDACmd$$anonfun$main$4$$anonfun$apply$1.apply$mcV$sp(LDA.scala:331)
at scala.util.control.Breaks.breakable(Breaks.scala:38)
at cc.factorie.app.topics.lda.LDACmd$$anonfun$main$4.apply(LDA.scala:331)
at cc.factorie.app.topics.lda.LDACmd$$anonfun$main$4.apply(LDA.scala:328)
at scala.collection.immutable.List.foreach(List.scala:381)
at cc.factorie.app.topics.lda.LDACmd.main(LDA.scala:328)
at cc.factorie.app.topics.lda.LDA.main(LDA.scala)
Any tip or insight is very much appreciated.