Something like the below…
// Sketch of a flow that reads records from MongoDB, fetches the pictures that
// are not yet stored, and writes the fetched content to HBase.
// xxx / yyy are placeholders left for the reader to fill in.

// Head of the assembly.
Pipe p = new Pipe("picture url pipe");

// Pass the "picture-url" field through an Identity function.
p = new Each(p, new Fields("picture-url"), new Identity());

// Assume this only emits entries where picture isn't in HBase
p = new Each(p, new Fields("picture-url"), new MyCustomHBaseOperation());

// FetchPipe (from Bixo) is a sub-assembly, so keep it in its own variable:
// getContentTailPipe() is not available on a plain Pipe reference.
// NOTE(review): presumably the upstream pipe `p` is one of the constructor
// arguments hidden behind xxx/yyy - confirm against the Bixo FetchPipe API.
FetchPipe fetchPipe = new FetchPipe(xxx, yyy);

// Two pipes come out of the sub-assembly - one has status, one has fetched
// content. Only the content tail is used from here on.
p = fetchPipe.getContentTailPipe();

// Get content into form/fields required for HBase.
p = new Each(p, new MyCustomContentPreparer());

// Source and sink taps for the flow.
Tap source = new MongoDBTap(xxx);
Tap sink = new HBaseDBTap(xxx);

// FlowConnector must be instantiated before connect() can be called on it.
Flow f = new FlowConnector().connect(source, sink, p);