#!/bin/bash
# Finetune with your specific font - see e.g. below, which uses the IMPACT font.
#
# The shebang must be the very first line of the file to take effect, and the
# description above must be a comment so the shell does not try to execute it.
#
# Abort on the first failing step: each stage below consumes files produced by
# an earlier stage, so continuing after a failure only produces confusing
# follow-on errors.
set -euo pipefail
# Build the fine-tuning (training) set: run tesstrain.sh on the stock English
# training text with the "Impact Condensed" font. The results land in
# ~/tesstutorial/engtrainfont, whose eng.training_files.txt is used later as
# the --train_listfile for lstmtraining.
train_set_opts=(
  --fonts_dir /usr/share/fonts
  --lang eng --linedata_only
  --noextract_font_properties
  --langdata_dir ~/langdata
  --tessdata_dir ~/tessdata
  --fontlist "Impact Condensed"
  --training_text ~/langdata/eng/eng.training_text
  --workspace_dir ~/tmp/
  --save_box_tiff
  --output_dir ~/tesstutorial/engtrainfont
)
time ~/tesseract/src/training/tesstrain.sh "${train_set_opts[@]}"
# Build the evaluation set: same font and options as the training set, but
# rendered from a custom word-list text (eng.mywordlist.training_text). The
# results land in ~/tesstutorial/engevalwordlist, whose eng.training_files.txt
# is used later as the --eval_listfile for lstmeval.
eval_set_opts=(
  --fonts_dir /usr/share/fonts
  --lang eng --linedata_only
  --noextract_font_properties
  --langdata_dir ~/langdata
  --tessdata_dir ~/tessdata
  --fontlist "Impact Condensed"
  --training_text ~/langdata/eng/eng.mywordlist.training_text
  --workspace_dir ~/tmp/
  --save_box_tiff
  --output_dir ~/tesstutorial/engevalwordlist
)
time ~/tesseract/src/training/tesstrain.sh "${eval_set_opts[@]}"
# Fine-tune the existing fully-trained English model on the Impact training set.
# The banner uses `echo -e` with "\n" (backslash) like the other banners in
# this script, so it prints blank lines instead of a literal "/n".
echo -e "\n****** Finetune one of the fully-trained existing models: ***********\n"
mkdir -p ~/tesstutorial/impact_from_full
# Pull the LSTM component out of the stock eng.traineddata; the resulting
# eng.lstm file is the starting point handed to --continue_from below.
combine_tessdata -e ~/tessdata_best/eng.traineddata \
  ~/tesstutorial/impact_from_full/eng.lstm
# Train from that starting point on the Impact line data generated earlier.
# Output files use the prefix ~/tesstutorial/impact_from_full/impact; the
# later evaluation and conversion steps read "impact_checkpoint" from there.
# --max_iterations 400 keeps this a short fine-tuning run.
time ~/tesseract/src/training/lstmtraining \
  --model_output ~/tesstutorial/impact_from_full/impact \
  --continue_from ~/tesstutorial/impact_from_full/eng.lstm \
  --traineddata ~/tessdata_best/eng.traineddata \
  --train_listfile ~/tesstutorial/engtrainfont/eng.training_files.txt \
  --debug_interval -1 \
  --max_iterations 400
# Score the fine-tuned checkpoint against the same line data it was trained on
# (~/tesstutorial/engtrainfont).
printf '%b\n' "\n*********** eval on training data ******\n"
train_eval_opts=(
  --model ~/tesstutorial/impact_from_full/impact_checkpoint
  --traineddata ~/tessdata_best/eng.traineddata
  --eval_listfile ~/tesstutorial/engtrainfont/eng.training_files.txt
)
time ~/tesseract/src/training/lstmeval "${train_eval_opts[@]}"
# Score the fine-tuned checkpoint against the separate word-list evaluation set
# (~/tesstutorial/engevalwordlist).
printf '%b\n' "\n***********eval on eval data ******\n"
heldout_eval_opts=(
  --model ~/tesstutorial/impact_from_full/impact_checkpoint
  --traineddata ~/tessdata_best/eng.traineddata
  --eval_listfile ~/tesstutorial/engevalwordlist/eng.training_files.txt
)
time ~/tesseract/src/training/lstmeval "${heldout_eval_opts[@]}"
# Convert the fine-tuned checkpoint into a final .traineddata file.
# lstmtraining is invoked via ~/tesseract/src/training/ like every other
# training tool in this script (previously a cwd-relative "../tesseract/..."
# path, which only worked when run from a sibling directory of ~/tesseract).
# NOTE(review): the result is written into the engtrainfont directory rather
# than impact_from_full - confirm that this is the intended location.
echo -e "\n*********** convert to traineddata ******\n"
time ~/tesseract/src/training/lstmtraining \
  --stop_training \
  --continue_from ~/tesstutorial/impact_from_full/impact_checkpoint \
  --traineddata ~/tessdata_best/eng.traineddata \
  --model_output ~/tesstutorial/engtrainfont/eng.traineddata