That means Tesseract can't find the nobatch and box.train.stderr config
files. Check whether these files are in your "tessdata" directory; if not,
you must download them. It would also be better to set the TESSDATA_PREFIX
environment variable.

On 6 June 2012 00:37, Vince <[email protected]> wrote:

> I'm new to tesseract.  I'm trying to train a font using the
> instructions found here:
>
> http://code.google.com/p/tesseract-ocr/wiki/TrainingTesseract3
>
> I've generated a bmp and box file.  I'm trying to generate a tr file
> using tesseract.exe
>
> I can email the input files to anyone who's interested.
>
> C:\Users\vharron\Documents\shares\ocr>C:\Users\vharron\Documents\p4\wip
> \dte\ocr\tesseract\vs2008\LIB_Debug\tesseractd.exe
> eng.Arial_Regular.exp0.bmp eng.Arial_Regular.exp0.box nobatch
> box.train.stderr
> read_params_file: Can't open nobatch
> read_params_file: Can't open box.train.stderr
> Tesseract Open Source OCR Engine v3.02 with Leptonica
> index >= 0 && index < size_used_:Error:Assert failed:in file c:\users
> \vharron\documents\p4\wip\dte\ocr\tesseract\ccutil\genericvector.h,
> line 512
>
> ERRCODE::error(const char * caller=0x015d58e0, TessErrorLogCode
> action=ABORT, const char * format=0x015d58cc, ...)  Line 86 + 0x6
> bytes   C++
> GenericVector<tesseract::FontInfo>::get(int index=0)  Line 512 + 0x31
> bytes   C++
> UnicityTable<tesseract::FontInfo>::get(int id=0)  Line 134      C++
> tesseract::LanguageModel::FillConsistencyInfo(int curr_col=3, bool
> word_end=false, BLOB_CHOICE * b=0x19cb8428,
> tesseract::ViterbiStateEntry * parent_vse=0x19cc1bb0, BLOB_CHOICE *
> parent_b=0x19cb8178, CHUNKS_RECORD * chunks_record=0x0042f460,
> tesseract::LanguageModelConsistencyInfo *
> consistency_info=0x0042f014)  Line 1125 + 0x29 bytes    C++
> tesseract::LanguageModel::AddViterbiStateEntry(unsigned char
> top_choice_flags=' ', float denom=1.0000000, bool word_end=false, int
> curr_col=3, int curr_row=3, BLOB_CHOICE * b=0x19cb8428, BLOB_CHOICE *
> parent_b=0x19cb8178, tesseract::ViterbiStateEntry *
> parent_vse=0x19cc1bb0, HEAP * pain_points=0x19cbc370,
> tesseract::BestPathByColumn * * best_path_by_column=0x0042f34c,
> CHUNKS_RECORD * chunks_record=0x0042f460, tesseract::BestChoiceBundle
> * best_choice_bundle=0x0042f2f4, BlamerBundle *
> blamer_bundle=0x00000000)  Line 511     C++
> tesseract::LanguageModel::UpdateState(unsigned char changed=' ', int
> curr_col=3, int curr_row=3, BLOB_CHOICE_LIST * curr_list=0x19cb83e8,
> BLOB_CHOICE_LIST * parent_list=0x19cb8138, HEAP *
> pain_points=0x19cbc370, tesseract::BestPathByColumn * *
> best_path_by_column=0x0042f34c, CHUNKS_RECORD *
> chunks_record=0x0042f460, tesseract::BestChoiceBundle *
> best_choice_bundle=0x0042f2f4, BlamerBundle *
> blamer_bundle=0x00000000)  Line 372 + 0x53 bytes        C++
> tesseract::Wordrec::UpdateSegSearchNodes(int starting_col=0,
> SEG_SEARCH_PENDING_LIST * * pending=0x0042f2e8,
> tesseract::BestPathByColumn * * best_path_by_column=0x0042f34c,
> CHUNKS_RECORD * chunks_record=0x0042f460, HEAP *
> pain_points=0x19cbc370, tesseract::BestChoiceBundle *
> best_choice_bundle=0x0042f2f4, BlamerBundle *
> blamer_bundle=0x00000000)  Line 215 + 0x40 bytes        C++
> tesseract::Wordrec::SegSearch(CHUNKS_RECORD *
> chunks_record=0x0042f460, WERD_CHOICE * best_choice=0x19cae588,
> GenericVector<BLOB_CHOICE_LIST *> * best_char_choices=0x19c98438,
> WERD_CHOICE * raw_choice=0x19cae708, STATE *
> output_best_state=0x0042f57c, BlamerBundle *
> blamer_bundle=0x00000000)  Line 117     C++
> tesseract::Wordrec::word_associator(bool
> only_create_ratings_matrix=false, WERD_RES * word=0x19332b70, STATE *
> state=0x0042f57c, GenericVector<BLOB_CHOICE_LIST *> *
> best_char_choices=0x19c98438, GenericVector<DANGERR_INFO> *
> fixpt=0x0042f554, STATE * best_state=0x0042f57c)  Line 1031     C++
> tesseract::Wordrec::chop_word_main(WERD_RES * word=0x19332b70)  Line
> 646 + 0x1e bytes        C++
> tesseract::Wordrec::cc_recog(WERD_RES * word=0x19332b70)  Line 121 +
> 0xc bytes       C++
> tesseract::Tesseract::recog_word_recursive(WERD_RES * word=0x19332b70,
> BLOB_CHOICE_LIST_CLIST * blob_choices=0x19c7b600)  Line 116 + 0xc
> bytes   C++
> tesseract::Tesseract::recog_word(WERD_RES * word=0x19332b70,
> BLOB_CHOICE_LIST_CLIST * blob_choices=0x19c7b600)  Line 58      C++
> tesseract::Tesseract::tess_segment_pass1(WERD_RES * word=0x19332b70,
> BLOB_CHOICE_LIST_CLIST * blob_choices=0x19c7b600)  Line 57      C++
> tesseract::Tesseract::classify_word_pass1(BLOCK * block=0x18e21cc8,
> ROW * row=0x18d5d590, WERD_RES * word=0x19332b70)  Line 879     C++
> tesseract::Tesseract::classify_word_and_language(void (BLOCK *, ROW *,
> WERD_RES *)* recognizer=0x01236c40, BLOCK * block=0x18e21cc8, ROW *
> row=0x18d5d590, WERD_RES * word=0x19332b70)  Line 813 + 0x1a bytes      C++
> tesseract::Tesseract::recog_all_words(PAGE_RES * page_res=0x1760dd68,
> ETEXT_DESC * monitor=0x00000000, const TBOX *
> target_word_box=0x00000000, const char * word_config=0x00000000, int
> dopasses=0)  Line 262   C++
> tesseract::TessBaseAPI::Recognize(ETEXT_DESC * monitor=0x00000000)
> Line 696 + 0x1c bytes   C++
> tesseract::TessBaseAPI::ProcessPage(Pix * pix=0x00ba3590, int
> page_index=0, const char * filename=0x00292914, const char *
> retry_config=0x00000000, int timeout_millisec=0, STRING *
> text_out=0x0042fb28)  Line 880 + 0xa bytes      C++
> tesseract::TessBaseAPI::ProcessPages(const char * filename=0x00292914,
> const char * retry_config=0x00000000, int timeout_millisec=0, STRING *
> text_out=0x0042fb28)  Line 795 + 0x24 bytes     C++
> main(int argc=5, char * * argv=0x002928a8)  Line 156 + 0x17 bytes       C++
> __tmainCRTStartup()  Line 586 + 0x19 bytes      C
> mainCRTStartup()  Line 403      C
>
> --
> You received this message because you are subscribed to the Google
> Groups "tesseract-ocr" group.
> To post to this group, send email to [email protected]
> To unsubscribe from this group, send email to
> [email protected]
> For more options, visit this group at
> http://groups.google.com/group/tesseract-ocr?hl=en
>

-- 
You received this message because you are subscribed to the Google
Groups "tesseract-ocr" group.
To post to this group, send email to [email protected]
To unsubscribe from this group, send email to
[email protected]
For more options, visit this group at
http://groups.google.com/group/tesseract-ocr?hl=en

Reply via email to