They look alike.
http://www.fonts2u.com/dejavu-sans-extralight.font
http://www.fontsaddict.com/font/dejavu-sans-extralight.html
On Friday, July 18, 2014 6:34:15 AM UTC-5, Mustak M wrote:
>
> I am using Java wrapper Tess4J. Using following code to retrieve the font
> type and font size from an image. The image contains "Arial" font text and
> font size is 48. The code is returning font type as
> font: DejaVu_Sans_Ultra-Light, size: 13
>
> Code:
>
> * public*
> *static* *void* testResultIterator() *throws* Exception {
>
> String *datapath* =
> "tessdata";
>
> String *language* =
> "eng";
>
> String *expOCRResult* =
> "The (quick) [brown] {fox} jumps!\nOver the $43,456.78 <lazy> #90 dog";
>
> TessAPI1.TessBaseAPI handle;
>
> handle = TessAPI1.*TessBaseAPICreate*();
>
> System.
> *out*.println("TessBaseAPIGetIterator");
>
> String lang =
> "eng";
>
> File tiff =
> *new* File("C:\\1\\CaptureArial.JPG");
>
> BufferedImage image = ImageIO.*read*(
> *new* FileInputStream(tiff)); // require *jai*-*imageio* *lib* to read
> TIFF
>
> ByteBuffer buf = ImageIOHelper.*convertImageData*(image);
>
> *int* bpp = image.getColorModel().getPixelSize();
>
> *int* bytespp = bpp / 8;
>
> *int* bytespl = (*int*) Math.*ceil*(image.getWidth() * bpp / 8.0);
>
> TessAPI1.*TessBaseAPIInit3*(handle,
> "tessdata", lang);
>
> TessAPI1.*TessBaseAPISetPageSegMode*(handle, TessAPI1.TessPageSegMode.
> *PSM_AUTO*);
>
> TessAPI1.*TessBaseAPISetImage*(handle, buf, image.getWidth(),
> image.getHeight(), bytespp, bytespl);
>
> TessAPI1.*TessBaseAPIRecognize*(handle,
> *null*);
>
> TessAPI1.TessResultIterator ri = TessAPI1.*TessBaseAPIGetIterator*
> (handle);
>
> TessAPI1.TessPageIterator pi = TessAPI1.
> *TessResultIteratorGetPageIterator*(ri);
>
> TessAPI1.*TessPageIteratorBegin*(pi);
>
> System.
> *out*.println("Bounding boxes:\nchar(s) left top right bottom confidence
> font-attributes");
>
> // *int* height = image.getHeight();
>
> *do* {
>
> Pointer ptr = TessAPI1.*TessResultIteratorGetUTF8Text*(ri,
> TessAPI1.TessPageIteratorLevel.
> *RIL_WORD*);
>
> String word = ptr.getString(0);
>
> TessAPI1.*TessDeleteText*(ptr);
>
> *float* confidence = TessAPI1.*TessResultIteratorConfidence*(ri,
> TessAPI1.TessPageIteratorLevel.*RIL_WORD*);
>
> IntBuffer leftB = IntBuffer.*allocate*(1);
>
> IntBuffer topB = IntBuffer.*allocate*(1);
>
> IntBuffer rightB = IntBuffer.*allocate*(1);
>
> IntBuffer bottomB = IntBuffer.*allocate*(1);
>
> TessAPI1.*TessPageIteratorBoundingBox*(pi, TessAPI1.TessPageIteratorLevel.
> *RIL_WORD*, leftB, topB, rightB, bottomB);
>
> *int* left = leftB.get();
>
> *int* top = topB.get();
>
> *int* right = rightB.get();
>
> *int* bottom = bottomB.get();
>
> System.
> *out*.print(String.*format*("%s %d %d %d %d %f", word, left, top, right,
> bottom, confidence));
>
> // System.out.println(String.format("%s %d %d %d %d", *str*, left, height
> - bottom, right, height - top)); // training box coordinates
>
> IntBuffer boldB = IntBuffer.*allocate*(1);
>
> IntBuffer italicB = IntBuffer.*allocate*(1);
>
> IntBuffer underlinedB = IntBuffer.*allocate*(1);
>
> IntBuffer monospaceB = IntBuffer.*allocate*(1);
>
> IntBuffer serifB = IntBuffer.*allocate*(1);
>
> IntBuffer smallcapsB = IntBuffer.*allocate*(1);
>
> IntBuffer pointSizeB = IntBuffer.*allocate*(1);
>
> IntBuffer fontIdB = IntBuffer.*allocate*(1);
>
> String fontName = TessAPI1.*TessResultIteratorWordFontAttributes*(ri,
> boldB, italicB, underlinedB,
>
> monospaceB, serifB, smallcapsB, pointSizeB, fontIdB);
>
> *boolean* bold = boldB.get() == TessAPI1.*TRUE*;
>
> *boolean* italic = italicB.get() == TessAPI1.*TRUE*;
>
> *boolean* underlined = underlinedB.get() == TessAPI1.*TRUE*;
>
> *boolean* monospace = monospaceB.get() == TessAPI1.*TRUE*;
>
> *boolean* serif = serifB.get() == TessAPI1.*TRUE*;
>
> *boolean* smallcaps = smallcapsB.get() == TessAPI1.*TRUE*;
>
> *int* pointSize = pointSizeB.get();
>
> *int* fontId = fontIdB.get();
>
> System.
> *out*.println(String.*format*(" font: %s, size: %d, font id: %d, bold:
> %b," +
>
> " italic: %b, underlined: %b, monospace: %b, serif: %b, smallcap: %b",
>
> fontName, pointSize, fontId, bold, italic, underlined, monospace, serif,
> smallcaps));
>
> }
> *while* (TessAPI1.*TessPageIteratorNext*(pi,
> TessAPI1.TessPageIteratorLevel.*RIL_WORD*) == TessAPI1.*TRUE*);
>
> }
>
> ---------
>
> Its the same code refered from
>
>
> *http://sourceforge.net/p/tess4j/code/HEAD/tree/Tess4J_3/trunk/test/net/sourceforge/tess4j/TessAPI1Test.java#l447*
>
> <http://sourceforge.net/p/tess4j/code/HEAD/tree/Tess4J_3/trunk/test/net/sourceforge/tess4j/TessAPI1Test.java#l447>
>
> ----
>
> Any thoughts !
>
> Image file attached for reference.
>
>
>
> Thanks
>
>
>
>
>
--
You received this message because you are subscribed to the Google Groups
"tesseract-ocr" group.
To unsubscribe from this group and stop receiving emails from it, send an email
to [email protected].
To post to this group, send email to [email protected].
Visit this group at http://groups.google.com/group/tesseract-ocr.
To view this discussion on the web visit
https://groups.google.com/d/msgid/tesseract-ocr/e3f43b71-adc3-4e6d-ac98-f39ca72887f6%40googlegroups.com.
For more options, visit https://groups.google.com/d/optout.