распознавание текста по изображению - PullRequest
2 голосов
/ 21 ноября 2011

Как распознать рукописный текст на изображении?

Я пробовал библиотеку Tesseract (версия 2), но она работает не слишком хорошо. Её обновлённые версии тоже работают плохо. Я также скачал демонстрационный проект Pocket OCR, но он не компилируется. Я скомпилировал и подключил библиотеки Tesseract, но теперь получаю следующую ошибку компоновки:

    Ld /Users/Arkenea/Library/Developer/Xcode/DerivedData/OCR-airiipqjvidtcogttlxdbnqufnnl/Build/Products/Debug-iphonesimulator/OCR.app/OCR normal i386
    cd "/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2"
    setenv PATH "/Developer/Platforms/iPhoneSimulator.platform/Developer/usr/bin:/Developer/usr/bin:/usr/bin:/bin:/usr/sbin:/sbin"
    /Developer/Platforms/iPhoneSimulator.platform/Developer/usr/bin/clang++ -arch i386 -isysroot /Developer/Platforms/iPhoneSimulator.platform/Developer/SDKs/iPhoneSimulator5.0.sdk -L/Users/Arkenea/Library/Developer/Xcode/DerivedData/OCR-airiipqjvidtcogttlxdbnqufnnl/Build/Products/Debug-iphonesimulator "-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2" "-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/../../tesseract-ocr-svn" "-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/../../tesseract-ocr-svn/outdir" "-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib" -F/Users/Arkenea/Library/Developer/Xcode/DerivedData/OCR-airiipqjvidtcogttlxdbnqufnnl/Build/Products/Debug-iphonesimulator -filelist /Users/Arkenea/Library/Developer/Xcode/DerivedData/OCR-airiipqjvidtcogttlxdbnqufnnl/Build/Intermediates/OCR.build/Debug-iphonesimulator/OCR.build/Objects-normal/i386/OCR.LinkFileList -Xlinker -objc_abi_version -Xlinker 2 -Xlinker -no_implicit_dylibs -D__IPHONE_OS_VERSION_MIN_REQUIRED=30102 -framework Foundation -framework UIKit -framework CoreGraphics -framework MessageUI -ltesseract_api -ltesseract_ccstruct -ltesseract_ccutil -ltesseract_classify -ltesseract_cutil -ltesseract_dict -ltesseract_image -ltesseract_textord -ltesseract_training -ltesseract_viewer -ltesseract_wordrec -ltesseract_main -llept.2.0.0 -llept.2 -llept -llept -ltesseract.3.0.1 -ltesseract.3 -ltesseract -ltesseract -o /Users/Arkenea/Library/Developer/Xcode/DerivedData/OCR-airiipqjvidtcogttlxdbnqufnnl/Build/Products/Debug-iphonesimulator/OCR.app/OCR

ld: warning: directory not found for option '-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/../../tesseract-ocr-svn'
ld: warning: directory not found for option '-L/Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/../../tesseract-ocr-svn/outdir'
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_api.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_ccstruct.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_ccutil.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_classify.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_cutil.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_dict.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_image.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_textord.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_training.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_viewer.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_wordrec.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/libtesseract_main.a, file was built for archive which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/liblept.2.0.0.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/liblept.2.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/liblept.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/libtesseract.3.0.1.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/libtesseract.3.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
ld: warning: ignoring file /Users/Arkenea/Desktop/suraj/notepad/rcarlsen-Pocket-OCR-9912da9 2/lib/libtesseract.dylib, file was built for unsupported file format which is not the architecture being linked (i386)
Undefined symbols for architecture i386:
  "tesseract::TessBaseAPI::End()", referenced from:
      -[OCRDisplayViewController dealloc] in OCRDisplayViewController.o
  "tesseract::TessBaseAPI::TessBaseAPI()", referenced from:
      -[OCRDisplayViewController viewDidLoad] in OCRDisplayViewController.o
  "tesseract::TessBaseAPI::Init(char const*, char const*, tesseract::OcrEngineMode, char**, int, GenericVector<STRING> const*, GenericVector<STRING> const*, bool)", referenced from:
      tesseract::TessBaseAPI::Init(char const*, char const*) in OCRDisplayViewController.o
  "tesseract::TessBaseAPI::TesseractRect(unsigned char const*, int, int, int, int, int, int)", referenced from:
      -[OCRDisplayViewController readAndProcessImage:] in OCRDisplayViewController.o
      -[OCRDisplayViewController threadedReadAndProcessImage:] in OCRDisplayViewController.o
ld: symbol(s) not found for architecture i386
clang: error: linker command failed with exit code 1 (use -v to see invocation)

Может ли кто-нибудь помочь мне или указать мне на некоторые замечательные ресурсы?

1 Ответ

1 голос
/ 09 января 2012

Для этого нужно задать некоторые настройки, например: `tesseract->Init([dataPath cStringUsingEncoding:NSUTF8StringEncoding], "eng"); tesseract->SetVariable("tessedit_char_whitelist", "ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789.!@#$%^&*()_+/{}|?"); tesseract->AllWordConfidences();`

задайте белый список символов в соответствии с вашими требованиями

и установите режим по умолчанию или в соответствии с вашими требованиями

Добро пожаловать на сайт PullRequest, где вы можете задавать вопросы и получать ответы от других членов сообщества.
...