Ravenports generated: 28 Mar 2021 15:51
[ravenports.git] / bucket_5D / tesseract
1 # Buildsheet autogenerated by ravenadm tool -- Do not edit.
2
3 NAMEBASE=               tesseract
4 VERSION=                4.1.1
5 REVISION=               1
6 KEYWORDS=               graphics
7 VARIANTS=               standard
8 SDESC[standard]=        OCR (Optical Character Recognition) engine
9 HOMEPAGE=               https://github.com/tesseract-ocr/tesseract
10 CONTACT=                nobody
11
12 DOWNLOAD_GROUPS=        main
13 SITES[main]=            GITHUB/tesseract-ocr:tesseract:4.1.1
14 DISTFILE[1]=            generated:main
15 DF_INDEX=               1
16 SPKGS[standard]=        complete
17                         tools
18                         library
19
20 OPTIONS_AVAILABLE=      none
21 OPTIONS_STANDARD=       none
22
23 BUILDRUN_DEPENDS=       fontconfig:primary:standard
24                         icu:single:standard
25                         leptonica:single:standard
26                         llvm:single:standard
27                         pango:primary:standard
28 RUN_DEPENDS=            tesseract-data:latin:standard
29 EXRUN[tools]=           tesseract:library:standard
30
31 USES=                   autoreconf libtool pkgconfig shebangfix
32 C_USES[freebsd]=        fortran:library
33
34 FPC_EQUIVALENT=         graphics/tesseract
35 SHEBANG_FILES=          {{WRKSRC}}/src/training/tesstrain.sh
36                         {{WRKSRC}}/src/training/language-specific.sh
37
38 MUST_CONFIGURE=         gnu
39 CONFIGURE_ENV=          LIBLEPT_HEADERSDIR="{{LOCALBASE}}/include/leptonica"
40
41 MAKE_ARGS=              datadir={{LOCALBASE}}/share/tesseract-data
42
43 INSTALL_TARGET=         install-strip training-install
44 INSTALL_REQ_TOOLCHAIN=  yes
45 SOVERSION=              4.0.1
46
47 LDFLAGS=                -lpthread
48
49 post-patch:
50         ${REINPLACE_CMD} -e 's|-O3 -DNDEBUG||' ${WRKSRC}/configure.ac
51
52 [FILE:54:descriptions/desc.tools]
53 This package contains the Tesseract OCR engine tools.
54
55
56 [FILE:291:descriptions/desc.library]
57 The Tesseract OCR engine was one of the top 3 engines in the 1995 UNLV
58 Accuracy test. Between 1995 and 2006 it had little work done on it, but
59 it is probably one of the most accurate open source OCR engines available.
60 The source code will read a binary, grey or color image and output text.
61
62
63 [FILE:115:distinfo]
64 2a66ff0d8595bff8f04032165e6c936389b1e5727c3ce5a27b3e059d218db1cb      1974988 tesseract-ocr-tesseract-4.1.1.tar.gz
65
66
67 [FILE:310:manifests/plist.tools]
68 bin/
69  ambiguous_words
70  classifier_tester
71  cntraining
72  combine_lang_model
73  combine_tessdata
74  dawg2wordlist
75  language-specific.sh
76  lstmeval
77  lstmtraining
78  merge_unicharsets
79  mftraining
80  set_unicharset_properties
81  shapeclustering
82  tesstrain.sh
83  tesstrain_utils.sh
84  text2image
85  unicharset_extractor
86  wordlist2dawg
87
88
89 [FILE:732:manifests/plist.library]
90 bin/tesseract
91 include/tesseract/
92  apitypes.h
93  baseapi.h
94  capi.h
95  genericvector.h
96  helpers.h
97  ltrresultiterator.h
98  ocrclass.h
99  osdetect.h
100  pageiterator.h
101  platform.h
102  publictypes.h
103  renderer.h
104  resultiterator.h
105  serialis.h
106  strngs.h
107  tess_version.h
108  tesscallback.h
109  thresholder.h
110  unichar.h
111 lib/
112  libtesseract.a
113  libtesseract.so
114  libtesseract.so.%%SOMAJOR%%
115  libtesseract.so.%%SOVERSION%%
116 lib/pkgconfig/tesseract.pc
117 share/tesseract-data/
118  alto
119  ambigs.train
120  api_config
121  batch
122  batch.nochop
123  bigram
124  box.train
125  box.train.stderr
126  digits
127  get.images
128  hocr
129  inter
130  kannada
131  linebox
132  logfile
133  lstm.train
134  lstmbox
135  lstmdebug
136  makebox
137  matdemo
138  msdemo
139  nobatch
140  pdf
141  pdf.ttf
142  quiet
143  rebox
144  segdemo
145  strokewidth
146  tsv
147  txt
148  unlv
149  wordstrbox
150
151
152 [FILE:609:freebsd/patch-configure.ac]
153 sem_init(3) is part of libc on FreeBSD, so we ended up not linking against
154 libpthread. Look for a symbol that causes us to load it.
155 libtesseract.so is not linked against libomp if openmp is enabled,
156 which makes dependent ports fail. This adds a workaround by linking
157 directly against libomp.
158 --- configure.ac.orig   2019-07-07 12:34:08 UTC
159 +++ configure.ac
160 @@ -372,6 +372,9 @@ esac
161  # ----------------------------------------
162  
163  AC_SEARCH_LIBS([pthread_create], [pthread])
164 +if test "$enable_openmp" != no; then
165 +  AC_SEARCH_LIBS([omp_get_thread_num ], [omp])
166 +fi
167  
168  
169  # ----------------------------------------
170
171
172 [FILE:276:freebsd/patch-src_ccutil_ocrclass.h]
173 --- src/ccutil/ocrclass.h.orig  2019-07-07 12:34:08 UTC
174 +++ src/ccutil/ocrclass.h
175 @@ -31,6 +31,7 @@
176  #ifdef _WIN32
177  #include <winsock2.h> // for timeval
178  #endif
179 +#include <sys/time.h>
180  
181  /**********************************************************************
182   * EANYCODE_CHAR
183