-
Notifications
You must be signed in to change notification settings - Fork 14
/
Copy patha00107_source.html
355 lines (353 loc) · 45.4 KB
/
a00107_source.html
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "https://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml">
<head>
<meta http-equiv="Content-Type" content="text/xhtml;charset=UTF-8"/>
<meta http-equiv="X-UA-Compatible" content="IE=9"/>
<meta name="generator" content="Doxygen 1.8.16"/>
<meta name="viewport" content="width=device-width, initial-scale=1"/>
<title>tesseract: /tesseract/src/arch/simddetect.cpp Source File</title>
<link href="tabs.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="jquery.js"></script>
<script type="text/javascript" src="dynsections.js"></script>
<link href="navtree.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="resize.js"></script>
<script type="text/javascript" src="navtreedata.js"></script>
<script type="text/javascript" src="navtree.js"></script>
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
$(document).ready(initResizable);
/* @license-end */</script>
<link href="search/search.css" rel="stylesheet" type="text/css"/>
<script type="text/javascript" src="search/searchdata.js"></script>
<script type="text/javascript" src="search/search.js"></script>
<link href="doxygen.css" rel="stylesheet" type="text/css" />
</head>
<body>
<div id="top"><!-- do not remove this div, it is closed by doxygen! -->
<div id="titlearea">
<table cellspacing="0" cellpadding="0">
<tbody>
<tr style="height: 56px;">
<td id="projectalign" style="padding-left: 0.5em;">
<div id="projectname">tesseract
 <span id="projectnumber">5.0.0-alpha-619-ge9db</span>
</div>
</td>
</tr>
</tbody>
</table>
</div>
<!-- end header part -->
<!-- Generated by Doxygen 1.8.16 -->
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
var searchBox = new SearchBox("searchBox", "search",false,'Search');
/* @license-end */
</script>
<script type="text/javascript" src="menudata.js"></script>
<script type="text/javascript" src="menu.js"></script>
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
$(function() {
initMenu('',true,false,'search.php','Search');
$(document).ready(function() { init_search(); });
});
/* @license-end */</script>
<div id="main-nav"></div>
</div><!-- top -->
<div id="side-nav" class="ui-resizable side-nav-resizable">
<div id="nav-tree">
<div id="nav-tree-contents">
<div id="nav-sync" class="sync"></div>
</div>
</div>
<div id="splitbar" style="-moz-user-select:none;"
class="ui-resizable-handle">
</div>
</div>
<script type="text/javascript">
/* @license magnet:?xt=urn:btih:cf05388f2679ee054f2beb29a391d25f4e673ac3&dn=gpl-2.0.txt GPL-v2 */
$(document).ready(function(){initNavTree('a00107_source.html','');});
/* @license-end */
</script>
<div id="doc-content">
<!-- window showing the filter options -->
<div id="MSearchSelectWindow"
onmouseover="return searchBox.OnSearchSelectShow()"
onmouseout="return searchBox.OnSearchSelectHide()"
onkeydown="return searchBox.OnSearchSelectKey(event)">
</div>
<!-- iframe showing the search results (closed by default) -->
<div id="MSearchResultsWindow">
<iframe src="javascript:void(0)" frameborder="0"
name="MSearchResults" id="MSearchResults">
</iframe>
</div>
<div class="header">
<div class="headertitle">
<div class="title">simddetect.cpp</div> </div>
</div><!--header-->
<div class="contents">
<a href="a00107.html">Go to the documentation of this file.</a><div class="fragment"><div class="line"><a name="l00001"></a><span class="lineno"> 1</span> <span class="comment">// File: simddetect.cpp</span></div>
<div class="line"><a name="l00003"></a><span class="lineno"> 3</span> <span class="comment">// Description: Architecture detector.</span></div>
<div class="line"><a name="l00004"></a><span class="lineno"> 4</span> <span class="comment">// Author: Stefan Weil (based on code from Ray Smith)</span></div>
<div class="line"><a name="l00005"></a><span class="lineno"> 5</span> <span class="comment">//</span></div>
<div class="line"><a name="l00006"></a><span class="lineno"> 6</span> <span class="comment">// (C) Copyright 2014, Google Inc.</span></div>
<div class="line"><a name="l00007"></a><span class="lineno"> 7</span> <span class="comment">// Licensed under the Apache License, Version 2.0 (the "License");</span></div>
<div class="line"><a name="l00008"></a><span class="lineno"> 8</span> <span class="comment">// you may not use this file except in compliance with the License.</span></div>
<div class="line"><a name="l00009"></a><span class="lineno"> 9</span> <span class="comment">// You may obtain a copy of the License at</span></div>
<div class="line"><a name="l00010"></a><span class="lineno"> 10</span> <span class="comment">// http://www.apache.org/licenses/LICENSE-2.0</span></div>
<div class="line"><a name="l00011"></a><span class="lineno"> 11</span> <span class="comment">// Unless required by applicable law or agreed to in writing, software</span></div>
<div class="line"><a name="l00012"></a><span class="lineno"> 12</span> <span class="comment">// distributed under the License is distributed on an "AS IS" BASIS,</span></div>
<div class="line"><a name="l00013"></a><span class="lineno"> 13</span> <span class="comment">// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.</span></div>
<div class="line"><a name="l00014"></a><span class="lineno"> 14</span> <span class="comment">// See the License for the specific language governing permissions and</span></div>
<div class="line"><a name="l00015"></a><span class="lineno"> 15</span> <span class="comment">// limitations under the License.</span></div>
<div class="line"><a name="l00017"></a><span class="lineno"> 17</span> <span class="comment"></span> </div>
<div class="line"><a name="l00018"></a><span class="lineno"> 18</span> <span class="preprocessor">#include "config_auto.h"</span> <span class="comment">// for HAVE_AVX, ...</span></div>
<div class="line"><a name="l00019"></a><span class="lineno"> 19</span> <span class="preprocessor">#include <numeric></span> <span class="comment">// for std::inner_product</span></div>
<div class="line"><a name="l00020"></a><span class="lineno"> 20</span> <span class="preprocessor">#include "<a class="code" href="a00110.html">simddetect.h</a>"</span></div>
<div class="line"><a name="l00021"></a><span class="lineno"> 21</span> <span class="preprocessor">#include "<a class="code" href="a00083.html">dotproduct.h</a>"</span></div>
<div class="line"><a name="l00022"></a><span class="lineno"> 22</span> <span class="preprocessor">#include "<a class="code" href="a00098.html">intsimdmatrix.h</a>"</span> <span class="comment">// for IntSimdMatrix</span></div>
<div class="line"><a name="l00023"></a><span class="lineno"> 23</span> <span class="preprocessor">#include "<a class="code" href="a00554.html">params.h</a>"</span> <span class="comment">// for STRING_VAR</span></div>
<div class="line"><a name="l00024"></a><span class="lineno"> 24</span> <span class="preprocessor">#include "<a class="code" href="a00584.html">tprintf.h</a>"</span> <span class="comment">// for tprintf</span></div>
<div class="line"><a name="l00025"></a><span class="lineno"> 25</span>  </div>
<div class="line"><a name="l00026"></a><span class="lineno"> 26</span> <span class="preprocessor">#if defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_FMA) || defined(HAVE_SSE4_1)</span></div>
<div class="line"><a name="l00027"></a><span class="lineno"> 27</span> <span class="preprocessor"># define HAS_CPUID</span></div>
<div class="line"><a name="l00028"></a><span class="lineno"> 28</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00029"></a><span class="lineno"> 29</span>  </div>
<div class="line"><a name="l00030"></a><span class="lineno"> 30</span> <span class="preprocessor">#if defined(HAS_CPUID)</span></div>
<div class="line"><a name="l00031"></a><span class="lineno"> 31</span> <span class="preprocessor">#if defined(__GNUC__)</span></div>
<div class="line"><a name="l00032"></a><span class="lineno"> 32</span> <span class="preprocessor"># include <cpuid.h></span></div>
<div class="line"><a name="l00033"></a><span class="lineno"> 33</span> <span class="preprocessor">#elif defined(_WIN32)</span></div>
<div class="line"><a name="l00034"></a><span class="lineno"> 34</span> <span class="preprocessor"># include <intrin.h></span></div>
<div class="line"><a name="l00035"></a><span class="lineno"> 35</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00036"></a><span class="lineno"> 36</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00037"></a><span class="lineno"> 37</span>  </div>
<div class="line"><a name="l00038"></a><span class="lineno"> 38</span> <span class="keyword">namespace </span><a class="code" href="a01818.html">tesseract</a> {</div>
<div class="line"><a name="l00039"></a><span class="lineno"> 39</span>  </div>
<div class="line"><a name="l00040"></a><span class="lineno"> 40</span> <span class="comment">// Computes and returns the dot product of the two n-vectors u and v.</span></div>
<div class="line"><a name="l00041"></a><span class="lineno"> 41</span> <span class="comment">// Note: because the order of addition is different among the different dot</span></div>
<div class="line"><a name="l00042"></a><span class="lineno"> 42</span> <span class="comment">// product functions, the results can (and do) vary slightly (although they</span></div>
<div class="line"><a name="l00043"></a><span class="lineno"> 43</span> <span class="comment">// agree to within about 4e-15). This produces different results when running</span></div>
<div class="line"><a name="l00044"></a><span class="lineno"> 44</span> <span class="comment">// training, despite all random inputs being precisely equal.</span></div>
<div class="line"><a name="l00045"></a><span class="lineno"> 45</span> <span class="comment">// To get consistent results, use just one of these dot product functions.</span></div>
<div class="line"><a name="l00046"></a><span class="lineno"> 46</span> <span class="comment">// On a test multi-layer network, serial is 57% slower than SSE, and AVX</span></div>
<div class="line"><a name="l00047"></a><span class="lineno"> 47</span> <span class="comment">// is about 8% faster than SSE. This suggests that the time is memory</span></div>
<div class="line"><a name="l00048"></a><span class="lineno"> 48</span> <span class="comment">// bandwidth constrained and could benefit from holding the reused vector</span></div>
<div class="line"><a name="l00049"></a><span class="lineno"> 49</span> <span class="comment">// in AVX registers.</span></div>
<div class="line"><a name="l00050"></a><span class="lineno"><a class="line" href="a01818.html#a9ab0e86b57d2b88cdc6af72ff02c93d2"> 50</a></span> <a class="code" href="a01818.html#a33bdb7f88c6be930b0ea0d866f616ecf">DotProductFunction</a> <a class="code" href="a01818.html#a9ab0e86b57d2b88cdc6af72ff02c93d2">DotProduct</a>;</div>
<div class="line"><a name="l00051"></a><span class="lineno"> 51</span>  </div>
<div class="line"><a name="l00052"></a><span class="lineno"> 52</span> <span class="keyword">static</span> <a class="code" href="a00554.html#abaa7778083ba376d8c70a59631d4a6ab">STRING_VAR</a>(dotproduct, <span class="stringliteral">"auto"</span>,</div>
<div class="line"><a name="l00053"></a><span class="lineno"> 53</span>  <span class="stringliteral">"Function used for calculation of dot product"</span>);</div>
<div class="line"><a name="l00054"></a><span class="lineno"> 54</span>  </div>
<div class="line"><a name="l00055"></a><span class="lineno"> 55</span> <a class="code" href="a02574.html">SIMDDetect</a> SIMDDetect::detector;</div>
<div class="line"><a name="l00056"></a><span class="lineno"> 56</span>  </div>
<div class="line"><a name="l00057"></a><span class="lineno"> 57</span> <span class="comment">// If true, then AVX has been detected.</span></div>
<div class="line"><a name="l00058"></a><span class="lineno"> 58</span> <span class="keywordtype">bool</span> SIMDDetect::avx_available_;</div>
<div class="line"><a name="l00059"></a><span class="lineno"> 59</span> <span class="keywordtype">bool</span> SIMDDetect::avx2_available_;</div>
<div class="line"><a name="l00060"></a><span class="lineno"> 60</span> <span class="keywordtype">bool</span> SIMDDetect::avx512F_available_;</div>
<div class="line"><a name="l00061"></a><span class="lineno"> 61</span> <span class="keywordtype">bool</span> SIMDDetect::avx512BW_available_;</div>
<div class="line"><a name="l00062"></a><span class="lineno"> 62</span> <span class="comment">// If true, then FMA has been detected.</span></div>
<div class="line"><a name="l00063"></a><span class="lineno"> 63</span> <span class="keywordtype">bool</span> SIMDDetect::fma_available_;</div>
<div class="line"><a name="l00064"></a><span class="lineno"> 64</span> <span class="comment">// If true, then SSe4.1 has been detected.</span></div>
<div class="line"><a name="l00065"></a><span class="lineno"> 65</span> <span class="keywordtype">bool</span> SIMDDetect::sse_available_;</div>
<div class="line"><a name="l00066"></a><span class="lineno"> 66</span>  </div>
<div class="line"><a name="l00067"></a><span class="lineno"> 67</span> <span class="comment">// Computes and returns the dot product of the two n-vectors u and v.</span></div>
<div class="line"><a name="l00068"></a><span class="lineno"> 68</span> <span class="keyword">static</span> <span class="keywordtype">double</span> DotProductGeneric(<span class="keyword">const</span> <span class="keywordtype">double</span>* u, <span class="keyword">const</span> <span class="keywordtype">double</span>* v, <span class="keywordtype">int</span> n) {</div>
<div class="line"><a name="l00069"></a><span class="lineno"> 69</span>  <span class="keywordtype">double</span> total = 0.0;</div>
<div class="line"><a name="l00070"></a><span class="lineno"> 70</span>  <span class="keywordflow">for</span> (<span class="keywordtype">int</span> k = 0; k < n; ++k) total += u[k] * v[k];</div>
<div class="line"><a name="l00071"></a><span class="lineno"> 71</span>  <span class="keywordflow">return</span> total;</div>
<div class="line"><a name="l00072"></a><span class="lineno"> 72</span> }</div>
<div class="line"><a name="l00073"></a><span class="lineno"> 73</span>  </div>
<div class="line"><a name="l00074"></a><span class="lineno"> 74</span> <span class="comment">// Compute dot product using std::inner_product.</span></div>
<div class="line"><a name="l00075"></a><span class="lineno"> 75</span> <span class="keyword">static</span> <span class="keywordtype">double</span> DotProductStdInnerProduct(<span class="keyword">const</span> <span class="keywordtype">double</span>* u, <span class="keyword">const</span> <span class="keywordtype">double</span>* v, <span class="keywordtype">int</span> n) {</div>
<div class="line"><a name="l00076"></a><span class="lineno"> 76</span>  <span class="keywordflow">return</span> std::inner_product(u, u + n, v, 0.0);</div>
<div class="line"><a name="l00077"></a><span class="lineno"> 77</span> }</div>
<div class="line"><a name="l00078"></a><span class="lineno"> 78</span>  </div>
<div class="line"><a name="l00079"></a><span class="lineno"> 79</span> <span class="keyword">static</span> <span class="keywordtype">void</span> SetDotProduct(<a class="code" href="a01818.html#a33bdb7f88c6be930b0ea0d866f616ecf">DotProductFunction</a> f, <span class="keyword">const</span> IntSimdMatrix* m = <span class="keyword">nullptr</span>) {</div>
<div class="line"><a name="l00080"></a><span class="lineno"> 80</span>  <a class="code" href="a01818.html#a9ab0e86b57d2b88cdc6af72ff02c93d2">DotProduct</a> = f;</div>
<div class="line"><a name="l00081"></a><span class="lineno"> 81</span>  <a class="code" href="a02570.html#ad7321e9f71f4d5e2c8920c370acb25ac">IntSimdMatrix::intSimdMatrix</a> = m;</div>
<div class="line"><a name="l00082"></a><span class="lineno"> 82</span> }</div>
<div class="line"><a name="l00083"></a><span class="lineno"> 83</span>  </div>
<div class="line"><a name="l00084"></a><span class="lineno"> 84</span> <span class="comment">// Constructor.</span></div>
<div class="line"><a name="l00085"></a><span class="lineno"> 85</span> <span class="comment">// Tests the architecture in a system-dependent way to detect AVX, SSE and</span></div>
<div class="line"><a name="l00086"></a><span class="lineno"> 86</span> <span class="comment">// any other available SIMD equipment.</span></div>
<div class="line"><a name="l00087"></a><span class="lineno"> 87</span> <span class="comment">// __GNUC__ is also defined by compilers that include GNU extensions such as</span></div>
<div class="line"><a name="l00088"></a><span class="lineno"> 88</span> <span class="comment">// clang.</span></div>
<div class="line"><a name="l00089"></a><span class="lineno"> 89</span> SIMDDetect::SIMDDetect() {</div>
<div class="line"><a name="l00090"></a><span class="lineno"> 90</span>  <span class="comment">// The fallback is a generic dot product calculation.</span></div>
<div class="line"><a name="l00091"></a><span class="lineno"> 91</span>  SetDotProduct(DotProductGeneric);</div>
<div class="line"><a name="l00092"></a><span class="lineno"> 92</span>  </div>
<div class="line"><a name="l00093"></a><span class="lineno"> 93</span> <span class="preprocessor">#if defined(HAS_CPUID)</span></div>
<div class="line"><a name="l00094"></a><span class="lineno"> 94</span> <span class="preprocessor">#if defined(__GNUC__)</span></div>
<div class="line"><a name="l00095"></a><span class="lineno"> 95</span>  <span class="keywordtype">unsigned</span> <span class="keywordtype">int</span> eax, ebx, ecx, edx;</div>
<div class="line"><a name="l00096"></a><span class="lineno"> 96</span>  <span class="keywordflow">if</span> (__get_cpuid(1, &eax, &ebx, &ecx, &edx) != 0) {</div>
<div class="line"><a name="l00097"></a><span class="lineno"> 97</span>  <span class="comment">// Note that these tests all use hex because the older compilers don't have</span></div>
<div class="line"><a name="l00098"></a><span class="lineno"> 98</span>  <span class="comment">// the newer flags.</span></div>
<div class="line"><a name="l00099"></a><span class="lineno"> 99</span> <span class="preprocessor">#if defined(HAVE_SSE4_1)</span></div>
<div class="line"><a name="l00100"></a><span class="lineno"> 100</span>  sse_available_ = (ecx & 0x00080000) != 0;</div>
<div class="line"><a name="l00101"></a><span class="lineno"> 101</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00102"></a><span class="lineno"> 102</span> <span class="preprocessor">#if defined(HAVE_FMA)</span></div>
<div class="line"><a name="l00103"></a><span class="lineno"> 103</span>  fma_available_ = (ecx & 0x00001000) != 0;</div>
<div class="line"><a name="l00104"></a><span class="lineno"> 104</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00105"></a><span class="lineno"> 105</span> <span class="preprocessor">#if defined(HAVE_AVX)</span></div>
<div class="line"><a name="l00106"></a><span class="lineno"> 106</span>  avx_available_ = (ecx & 0x10000000) != 0;</div>
<div class="line"><a name="l00107"></a><span class="lineno"> 107</span>  <span class="keywordflow">if</span> (avx_available_) {</div>
<div class="line"><a name="l00108"></a><span class="lineno"> 108</span>  <span class="comment">// There is supposed to be a __get_cpuid_count function, but this is all</span></div>
<div class="line"><a name="l00109"></a><span class="lineno"> 109</span>  <span class="comment">// there is in my cpuid.h. It is a macro for an asm statement and cannot</span></div>
<div class="line"><a name="l00110"></a><span class="lineno"> 110</span>  <span class="comment">// be used inside an if.</span></div>
<div class="line"><a name="l00111"></a><span class="lineno"> 111</span>  __cpuid_count(7, 0, eax, ebx, ecx, edx);</div>
<div class="line"><a name="l00112"></a><span class="lineno"> 112</span>  avx2_available_ = (ebx & 0x00000020) != 0;</div>
<div class="line"><a name="l00113"></a><span class="lineno"> 113</span>  avx512F_available_ = (ebx & 0x00010000) != 0;</div>
<div class="line"><a name="l00114"></a><span class="lineno"> 114</span>  avx512BW_available_ = (ebx & 0x40000000) != 0;</div>
<div class="line"><a name="l00115"></a><span class="lineno"> 115</span>  }</div>
<div class="line"><a name="l00116"></a><span class="lineno"> 116</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00117"></a><span class="lineno"> 117</span>  }</div>
<div class="line"><a name="l00118"></a><span class="lineno"> 118</span> <span class="preprocessor"># elif defined(_WIN32)</span></div>
<div class="line"><a name="l00119"></a><span class="lineno"> 119</span>  <span class="keywordtype">int</span> cpuInfo[4];</div>
<div class="line"><a name="l00120"></a><span class="lineno"> 120</span>  <span class="keywordtype">int</span> max_function_id;</div>
<div class="line"><a name="l00121"></a><span class="lineno"> 121</span>  __cpuid(cpuInfo, 0);</div>
<div class="line"><a name="l00122"></a><span class="lineno"> 122</span>  max_function_id = cpuInfo[0];</div>
<div class="line"><a name="l00123"></a><span class="lineno"> 123</span>  <span class="keywordflow">if</span> (max_function_id >= 1) {</div>
<div class="line"><a name="l00124"></a><span class="lineno"> 124</span>  __cpuid(cpuInfo, 1);</div>
<div class="line"><a name="l00125"></a><span class="lineno"> 125</span> <span class="preprocessor">#if defined(HAVE_SSE4_1)</span></div>
<div class="line"><a name="l00126"></a><span class="lineno"> 126</span>  sse_available_ = (cpuInfo[2] & 0x00080000) != 0;</div>
<div class="line"><a name="l00127"></a><span class="lineno"> 127</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00128"></a><span class="lineno"> 128</span> <span class="preprocessor">#if defined(HAVE_AVX) || defined(HAVE_AVX2) || defined(HAVE_FMA)</span></div>
<div class="line"><a name="l00129"></a><span class="lineno"> 129</span>  <span class="keywordflow">if</span> ((cpuInfo[2] & 0x08000000) && ((_xgetbv(0) & 6) == 6)) {</div>
<div class="line"><a name="l00130"></a><span class="lineno"> 130</span>  <span class="comment">// OSXSAVE bit is set, XMM state and YMM state are fine.</span></div>
<div class="line"><a name="l00131"></a><span class="lineno"> 131</span> <span class="preprocessor">#if defined(HAVE_FMA)</span></div>
<div class="line"><a name="l00132"></a><span class="lineno"> 132</span>  fma_available_ = (cpuInfo[2] & 0x00001000) != 0;</div>
<div class="line"><a name="l00133"></a><span class="lineno"> 133</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00134"></a><span class="lineno"> 134</span> <span class="preprocessor">#if defined(HAVE_AVX)</span></div>
<div class="line"><a name="l00135"></a><span class="lineno"> 135</span>  avx_available_ = (cpuInfo[2] & 0x10000000) != 0;</div>
<div class="line"><a name="l00136"></a><span class="lineno"> 136</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00137"></a><span class="lineno"> 137</span> <span class="preprocessor">#if defined(HAVE_AVX2)</span></div>
<div class="line"><a name="l00138"></a><span class="lineno"> 138</span>  <span class="keywordflow">if</span> (max_function_id >= 7) {</div>
<div class="line"><a name="l00139"></a><span class="lineno"> 139</span>  __cpuid(cpuInfo, 7);</div>
<div class="line"><a name="l00140"></a><span class="lineno"> 140</span>  avx2_available_ = (cpuInfo[1] & 0x00000020) != 0;</div>
<div class="line"><a name="l00141"></a><span class="lineno"> 141</span>  avx512F_available_ = (cpuInfo[1] & 0x00010000) != 0;</div>
<div class="line"><a name="l00142"></a><span class="lineno"> 142</span>  avx512BW_available_ = (cpuInfo[1] & 0x40000000) != 0;</div>
<div class="line"><a name="l00143"></a><span class="lineno"> 143</span>  }</div>
<div class="line"><a name="l00144"></a><span class="lineno"> 144</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00145"></a><span class="lineno"> 145</span>  }</div>
<div class="line"><a name="l00146"></a><span class="lineno"> 146</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00147"></a><span class="lineno"> 147</span>  }</div>
<div class="line"><a name="l00148"></a><span class="lineno"> 148</span> <span class="preprocessor">#else</span></div>
<div class="line"><a name="l00149"></a><span class="lineno"> 149</span> <span class="preprocessor">#error "I don't know how to test for SIMD with this compiler"</span></div>
<div class="line"><a name="l00150"></a><span class="lineno"> 150</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00151"></a><span class="lineno"> 151</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00152"></a><span class="lineno"> 152</span>  </div>
<div class="line"><a name="l00153"></a><span class="lineno"> 153</span>  <span class="comment">// Select code for calculation of dot product based on autodetection.</span></div>
<div class="line"><a name="l00154"></a><span class="lineno"> 154</span>  <span class="keywordflow">if</span> (<span class="keyword">false</span>) {</div>
<div class="line"><a name="l00155"></a><span class="lineno"> 155</span>  <span class="comment">// This is a dummy to support conditional compilation.</span></div>
<div class="line"><a name="l00156"></a><span class="lineno"> 156</span> <span class="preprocessor">#if defined(HAVE_AVX2)</span></div>
<div class="line"><a name="l00157"></a><span class="lineno"> 157</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (avx2_available_) {</div>
<div class="line"><a name="l00158"></a><span class="lineno"> 158</span>  <span class="comment">// AVX2 detected.</span></div>
<div class="line"><a name="l00159"></a><span class="lineno"> 159</span>  SetDotProduct(<a class="code" href="a01818.html#aa41529fcf80de7ee0e8cc5691fbee53b">DotProductAVX</a>, &<a class="code" href="a02570.html#a503a9e29415ca20f74d48fd9665a0f0c">IntSimdMatrix::intSimdMatrixAVX2</a>);</div>
<div class="line"><a name="l00160"></a><span class="lineno"> 160</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00161"></a><span class="lineno"> 161</span> <span class="preprocessor">#if defined(HAVE_AVX)</span></div>
<div class="line"><a name="l00162"></a><span class="lineno"> 162</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (avx_available_) {</div>
<div class="line"><a name="l00163"></a><span class="lineno"> 163</span>  <span class="comment">// AVX detected.</span></div>
<div class="line"><a name="l00164"></a><span class="lineno"> 164</span>  SetDotProduct(<a class="code" href="a01818.html#aa41529fcf80de7ee0e8cc5691fbee53b">DotProductAVX</a>, &<a class="code" href="a02570.html#ad7aed52d7915512a59818a5efda68c1e">IntSimdMatrix::intSimdMatrixSSE</a>);</div>
<div class="line"><a name="l00165"></a><span class="lineno"> 165</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00166"></a><span class="lineno"> 166</span> <span class="preprocessor">#if defined(HAVE_SSE4_1)</span></div>
<div class="line"><a name="l00167"></a><span class="lineno"> 167</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (sse_available_) {</div>
<div class="line"><a name="l00168"></a><span class="lineno"> 168</span>  <span class="comment">// SSE detected.</span></div>
<div class="line"><a name="l00169"></a><span class="lineno"> 169</span>  SetDotProduct(<a class="code" href="a01818.html#ad3b5fe062bd97bc8cb1117a29fa24ac2">DotProductSSE</a>, &<a class="code" href="a02570.html#ad7aed52d7915512a59818a5efda68c1e">IntSimdMatrix::intSimdMatrixSSE</a>);</div>
<div class="line"><a name="l00170"></a><span class="lineno"> 170</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00171"></a><span class="lineno"> 171</span>  }</div>
<div class="line"><a name="l00172"></a><span class="lineno"> 172</span> }</div>
<div class="line"><a name="l00173"></a><span class="lineno"> 173</span>  </div>
<div class="line"><a name="l00174"></a><span class="lineno"><a class="line" href="a02574.html#af2ebffb31ead931cd95f89ae15c367d9"> 174</a></span> <span class="keywordtype">void</span> <a class="code" href="a02574.html#af2ebffb31ead931cd95f89ae15c367d9">SIMDDetect::Update</a>() {</div>
<div class="line"><a name="l00175"></a><span class="lineno"> 175</span>  <span class="comment">// Select code for calculation of dot product based on the</span></div>
<div class="line"><a name="l00176"></a><span class="lineno"> 176</span>  <span class="comment">// value of the config variable if that value is not empty.</span></div>
<div class="line"><a name="l00177"></a><span class="lineno"> 177</span>  <span class="keyword">const</span> <span class="keywordtype">char</span>* dotproduct_method = <span class="stringliteral">"generic"</span>;</div>
<div class="line"><a name="l00178"></a><span class="lineno"> 178</span>  <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"auto"</span>)) {</div>
<div class="line"><a name="l00179"></a><span class="lineno"> 179</span>  <span class="comment">// Automatic detection. Nothing to be done.</span></div>
<div class="line"><a name="l00180"></a><span class="lineno"> 180</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"generic"</span>)) {</div>
<div class="line"><a name="l00181"></a><span class="lineno"> 181</span>  <span class="comment">// Generic code selected by config variable.</span></div>
<div class="line"><a name="l00182"></a><span class="lineno"> 182</span>  SetDotProduct(DotProductGeneric);</div>
<div class="line"><a name="l00183"></a><span class="lineno"> 183</span>  dotproduct_method = <span class="stringliteral">"generic"</span>;</div>
<div class="line"><a name="l00184"></a><span class="lineno"> 184</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"native"</span>)) {</div>
<div class="line"><a name="l00185"></a><span class="lineno"> 185</span>  <span class="comment">// Native optimized code selected by config variable.</span></div>
<div class="line"><a name="l00186"></a><span class="lineno"> 186</span>  SetDotProduct(<a class="code" href="a01818.html#aac80847fbb0b16120a17ae3ed9d1ac54">DotProductNative</a>);</div>
<div class="line"><a name="l00187"></a><span class="lineno"> 187</span>  dotproduct_method = <span class="stringliteral">"native"</span>;</div>
<div class="line"><a name="l00188"></a><span class="lineno"> 188</span> <span class="preprocessor">#if defined(HAVE_AVX2)</span></div>
<div class="line"><a name="l00189"></a><span class="lineno"> 189</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"avx2"</span>)) {</div>
<div class="line"><a name="l00190"></a><span class="lineno"> 190</span>  <span class="comment">// AVX2 selected by config variable.</span></div>
<div class="line"><a name="l00191"></a><span class="lineno"> 191</span>  SetDotProduct(<a class="code" href="a01818.html#aa41529fcf80de7ee0e8cc5691fbee53b">DotProductAVX</a>, &<a class="code" href="a02570.html#a503a9e29415ca20f74d48fd9665a0f0c">IntSimdMatrix::intSimdMatrixAVX2</a>);</div>
<div class="line"><a name="l00192"></a><span class="lineno"> 192</span>  dotproduct_method = <span class="stringliteral">"avx2"</span>;</div>
<div class="line"><a name="l00193"></a><span class="lineno"> 193</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00194"></a><span class="lineno"> 194</span> <span class="preprocessor">#if defined(HAVE_AVX)</span></div>
<div class="line"><a name="l00195"></a><span class="lineno"> 195</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"avx"</span>)) {</div>
<div class="line"><a name="l00196"></a><span class="lineno"> 196</span>  <span class="comment">// AVX selected by config variable.</span></div>
<div class="line"><a name="l00197"></a><span class="lineno"> 197</span>  SetDotProduct(<a class="code" href="a01818.html#aa41529fcf80de7ee0e8cc5691fbee53b">DotProductAVX</a>, &<a class="code" href="a02570.html#ad7aed52d7915512a59818a5efda68c1e">IntSimdMatrix::intSimdMatrixSSE</a>);</div>
<div class="line"><a name="l00198"></a><span class="lineno"> 198</span>  dotproduct_method = <span class="stringliteral">"avx"</span>;</div>
<div class="line"><a name="l00199"></a><span class="lineno"> 199</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00200"></a><span class="lineno"> 200</span> <span class="preprocessor">#if defined(HAVE_FMA)</span></div>
<div class="line"><a name="l00201"></a><span class="lineno"> 201</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"fma"</span>)) {</div>
<div class="line"><a name="l00202"></a><span class="lineno"> 202</span>  <span class="comment">// FMA selected by config variable.</span></div>
<div class="line"><a name="l00203"></a><span class="lineno"> 203</span>  SetDotProduct(<a class="code" href="a01818.html#ab1837ad1dc5a0a43ba1b08e888a0f620">DotProductFMA</a>, <a class="code" href="a02570.html#ad7321e9f71f4d5e2c8920c370acb25ac">IntSimdMatrix::intSimdMatrix</a>);</div>
<div class="line"><a name="l00204"></a><span class="lineno"> 204</span>  dotproduct_method = <span class="stringliteral">"fma"</span>;</div>
<div class="line"><a name="l00205"></a><span class="lineno"> 205</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00206"></a><span class="lineno"> 206</span> <span class="preprocessor">#if defined(HAVE_SSE4_1)</span></div>
<div class="line"><a name="l00207"></a><span class="lineno"> 207</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"sse"</span>)) {</div>
<div class="line"><a name="l00208"></a><span class="lineno"> 208</span>  <span class="comment">// SSE selected by config variable.</span></div>
<div class="line"><a name="l00209"></a><span class="lineno"> 209</span>  SetDotProduct(<a class="code" href="a01818.html#ad3b5fe062bd97bc8cb1117a29fa24ac2">DotProductSSE</a>, &<a class="code" href="a02570.html#ad7aed52d7915512a59818a5efda68c1e">IntSimdMatrix::intSimdMatrixSSE</a>);</div>
<div class="line"><a name="l00210"></a><span class="lineno"> 210</span>  dotproduct_method = <span class="stringliteral">"sse"</span>;</div>
<div class="line"><a name="l00211"></a><span class="lineno"> 211</span> <span class="preprocessor">#endif</span></div>
<div class="line"><a name="l00212"></a><span class="lineno"> 212</span>  } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (!strcmp(dotproduct.c_str(), <span class="stringliteral">"std::inner_product"</span>)) {</div>
<div class="line"><a name="l00213"></a><span class="lineno"> 213</span>  <span class="comment">// std::inner_product selected by config variable.</span></div>
<div class="line"><a name="l00214"></a><span class="lineno"> 214</span>  SetDotProduct(DotProductStdInnerProduct);</div>
<div class="line"><a name="l00215"></a><span class="lineno"> 215</span>  dotproduct_method = <span class="stringliteral">"std::inner_product"</span>;</div>
<div class="line"><a name="l00216"></a><span class="lineno"> 216</span>  } <span class="keywordflow">else</span> {</div>
<div class="line"><a name="l00217"></a><span class="lineno"> 217</span>  <span class="comment">// Unsupported value of config variable.</span></div>
<div class="line"><a name="l00218"></a><span class="lineno"> 218</span>  <a class="code" href="a00581.html#a0c2bcd4462ec67ab0971b34a0f610f55">tprintf</a>(<span class="stringliteral">"Warning, ignoring unsupported config variable value: dotproduct=%s\n"</span>,</div>
<div class="line"><a name="l00219"></a><span class="lineno"> 219</span>  dotproduct.c_str());</div>
<div class="line"><a name="l00220"></a><span class="lineno"> 220</span>  <a class="code" href="a00581.html#a0c2bcd4462ec67ab0971b34a0f610f55">tprintf</a>(<span class="stringliteral">"Support values for dotproduct: auto generic native"</span></div>
<div class="line"><a name="l00221"></a><span class="lineno"> 221</span> #<span class="keywordflow">if</span> defined(HAVE_AVX)</div>
<div class="line"><a name="l00222"></a><span class="lineno"> 222</span>  <span class="stringliteral">" avx"</span></div>
<div class="line"><a name="l00223"></a><span class="lineno"> 223</span> #endif</div>
<div class="line"><a name="l00224"></a><span class="lineno"> 224</span> #<span class="keywordflow">if</span> defined(HAVE_SSE4_1)</div>
<div class="line"><a name="l00225"></a><span class="lineno"> 225</span>  <span class="stringliteral">" sse"</span></div>
<div class="line"><a name="l00226"></a><span class="lineno"> 226</span> #endif</div>
<div class="line"><a name="l00227"></a><span class="lineno"> 227</span>  <span class="stringliteral">" std::inner_product.\n"</span>);</div>
<div class="line"><a name="l00228"></a><span class="lineno"> 228</span>  }</div>
<div class="line"><a name="l00229"></a><span class="lineno"> 229</span>  </div>
<div class="line"><a name="l00230"></a><span class="lineno"> 230</span>  dotproduct.set_value(dotproduct_method);</div>
<div class="line"><a name="l00231"></a><span class="lineno"> 231</span> }</div>
<div class="line"><a name="l00232"></a><span class="lineno"> 232</span>  </div>
<div class="line"><a name="l00233"></a><span class="lineno"> 233</span> } <span class="comment">// namespace tesseract</span></div>
</div><!-- fragment --></div><!-- contents -->
</div><!-- doc-content -->
<div class="ttc" id="aa01818_html_ab1837ad1dc5a0a43ba1b08e888a0f620"><div class="ttname"><a href="a01818.html#ab1837ad1dc5a0a43ba1b08e888a0f620">tesseract::DotProductFMA</a></div><div class="ttdeci">double DotProductFMA(const double *u, const double *v, int n)</div><div class="ttdef"><b>Definition:</b> <a href="a00089_source.html#l00030">dotproductfma.cpp:30</a></div></div>
<div class="ttc" id="aa00554_html"><div class="ttname"><a href="a00554.html">params.h</a></div></div>
<div class="ttc" id="aa00110_html"><div class="ttname"><a href="a00110.html">simddetect.h</a></div></div>
<div class="ttc" id="aa02570_html_a503a9e29415ca20f74d48fd9665a0f0c"><div class="ttname"><a href="a02570.html#a503a9e29415ca20f74d48fd9665a0f0c">tesseract::IntSimdMatrix::intSimdMatrixAVX2</a></div><div class="ttdeci">static const IntSimdMatrix intSimdMatrixAVX2</div><div class="ttdef"><b>Definition:</b> <a href="a00098_source.html#l00117">intsimdmatrix.h:117</a></div></div>
<div class="ttc" id="aa02574_html"><div class="ttname"><a href="a02574.html">tesseract::SIMDDetect</a></div><div class="ttdef"><b>Definition:</b> <a href="a00110_source.html#l00031">simddetect.h:31</a></div></div>
<div class="ttc" id="aa00554_html_abaa7778083ba376d8c70a59631d4a6ab"><div class="ttname"><a href="a00554.html#abaa7778083ba376d8c70a59631d4a6ab">STRING_VAR</a></div><div class="ttdeci">#define STRING_VAR(name, val, comment)</div><div class="ttdef"><b>Definition:</b> <a href="a00554_source.html#l00306">params.h:306</a></div></div>
<div class="ttc" id="aa01818_html_ad3b5fe062bd97bc8cb1117a29fa24ac2"><div class="ttname"><a href="a01818.html#ad3b5fe062bd97bc8cb1117a29fa24ac2">tesseract::DotProductSSE</a></div><div class="ttdeci">double DotProductSSE(const double *u, const double *v, int n)</div><div class="ttdef"><b>Definition:</b> <a href="a00092_source.html#l00031">dotproductsse.cpp:31</a></div></div>
<div class="ttc" id="aa00083_html"><div class="ttname"><a href="a00083.html">dotproduct.h</a></div></div>
<div class="ttc" id="aa01818_html_a9ab0e86b57d2b88cdc6af72ff02c93d2"><div class="ttname"><a href="a01818.html#a9ab0e86b57d2b88cdc6af72ff02c93d2">tesseract::DotProduct</a></div><div class="ttdeci">DotProductFunction DotProduct</div><div class="ttdef"><b>Definition:</b> <a href="a00107_source.html#l00050">simddetect.cpp:50</a></div></div>
<div class="ttc" id="aa02570_html_ad7321e9f71f4d5e2c8920c370acb25ac"><div class="ttname"><a href="a02570.html#ad7321e9f71f4d5e2c8920c370acb25ac">tesseract::IntSimdMatrix::intSimdMatrix</a></div><div class="ttdeci">static const IntSimdMatrix * intSimdMatrix</div><div class="ttdef"><b>Definition:</b> <a href="a00098_source.html#l00116">intsimdmatrix.h:116</a></div></div>
<div class="ttc" id="aa01818_html_a33bdb7f88c6be930b0ea0d866f616ecf"><div class="ttname"><a href="a01818.html#a33bdb7f88c6be930b0ea0d866f616ecf">tesseract::DotProductFunction</a></div><div class="ttdeci">double(*)(const double *, const double *, int) DotProductFunction</div><div class="ttdef"><b>Definition:</b> <a href="a00110_source.html#l00025">simddetect.h:25</a></div></div>
<div class="ttc" id="aa01818_html"><div class="ttname"><a href="a01818.html">tesseract</a></div><div class="ttdef"><b>Definition:</b> <a href="a00005_source.html#l00065">baseapi.h:65</a></div></div>
<div class="ttc" id="aa00584_html"><div class="ttname"><a href="a00584.html">tprintf.h</a></div></div>
<div class="ttc" id="aa01818_html_aa41529fcf80de7ee0e8cc5691fbee53b"><div class="ttname"><a href="a01818.html#aa41529fcf80de7ee0e8cc5691fbee53b">tesseract::DotProductAVX</a></div><div class="ttdeci">double DotProductAVX(const double *u, const double *v, int n)</div><div class="ttdef"><b>Definition:</b> <a href="a00086_source.html#l00030">dotproductavx.cpp:30</a></div></div>
<div class="ttc" id="aa00581_html_a0c2bcd4462ec67ab0971b34a0f610f55"><div class="ttname"><a href="a00581.html#a0c2bcd4462ec67ab0971b34a0f610f55">tprintf</a></div><div class="ttdeci">DLLSYM void tprintf(const char *format,...)</div><div class="ttdef"><b>Definition:</b> <a href="a00581_source.html#l00034">tprintf.cpp:34</a></div></div>
<div class="ttc" id="aa02570_html_ad7aed52d7915512a59818a5efda68c1e"><div class="ttname"><a href="a02570.html#ad7aed52d7915512a59818a5efda68c1e">tesseract::IntSimdMatrix::intSimdMatrixSSE</a></div><div class="ttdeci">static const IntSimdMatrix intSimdMatrixSSE</div><div class="ttdef"><b>Definition:</b> <a href="a00098_source.html#l00118">intsimdmatrix.h:118</a></div></div>
<div class="ttc" id="aa00098_html"><div class="ttname"><a href="a00098.html">intsimdmatrix.h</a></div></div>
<div class="ttc" id="aa02574_html_af2ebffb31ead931cd95f89ae15c367d9"><div class="ttname"><a href="a02574.html#af2ebffb31ead931cd95f89ae15c367d9">tesseract::SIMDDetect::Update</a></div><div class="ttdeci">static TESS_API void Update()</div><div class="ttdef"><b>Definition:</b> <a href="a00107_source.html#l00174">simddetect.cpp:174</a></div></div>
<div class="ttc" id="aa01818_html_aac80847fbb0b16120a17ae3ed9d1ac54"><div class="ttname"><a href="a01818.html#aac80847fbb0b16120a17ae3ed9d1ac54">tesseract::DotProductNative</a></div><div class="ttdeci">double DotProductNative(const double *u, const double *v, int n)</div><div class="ttdef"><b>Definition:</b> <a href="a00080_source.html#l00022">dotproduct.cpp:22</a></div></div>
<!-- start footer part -->
<div id="nav-path" class="navpath"><!-- id is needed for treeview function! -->
<ul>
<li class="navelem"><a class="el" href="dir_68267d1309a1af8e8297ef4c3efbcdba.html">src</a></li><li class="navelem"><a class="el" href="dir_70d5e250c66d001b18da37689179cade.html">arch</a></li><li class="navelem"><a class="el" href="a00107.html">simddetect.cpp</a></li>
<li class="footer">Generated on Thu Jan 30 2020 14:22:19 for tesseract by
<a href="http://www.doxygen.org/index.html">
<img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.8.16 </li>
</ul>
</div>
</body>
</html>