-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathphototest.hocr
98 lines (97 loc) · 7.67 KB
/
phototest.hocr
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN"
"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd">
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<!-- hOCR metadata header: the meta elements below record which OCR engine produced this file and which hOCR names it declares. -->
<!-- NOTE(review): the title is empty in this file; presumably the OCR engine emits it that way. Confirm before filling it in, since this file may be compared byte for byte by its consumers. -->
<title></title>
<meta http-equiv="Content-Type" content="text/html;charset=utf-8"/>
<!-- Producer of this file: engine name followed by its build identifier. -->
<meta name='ocr-system' content='tesseract 4.1.0-rc1-752-g8b69' />
<!-- Declared capabilities. The first five tokens match the class values used in the body. ocrp_wconf is not used as a class anywhere in this file; presumably it relates to the x_wconf value carried by every word (confirm against the hOCR spec). -->
<meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word ocrp_wconf'/>
</head>
<body>
<!-- OCR result for a single page. Nesting, outermost to innermost: ocr_page, ocr_carea, ocr_par, ocr_line, ocrx_word. Every element carries its layout data in the title attribute as semicolon-separated properties. -->
<!-- Page element: names the source image "phototest.tif" and gives a page box of 0 0 640 480. NOTE(review): bbox values look like left top right bottom in image pixels (every child box in this file nests inside its parent box); confirm against the hOCR spec. -->
<div class='ocr_page' id='page_1' title='image "phototest.tif"; bbox 0 0 640 480; ppageno 0'>
<!-- The only content area on the page; its bbox encloses both paragraphs below. -->
<div class='ocr_carea' id='block_1_1' title="bbox 36 92 618 361">
<!-- Paragraph 1 (line_1_1 to line_1_3, word_1_1 to word_1_24). Recognised text: "This is a lot of 12 point text to test the ocr code and see if it works on all types of file format." -->
<p class='ocr_par' id='par_1_1' lang='eng' title="bbox 36 92 618 184">
<!-- Each ocr_line records, besides its bbox, baseline, x_size, x_descenders and x_ascenders values. -->
<span class='ocr_line' id='line_1_1' title="bbox 36 92 580 122; baseline 0 -6; x_size 30; x_descenders 6; x_ascenders 6">
<!-- Each ocrx_word holds one recognised token plus its bbox and an x_wconf value (87 to 93 in this file). NOTE(review): x_wconf is presumably a per-word recognition confidence; confirm against the hOCR spec. -->
<span class='ocrx_word' id='word_1_1' title='bbox 36 92 96 116; x_wconf 91'>This</span>
<span class='ocrx_word' id='word_1_2' title='bbox 109 92 129 116; x_wconf 92'>is</span>
<span class='ocrx_word' id='word_1_3' title='bbox 141 98 156 116; x_wconf 92'>a</span>
<span class='ocrx_word' id='word_1_4' title='bbox 169 92 201 116; x_wconf 90'>lot</span>
<span class='ocrx_word' id='word_1_5' title='bbox 212 92 240 116; x_wconf 93'>of</span>
<span class='ocrx_word' id='word_1_6' title='bbox 251 92 282 116; x_wconf 93'>12</span>
<span class='ocrx_word' id='word_1_7' title='bbox 296 92 364 122; x_wconf 90'>point</span>
<span class='ocrx_word' id='word_1_8' title='bbox 374 93 427 116; x_wconf 93'>text</span>
<span class='ocrx_word' id='word_1_9' title='bbox 437 93 463 116; x_wconf 92'>to</span>
<span class='ocrx_word' id='word_1_10' title='bbox 474 93 526 116; x_wconf 92'>test</span>
<span class='ocrx_word' id='word_1_11' title='bbox 536 92 580 116; x_wconf 92'>the</span>
</span>
<span class='ocr_line' id='line_1_2' title="bbox 36 126 618 157; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_12' title='bbox 36 132 81 150; x_wconf 90'>ocr</span>
<span class='ocrx_word' id='word_1_13' title='bbox 91 126 160 150; x_wconf 91'>code</span>
<span class='ocrx_word' id='word_1_14' title='bbox 172 126 223 150; x_wconf 90'>and</span>
<span class='ocrx_word' id='word_1_15' title='bbox 236 132 286 150; x_wconf 91'>see</span>
<span class='ocrx_word' id='word_1_16' title='bbox 299 126 314 150; x_wconf 92'>if</span>
<span class='ocrx_word' id='word_1_17' title='bbox 325 126 339 150; x_wconf 92'>it</span>
<span class='ocrx_word' id='word_1_18' title='bbox 348 126 433 150; x_wconf 92'>works</span>
<span class='ocrx_word' id='word_1_19' title='bbox 445 132 478 150; x_wconf 87'>on</span>
<span class='ocrx_word' id='word_1_20' title='bbox 500 126 529 150; x_wconf 87'>all</span>
<span class='ocrx_word' id='word_1_21' title='bbox 541 127 618 157; x_wconf 92'>types</span>
</span>
<!-- Unlike the other lines in this file, this one reports a baseline of 0 0 and fractional x_size / x_descenders values. -->
<span class='ocr_line' id='line_1_3' title="bbox 36 160 223 184; baseline 0 0; x_size 31.214842; x_descenders 7.2148418; x_ascenders 6">
<span class='ocrx_word' id='word_1_22' title='bbox 36 160 64 184; x_wconf 92'>of</span>
<span class='ocrx_word' id='word_1_23' title='bbox 72 160 113 184; x_wconf 92'>file</span>
<span class='ocrx_word' id='word_1_24' title='bbox 123 160 223 184; x_wconf 91'>format.</span>
</span>
</p>
<!-- Paragraph 2 (line_1_4 to line_1_8, word_1_25 to word_1_60). Recognised text: the sentence "The quick brown dog jumped over the lazy fox." four times in a row, wrapped across five lines. -->
<p class='ocr_par' id='par_1_2' lang='eng' title="bbox 36 194 597 361">
<span class='ocr_line' id='line_1_4' title="bbox 36 194 585 225; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_25' title='bbox 36 194 91 218; x_wconf 92'>The</span>
<span class='ocrx_word' id='word_1_26' title='bbox 102 194 177 224; x_wconf 91'>quick</span>
<span class='ocrx_word' id='word_1_27' title='bbox 189 194 274 218; x_wconf 91'>brown</span>
<span class='ocrx_word' id='word_1_28' title='bbox 287 194 339 225; x_wconf 91'>dog</span>
<span class='ocrx_word' id='word_1_29' title='bbox 348 194 456 225; x_wconf 91'>jumped</span>
<span class='ocrx_word' id='word_1_30' title='bbox 468 200 531 218; x_wconf 91'>over</span>
<span class='ocrx_word' id='word_1_31' title='bbox 540 194 585 218; x_wconf 92'>the</span>
</span>
<span class='ocr_line' id='line_1_5' title="bbox 37 228 585 259; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_32' title='bbox 37 228 92 259; x_wconf 92'>lazy</span>
<span class='ocrx_word' id='word_1_33' title='bbox 103 228 153 252; x_wconf 92'>fox.</span>
<span class='ocrx_word' id='word_1_34' title='bbox 165 228 220 252; x_wconf 92'>The</span>
<span class='ocrx_word' id='word_1_35' title='bbox 232 228 307 258; x_wconf 91'>quick</span>
<span class='ocrx_word' id='word_1_36' title='bbox 319 228 404 252; x_wconf 91'>brown</span>
<span class='ocrx_word' id='word_1_37' title='bbox 417 228 468 259; x_wconf 91'>dog</span>
<span class='ocrx_word' id='word_1_38' title='bbox 478 228 585 259; x_wconf 92'>jumped</span>
</span>
<span class='ocr_line' id='line_1_6' title="bbox 36 262 597 293; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_39' title='bbox 36 268 99 286; x_wconf 90'>over</span>
<span class='ocrx_word' id='word_1_40' title='bbox 109 262 153 286; x_wconf 92'>the</span>
<span class='ocrx_word' id='word_1_41' title='bbox 165 262 221 293; x_wconf 92'>lazy</span>
<span class='ocrx_word' id='word_1_42' title='bbox 231 262 281 286; x_wconf 91'>fox.</span>
<span class='ocrx_word' id='word_1_43' title='bbox 294 262 349 286; x_wconf 92'>The</span>
<span class='ocrx_word' id='word_1_44' title='bbox 360 262 435 292; x_wconf 91'>quick</span>
<span class='ocrx_word' id='word_1_45' title='bbox 447 262 532 286; x_wconf 91'>brown</span>
<span class='ocrx_word' id='word_1_46' title='bbox 545 262 597 293; x_wconf 90'>dog</span>
</span>
<span class='ocr_line' id='line_1_7' title="bbox 43 296 561 327; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_47' title='bbox 43 296 150 327; x_wconf 92'>jumped</span>
<span class='ocrx_word' id='word_1_48' title='bbox 162 302 226 320; x_wconf 92'>over</span>
<span class='ocrx_word' id='word_1_49' title='bbox 235 296 279 320; x_wconf 92'>the</span>
<span class='ocrx_word' id='word_1_50' title='bbox 292 296 347 327; x_wconf 88'>lazy</span>
<span class='ocrx_word' id='word_1_51' title='bbox 357 296 407 320; x_wconf 91'>fox.</span>
<span class='ocrx_word' id='word_1_52' title='bbox 420 296 475 320; x_wconf 91'>The</span>
<span class='ocrx_word' id='word_1_53' title='bbox 486 296 561 326; x_wconf 91'>quick</span>
</span>
<span class='ocr_line' id='line_1_8' title="bbox 37 330 561 361; baseline 0 -7; x_size 31; x_descenders 7; x_ascenders 6">
<span class='ocrx_word' id='word_1_54' title='bbox 37 330 122 354; x_wconf 92'>brown</span>
<span class='ocrx_word' id='word_1_55' title='bbox 135 330 187 361; x_wconf 92'>dog</span>
<span class='ocrx_word' id='word_1_56' title='bbox 196 330 304 361; x_wconf 91'>jumped</span>
<span class='ocrx_word' id='word_1_57' title='bbox 316 336 379 354; x_wconf 90'>over</span>
<span class='ocrx_word' id='word_1_58' title='bbox 388 330 433 354; x_wconf 91'>the</span>
<span class='ocrx_word' id='word_1_59' title='bbox 445 330 500 361; x_wconf 89'>lazy</span>
<span class='ocrx_word' id='word_1_60' title='bbox 511 330 561 354; x_wconf 90'>fox.</span>
</span>
</p>
</div>
</div>
</body>
</html>