Browse Source

text frame editable and load hocr content in it

master
nglk 2 years ago
parent
commit
9831036345
  1. BIN
      .app.py.swp
  2. 6
      README.md
  3. BIN
      __pycache__/app.cpython-37.pyc
  4. BIN
      __pycache__/parsepdf.cpython-37.pyc
  5. BIN
      app.pyc
  6. 21
      templates/results.html
  7. 119
      templates/results.html.save
  8. 415
      test.hocr
  9. BIN
      test.pdf

BIN
.app.py.swp

Binary file not shown.

6
README.md

@ -0,0 +1,6 @@
# Poinikos
## Do not forget
Debug mode should be on to check alerts and bugs.
We need to connect Flask with the HTML using POST and GET.
run `export FLASK_DEBUG=1`

BIN
__pycache__/app.cpython-37.pyc

Binary file not shown.

BIN
__pycache__/parsepdf.cpython-37.pyc

Binary file not shown.

BIN
app.pyc

Binary file not shown.

21
templates/results.html

@ -8,7 +8,7 @@
<td colspan="3">
<form method="POST">
<!-- <input type="text" id="my_field" value="" wrap="soft"> -->
<textarea name="file" id="my_field" wrap="soft" placeholder="Επικόλληση του συνδέσμου του PDF του Ποινικού Κώδικα που βρήκατε στο ηλεκτρονικό ταχυδρομείο σας ή στο ΔΙΑΒΑΣΕΜΕ.txt, εδώ.
<textarea name="file" id="my_field" wrap="soft" placeholder="Επικόλληση του συνδέσμου του PDF του Ποινικού Κώδικα που βρήκατε στο ηλεκτρονικό ταχυδρομείο σας ή στο ΔΙΑΒΑΣΕΜΕ.txt, εδώ.
"></textarea>
</form>
</td>
@ -32,7 +32,7 @@
</div>
</td>
<td>
<textarea name="empty" id="empty_frame" wrap="soft" placeholder="Επιλέξτε και αντιγράψτε το περιεχόμενο του PDF.
<textarea name="empty" contenteditable="true" id="empty_frame" wrap="soft" placeholder="Επιλέξτε και αντιγράψτε το περιεχόμενο του PDF.
Κάντε επικόλληση του περιεχομένου του Ποινικού Κώδικα εδώ.
Υπάρχει δυνατότητα επεξεργασίας του επικολλημένου κειμένου.
@ -49,9 +49,21 @@
</table>
<script>
/**
 * Once the DOM is parsed, load the bundled hOCR sample and show its source
 * text in the #empty_frame textarea.
 *
 * The file is requested asynchronously so the page stays responsive while it
 * downloads. Any failure (network error or a non-2xx HTTP status) puts an
 * error message in the textarea instead of the file content.
 */
window.addEventListener('DOMContentLoaded', () => {
  const input = document.getElementById('empty_frame');
  if (!input) {
    // Nothing to fill on pages that do not contain the textarea.
    return;
  }

  const fileToLoad = 'static/hocr/gynaikoktonia.hocr';

  fetch(fileToLoad)
    .then((response) => {
      // fetch() only rejects on network failure; an HTTP error such as 404
      // still resolves, so it has to be turned into a failure explicitly.
      if (!response.ok) {
        throw new Error('HTTP ' + response.status);
      }
      return response.text();
    })
    .then((text) => {
      // .value is the textarea's text API: the hOCR markup is shown as
      // plain text rather than being handed to the HTML parser.
      input.value = text;
    })
    .catch(() => {
      input.value = "Error loading file. Maybe related to filepath or CORS?";
    });
});
function decode() {
@ -89,6 +101,7 @@ function readme(){
}
function transform() {
alert("anything");
const show = document.getElementById("showmonster");
show.style.visibility = "visible";
const button4 = document.getElementById("button4");

119
templates/results.html.save

@ -0,0 +1,119 @@
{% extends 'base.html' %}
{% block content %}
<!-- <iframe src="https://pad.vvvvvvaria.org/wordmord.test" height="800" width="800"></iframe> -->
<table>
<tr>
<td colspan="3">
<form method="post">
<!-- <input type="text" id="my_field" value="" wrap="soft"> -->
<textarea name="file" id="my_field" wrap="soft" placeholder="Επικόλληση του συνδέσμου του PDF του Ποινικού Κώδικα που βρήκατε στο ηλεκτρονικό ταχυδρομείο σας ή στο ΔΙΑΒΑΣΕΜΕ.txt, εδώ.
"></textarea>
</form>
</td>
</tr>
<tr>
<td colspan="3">
<button id="button3" onclick="readme()">ΔΙΑΒΑΣΕΜΕ.txt</button>
<button id="button5" onclick="decode()">ΠΡΟΒΟΛΗ ΠΟΙΝΙΚΟΥ ΚΩΔΙΚΑ <img src="{{url_for('static', filename='images/closed.gif')}}"></button>
<button id="button2" onclick="copy()"> ΑΝΤΙΓΡΑΦΗ ΚΩΔΙΚΑ</button>
<button id="button1" onclick="transform()">ΜΕΤΑΛΛΑΓΜΕΝΟΣ ΚΩΔΙΚΑΣ</button>
<button id="button4" onclick="window.open('{{url_for('static', filename='pdf/ΣΧΕΔΙΟ_ΜΕΤΑΛΛΑΓΜΕΝΟΥ_ΠΟΙΝΙΚΟΥ_ΚΩΔΙΚΑ_01.pdf')}}');">ΚΑΤΕΒΑΣΕ ΜΕΤΑΛΛΑΓΜΕΝΟ ΚΩΔΙΚΑ <img src="{{url_for('static', filename='images/open.gif')}}"> </button>
</td>
</tr>
<tr>
<td>
<!-- Viewer for the PDF whose link the user pasted; decode() sets the iframe src. -->
<div id="initialpdf">
  <iframe id="inputpdf" src="" title="Προβολή PDF του Ποινικού Κώδικα" height="800" width="750"></iframe>
</div>
</td>
<td>
<textarea name="empty" id="empty_frame" wrap="soft" placeholder="Επιλέξτε και αντιγράψτε το περιεχόμενο του PDF.
Κάντε επικόλληση του περιεχομένου του Ποινικού Κώδικα εδώ.
Υπάρχει δυνατότητα επεξεργασίας του επικολλημένου κειμένου.
Μπορείτε να στείλετε τις τροποποιήσεις που προτείνετε στο mailing list του WordMord https://we.lurk.org/mailman3/lists/wordmord.we.lurk.org/"></textarea>
</td>
<td class="prevent">
<!--<iframe id="showmonster" src="{{url_for('static', filename='pdf/ΣΧΕΔΙΟ_ΜΕΤΑΛΛΑΓΜΕΝΟΥ_ΠΟΙΝΙΚΟΥ_ΚΩΔΙΚΑ_01.pdf')}}" height="750rem" width="800rem"></iframe>-->
<!-- Viewer for the bundled draft PDF; transform() sets its visibility to visible. -->
<iframe id="showmonster" src="{{url_for('static', filename='pdf/ΣΧΕΔΙΟ_ΜΕΤΑΛΛΑΓΜΕΝΟΥ_ΠΟΙΝΙΚΟΥ_ΚΩΔΙΚΑ_01.pdf')}}" title="Σχέδιο μεταλλαγμένου Ποινικού Κώδικα" height="800" width="750"></iframe>
</td>
</tr>
</table>
<script>
/**
 * Decode the percent-encoded PDF link in #my_field and display that PDF.
 *
 * Side effects: writes the decoded link back into the textarea, points the
 * #inputpdf iframe at it, makes #initialpdf and #button2 visible, and turns
 * the textarea text blue.
 *
 * Input that is not valid percent-encoding (for example a lone "%") is used
 * as typed instead of aborting with a URIError.
 */
function decode() {
  const textarea = document.getElementById("my_field");
  const url = textarea.value;

  let urlDecode;
  try {
    urlDecode = decodeURIComponent(url);
  } catch (err) {
    // decodeURIComponent throws URIError on malformed escape sequences.
    urlDecode = url;
  }
  textarea.value = urlDecode;

  // An earlier version registered a keyup handler here that wrote to a
  // variable which was never assigned; it threw on every keystroke and was
  // re-registered on each click, so it has been dropped.

  const showpdf = document.getElementById("inputpdf");
  showpdf.src = textarea.value;

  const pdf = document.getElementById("initialpdf");
  pdf.style.visibility = "visible";

  const button2 = document.getElementById("button2");
  button2.style.visibility = "visible";

  textarea.style.color = "blue";
}
function readme(){
window.open('{{url_for('static',filename='ΔΙΑΒΑΣΕΜΕ.txt')}}');
const button5 = document.getElementById("button5");
button5.style.visibility = "visible";
}
/**
 * Make the #showmonster iframe and #button4 visible, and colour the text of
 * the #empty_frame textarea blue.
 */
function transform() {
  // Small local helper: set one element's visibility to "visible".
  const reveal = (id) => {
    document.getElementById(id).style.visibility = "visible";
  };

  reveal("showmonster");
  reveal("button4");
  document.getElementById('empty_frame').style.color = "blue";
}
/**
 * Make the #empty_frame textarea and #button1 visible, then blank every text
 * input and textarea found inside a <form>.
 *
 * The closing brace of this function was missing, which made the whole
 * script block a syntax error so that none of the button handlers were
 * defined.
 * NOTE(review): the brace is placed after the trailing comment, keeping the
 * form reset inside copy(); confirm the reset was not meant to run once at
 * page load instead.
 */
function copy() {
  const show = document.getElementById("empty_frame");
  show.style.visibility = "visible";

  const button1 = document.getElementById("button1");
  button1.style.visibility = "visible";

  // `$` is jQuery, which must be loaded outside this block.
  $(document).ready(function() {
    $('form').find("input[type='text'],textarea").val("");
  });

  // extract the text of a pdf/ copy on clipboard
}
</script>
{% endblock %}

415
test.hocr

@ -0,0 +1,415 @@
<?xml version="1.0" encoding="UTF-8"?>
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
<head>
<title></title>
<meta http-equiv="Content-Type" content="text/html;charset=utf-8" />
<meta name='ocr-system' content='tesseract 3.04.01' />
<meta name='ocr-capabilities' content='ocr_page ocr_carea ocr_par ocr_line ocrx_word'/>
</head>
<body>
<div class="ocr_page" id="page_1" title="bbox 0 0 595 841; ppageno 0">
<figure title="bbox 0 0 595 841"/>
<div class="ocrx_block" pdftotree="section_header" title="bbox 146 76 465 86">
<span class="ocrx_line" title="bbox 146 76 465 86">
<span class="ocrx_word" title="bbox 146 76 206 86">ΕΓΚΛΗΜΑΤΑ</span>
<span class="ocrx_word" title="bbox 212 76 238 86">ΚΑΤΑ</span>
<span class="ocrx_word" title="bbox 241 76 260 86">ΤΗΣ</span>
<span class="ocrx_word" title="bbox 263 76 290 86">ΖΩΗΣ</span>
<span class="ocrx_word" title="bbox 293 76 310 86">ΚΑΙ</span>
<span class="ocrx_word" title="bbox 313 76 371 86">ΠΡΟΣΒΟΛΕΣ</span>
<span class="ocrx_word" title="bbox 376 76 397 86">ΤΩΝ</span>
<span class="ocrx_word" title="bbox 400 76 465 86">ΘΥΛΗΚΟΤΗΤ*</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 184 105 406 115">
<span class="ocrx_line" title="bbox 184 105 406 115">
<span class="ocrx_word" title="bbox 184 105 190 115">Ι.</span>
<span class="ocrx_word" title="bbox 193 105 247 115">Εγκλήματα</span>
<span class="ocrx_word" title="bbox 251 105 286 115">βλάβης</span>
<span class="ocrx_word" title="bbox 290 105 306 115">της</span>
<span class="ocrx_word" title="bbox 310 105 333 115">ζωής</span>
<span class="ocrx_word" title="bbox 336 105 352 115">της</span>
<span class="ocrx_word" title="bbox 357 105 406 115">●●●●●●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 270 134 322 144">
<span class="ocrx_line" title="bbox 270 134 322 144">
<span class="ocrx_word" title="bbox 270 134 301 144">Άρθρο</span>
<span class="ocrx_word" title="bbox 306 134 322 144">299</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 235 149 305 159">
<span class="ocrx_line" title="bbox 235 149 305 159">
<span class="ocrx_word" title="bbox 235 149 305 159">Γυναικοκτονία</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 320 149 357 159">
<span class="ocrx_line" title="bbox 320 149 357 159">
<span class="ocrx_word" title="bbox 320 149 331 159">με</span>
<span class="ocrx_word" title="bbox 334 149 357 159">δόλο</span>
</span>
</div>
<div class="ocrx_block" pdftotree="paragraph" title="bbox 58 178 527 203">
<span class="ocrx_line" title="bbox 58 178 178 188">
<span class="ocrx_word" title="bbox 58 178 66 188">1.</span>
<span class="ocrx_word" title="bbox 69 178 103 188">Όποιος</span>
<span class="ocrx_word" title="bbox 108 178 148 188">σκότωσε</span>
<span class="ocrx_word" title="bbox 153 178 178 188">άλλη</span>
</span>
<span class="ocrx_line" title="bbox 185 178 235 188">
<span class="ocrx_word" title="bbox 185 178 235 188">τιμωρείται</span>
</span>
<span class="ocrx_line" title="bbox 242 178 519 188">
<span class="ocrx_word" title="bbox 242 178 253 188">με</span>
<span class="ocrx_word" title="bbox 256 178 300 188">κάθειρξη</span>
<span class="ocrx_word" title="bbox 303 178 333 188">ισόβια</span>
<span class="ocrx_word" title="bbox 338 178 344 188">ή</span>
<span class="ocrx_word" title="bbox 347 178 398 188">πρόσκαιρη</span>
<span class="ocrx_word" title="bbox 403 178 462 188">τουλάχιστον</span>
<span class="ocrx_word" title="bbox 467 178 489 188">δέκα</span>
<span class="ocrx_word" title="bbox 494 178 519 188">ετών.</span>
</span>
<span class="ocrx_line" title="bbox 58 193 196 203">
<span class="ocrx_word" title="bbox 58 193 65 203">2.</span>
<span class="ocrx_word" title="bbox 69 193 83 203">Αν</span>
<span class="ocrx_word" title="bbox 85 193 91 203">η</span>
<span class="ocrx_word" title="bbox 94 193 124 203">πράξη</span>
<span class="ocrx_word" title="bbox 127 193 196 203">αποφασίστηκε</span>
</span>
<span class="ocrx_line" title="bbox 203 193 413 203">
<span class="ocrx_word" title="bbox 203 193 218 203">και</span>
<span class="ocrx_word" title="bbox 220 193 279 203">εκτελέστηκε</span>
<span class="ocrx_word" title="bbox 283 193 294 203">σε</span>
<span class="ocrx_word" title="bbox 298 193 334 203">βρασμό</span>
<span class="ocrx_word" title="bbox 340 193 378 203">ψυχικής</span>
<span class="ocrx_word" title="bbox 382 193 413 203">ορμής,</span>
</span>
<span class="ocrx_line" title="bbox 418 193 527 203">
<span class="ocrx_word" title="bbox 418 193 476 203">επιβάλλεται</span>
<span class="ocrx_word" title="bbox 481 193 527 203">κάθειρξη.</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 270 222 325 232">
<span class="ocrx_line" title="bbox 270 222 325 232">
<span class="ocrx_word" title="bbox 270 222 301 232">●●●●●</span>
<span class="ocrx_word" title="bbox 306 222 325 232">●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 220 237 376 247">
<span class="ocrx_line" title="bbox 220 237 376 247">
<span class="ocrx_word" title="bbox 220 237 299 247">●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 304 237 376 247">●●●●●●●●●●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="paragraph" title="bbox 57 266 539 291">
<span class="ocrx_line" title="bbox 57 266 539 276">
<span class="ocrx_word" title="bbox 57 266 93 276">●●●●●●</span>
<span class="ocrx_word" title="bbox 97 266 152 276">●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 158 266 176 276">●●●</span>
<span class="ocrx_word" title="bbox 178 266 305 276">●●●●●●●●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 308 266 345 276">●●●●●●</span>
<span class="ocrx_word" title="bbox 348 266 366 276">●●●</span>
<span class="ocrx_word" title="bbox 372 266 421 276">●●●●●●●●</span>
<span class="ocrx_word" title="bbox 426 266 444 276">●●●</span>
<span class="ocrx_word" title="bbox 445 266 488 276">●●●●●●●</span>
<span class="ocrx_word" title="bbox 490 266 539 276">●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 57 281 531 291">
<span class="ocrx_word" title="bbox 57 281 75 291">●●●</span>
<span class="ocrx_word" title="bbox 78 281 120 291">●●●●●●●</span>
<span class="ocrx_word" title="bbox 123 281 159 291">●●●●●●</span>
<span class="ocrx_word" title="bbox 163 281 237 291">●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 238 281 257 291">●●●</span>
<span class="ocrx_word" title="bbox 261 281 297 291">●●●●●●</span>
<span class="ocrx_word" title="bbox 300 281 318 291">●●●</span>
<span class="ocrx_word" title="bbox 322 281 475 291">●●●●●●●●●●●●●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 477 281 531 291">●●●●●●●●●</span>
</span>
</div>
<table class="ocr_table" title="bbox 57 310 536 379">
<tr>
<td/>
<td/>
<td/>
<td/>
<td title="bbox 270 312 322 317">
<span class="ocrx_line" title="bbox 270 310 322 320">
<span class="ocrx_word" title="bbox 270 310 302 320">Άρθρο</span>
<span class="ocrx_word" title="bbox 306 310 322 320">301</span>
</span>
</td>
<td/>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td/>
<td/>
<td/>
<td title="bbox 233 327 360 332">
<span class="ocrx_line" title="bbox 233 325 360 335">
<span class="ocrx_word" title="bbox 233 325 287 335">Συμμετοχή</span>
<span class="ocrx_word" title="bbox 290 325 301 335">σε</span>
<span class="ocrx_word" title="bbox 305 325 360 335">αυτοκτονία</span>
</span>
</td>
<td/>
<td/>
<td/>
<td/>
<td/>
</tr>
<tr>
<td title="bbox 57 356 92 361">
<span class="ocrx_line" title="bbox 57 354 91 364">
<span class="ocrx_word" title="bbox 57 354 91 364">Όποιος</span>
</span>
</td>
<td/>
<td/>
<td/>
<td title="bbox 204 356 346 361">
<span class="ocrx_line" title="bbox 280 354 345 364">
<span class="ocrx_word" title="bbox 280 354 292 364">αν</span>
<span class="ocrx_word" title="bbox 297 354 345 364">τελέστηκε</span>
</span>
</td>
<td title="bbox 352 356 418 361">
<span class="ocrx_line" title="bbox 352 354 417 364">
<span class="ocrx_word" title="bbox 352 354 358 364">η</span>
<span class="ocrx_word" title="bbox 363 354 417 364">αυτοκτονία</span>
</span>
</td>
<td/>
<td/>
<td/>
<td title="bbox 518 356 536 361">
<span class="ocrx_line" title="bbox 518 354 536 364">
<span class="ocrx_word" title="bbox 518 354 536 364">της,</span>
</span>
</td>
</tr>
<tr>
<td/>
<td/>
<td title="bbox 148 371 223 376">
<span class="ocrx_line" title="bbox 148 369 176 379">
<span class="ocrx_word" title="bbox 148 369 176 379">έδωσε</span>
</span>
</td>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
<td/>
</tr>
</table>
<div class="ocrx_block" pdftotree="section_header" title="bbox 57 383 176 393">
<span class="ocrx_line" title="bbox 57 383 176 393">
<span class="ocrx_word" title="bbox 57 383 107 393">τιμωρείται</span>
<span class="ocrx_word" title="bbox 113 383 125 393">με</span>
<span class="ocrx_word" title="bbox 128 383 176 393">φυλάκιση.</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 270 413 322 423">
<span class="ocrx_line" title="bbox 270 413 322 423">
<span class="ocrx_word" title="bbox 270 413 302 423">Άρθρο</span>
<span class="ocrx_word" title="bbox 306 413 322 423">302</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 223 427 293 437">
<span class="ocrx_line" title="bbox 223 427 293 437">
<span class="ocrx_word" title="bbox 223 427 293 437">Γυναικοκτονία</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 307 427 410 437">
<span class="ocrx_line" title="bbox 307 427 410 437">
<span class="ocrx_word" title="bbox 307 427 326 437">από</span>
<span class="ocrx_word" title="bbox 330 427 369 437">θεσμική</span>
<span class="ocrx_word" title="bbox 371 427 410 437">αμέλεια</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 57 457 491 467">
<span class="ocrx_line" title="bbox 57 457 491 467">
<span class="ocrx_word" title="bbox 57 457 91 467">Όποιος</span>
<span class="ocrx_word" title="bbox 96 457 115 467">από</span>
<span class="ocrx_word" title="bbox 118 457 156 467">αμέλεια</span>
<span class="ocrx_word" title="bbox 161 457 202 467">σκότωσε</span>
<span class="ocrx_word" title="bbox 207 457 239 467">άλλην,</span>
<span class="ocrx_word" title="bbox 242 457 291 467">τιμωρείται</span>
<span class="ocrx_word" title="bbox 298 457 309 467">με</span>
<span class="ocrx_word" title="bbox 312 457 358 467">φυλάκιση</span>
<span class="ocrx_word" title="bbox 362 457 422 467">τουλάχιστον</span>
<span class="ocrx_word" title="bbox 426 457 453 467">τριών</span>
<span class="ocrx_word" title="bbox 457 457 491 467">μηνών.</span>
</span>
</div>
<div class="ocrx_block" pdftotree="paragraph" title="bbox 266 486 327 511">
<span class="ocrx_line" title="bbox 270 486 322 496">
<span class="ocrx_word" title="bbox 270 486 301 496">Άρθρο</span>
<span class="ocrx_word" title="bbox 306 486 322 496">303</span>
</span>
<span class="ocrx_line" title="bbox 266 501 327 511">
<span class="ocrx_word" title="bbox 266 501 327 511">Παιδοκτονία</span>
</span>
</div>
<div class="ocrx_block" pdftotree="paragraph" title="bbox 58 530 533 555">
<span class="ocrx_line" title="bbox 58 530 533 540">
<span class="ocrx_word" title="bbox 58 530 118 540">Πατέραςπου</span>
<span class="ocrx_word" title="bbox 123 530 134 540">με</span>
<span class="ocrx_word" title="bbox 137 530 178 540">πρόθεση</span>
<span class="ocrx_word" title="bbox 184 530 224 540">σκότωσε</span>
<span class="ocrx_word" title="bbox 229 530 266 540">τηνκόρη</span>
<span class="ocrx_word" title="bbox 271 530 288 540">του</span>
<span class="ocrx_word" title="bbox 291 530 315 540">κατά</span>
<span class="ocrx_word" title="bbox 318 530 324 540">ή</span>
<span class="ocrx_word" title="bbox 327 530 350 540">μετά</span>
<span class="ocrx_word" title="bbox 352 530 368 540">τον</span>
<span class="ocrx_word" title="bbox 371 530 405 540">τοκετό,</span>
<span class="ocrx_word" title="bbox 410 530 435 540">αλλά</span>
<span class="ocrx_word" title="bbox 437 530 456 540">ενώ</span>
<span class="ocrx_word" title="bbox 460 530 533 540">εξακολουθούσε</span>
</span>
<span class="ocrx_line" title="bbox 58 545 498 555">
<span class="ocrx_word" title="bbox 58 545 88 555">ακόμη</span>
<span class="ocrx_word" title="bbox 92 545 98 555">η</span>
<span class="ocrx_word" title="bbox 101 545 151 555">διατάραξη</span>
<span class="ocrx_word" title="bbox 155 545 171 555">του</span>
<span class="ocrx_word" title="bbox 176 545 232 555">οργανισμού</span>
<span class="ocrx_word" title="bbox 237 545 253 555">της</span>
<span class="ocrx_word" title="bbox 256 545 275 555">από</span>
<span class="ocrx_word" title="bbox 279 545 309 555">αυτόν,</span>
<span class="ocrx_word" title="bbox 313 545 363 555">τιμωρείται</span>
<span class="ocrx_word" title="bbox 370 545 381 555">με</span>
<span class="ocrx_word" title="bbox 384 545 428 555">κάθειρξη</span>
<span class="ocrx_word" title="bbox 431 545 448 555">έως</span>
<span class="ocrx_word" title="bbox 453 545 475 555">δέκα</span>
<span class="ocrx_word" title="bbox 479 545 498 555">έτη.</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 230 588 364 599">
<span class="ocrx_line" title="bbox 230 588 364 599">
<span class="ocrx_word" title="bbox 230 588 297 599">●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 300 588 318 599">●●●</span>
<span class="ocrx_word" title="bbox 321 588 364 599">●●●●●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 270 618 325 628">
<span class="ocrx_line" title="bbox 270 618 325 628">
<span class="ocrx_word" title="bbox 270 618 302 628">●●●●●</span>
<span class="ocrx_word" title="bbox 306 618 325 628">●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 247 632 349 642">
<span class="ocrx_line" title="bbox 247 632 349 642">
<span class="ocrx_word" title="bbox 247 632 289 642">●●●●●●●</span>
<span class="ocrx_word" title="bbox 292 632 311 642">●●●</span>
<span class="ocrx_word" title="bbox 312 632 349 642">●●●●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="paragraph" title="bbox 57 662 538 745">
<span class="ocrx_line" title="bbox 58 662 538 672">
<span class="ocrx_word" title="bbox 58 662 106 672">●●●●●●●●</span>
<span class="ocrx_word" title="bbox 109 662 140 672">●●●●●</span>
<span class="ocrx_word" title="bbox 141 662 153 672">●●</span>
<span class="ocrx_word" title="bbox 156 662 230 672">●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 232 662 268 672">●●●●●●</span>
<span class="ocrx_word" title="bbox 271 662 341 672">●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 344 662 374 672">●●●●●</span>
<span class="ocrx_word" title="bbox 378 662 396 672">●●●</span>
<span class="ocrx_word" title="bbox 398 662 467 672">●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 471 662 538 672">●●●●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 58 676 109 686">
<span class="ocrx_word" title="bbox 58 676 82 686">●●●●</span>
<span class="ocrx_word" title="bbox 84 676 109 686">●●●●</span>
</span>
<span class="ocrx_line" title="bbox 58 691 109 701">
<span class="ocrx_word" title="bbox 58 691 70 701">●●</span>
<span class="ocrx_word" title="bbox 72 691 109 701">●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 115 691 302 701">
<span class="ocrx_word" title="bbox 115 691 127 701">●●</span>
<span class="ocrx_word" title="bbox 132 691 144 701">●●</span>
<span class="ocrx_word" title="bbox 150 691 205 701">●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 207 691 226 701">●●●</span>
<span class="ocrx_word" title="bbox 230 691 266 701">●●●●●●</span>
<span class="ocrx_word" title="bbox 272 691 278 701">●</span>
<span class="ocrx_word" title="bbox 284 691 302 701">●●●</span>
</span>
<span class="ocrx_line" title="bbox 308 691 357 701">
<span class="ocrx_word" title="bbox 308 691 357 701">●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 369 691 387 701">
<span class="ocrx_word" title="bbox 369 691 387 701">●●●</span>
</span>
<span class="ocrx_line" title="bbox 394 691 537 701">
<span class="ocrx_word" title="bbox 394 691 425 701">●●●●●</span>
<span class="ocrx_word" title="bbox 429 691 441 701">●●</span>
<span class="ocrx_word" title="bbox 446 691 483 701">●●●●●●</span>
<span class="ocrx_word" title="bbox 485 691 528 701">●●●●●●●</span>
<span class="ocrx_word" title="bbox 531 691 537 701">●</span>
</span>
<span class="ocrx_line" title="bbox 58 706 538 716">
<span class="ocrx_word" title="bbox 58 706 127 716">●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 128 706 140 716">●●</span>
<span class="ocrx_word" title="bbox 143 706 167 716">●●●●</span>
<span class="ocrx_word" title="bbox 170 706 251 716">●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 255 706 383 716">●●●●●●●●●●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 385 706 538 716">●●●●●●●●●●●●●●●●●●●●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 58 720 106 730">
<span class="ocrx_word" title="bbox 58 720 106 730">●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 113 720 131 730">
<span class="ocrx_word" title="bbox 113 720 131 730">●●●</span>
</span>
<span class="ocrx_line" title="bbox 138 720 196 730">
<span class="ocrx_word" title="bbox 138 720 162 730">●●●●</span>
<span class="ocrx_word" title="bbox 166 720 184 730">●●●</span>
<span class="ocrx_word" title="bbox 190 720 196 730">●</span>
</span>
<span class="ocrx_line" title="bbox 202 720 329 730">
<span class="ocrx_word" title="bbox 202 720 257 730">●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 260 720 290 730">●●●●●</span>
<span class="ocrx_word" title="bbox 295 720 314 730">●●●</span>
<span class="ocrx_word" title="bbox 317 720 329 730">●●</span>
</span>
<span class="ocrx_line" title="bbox 336 720 461 730">
<span class="ocrx_word" title="bbox 336 720 379 730">●●●●●●●</span>
<span class="ocrx_word" title="bbox 380 720 404 730">●●●●</span>
<span class="ocrx_word" title="bbox 407 720 461 730">●●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 471 720 538 730">
<span class="ocrx_word" title="bbox 471 720 484 730">●●</span>
<span class="ocrx_word" title="bbox 490 720 538 730">●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 57 735 300 745">
<span class="ocrx_word" title="bbox 57 735 142 745">●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 147 735 171 745">●●●●</span>
<span class="ocrx_word" title="bbox 176 735 194 745">●●●</span>
<span class="ocrx_word" title="bbox 196 735 250 745">●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 252 735 300 745">●●●●●●●●</span>
</span>
<span class="ocrx_line" title="bbox 308 735 538 745">
<span class="ocrx_word" title="bbox 308 735 326 745">●●●</span>
<span class="ocrx_word" title="bbox 330 735 439 745">●●●●●●●●●●●●●●●●●●</span>
<span class="ocrx_word" title="bbox 442 735 467 745">●●●●</span>
<span class="ocrx_word" title="bbox 470 735 482 745">●●</span>
<span class="ocrx_word" title="bbox 486 735 517 745">●●●●●</span>
<span class="ocrx_word" title="bbox 519 735 538 745">●●●</span>
</span>
</div>
<div class="ocrx_block" pdftotree="section_header" title="bbox 526 782 536 792">
<span class="ocrx_line" title="bbox 526 782 536 792">
<span class="ocrx_word" title="bbox 526 782 536 792">78</span>
</span>
</div>
</div>
</body>
</html>

BIN
test.pdf

Binary file not shown.
Loading…
Cancel
Save