init

8 months ago · c59a4dbb7f
commit c59a4dbb7f
2 changed files with 14 additions and 0 deletions
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1 @@
 *.pdf
--- a/app.py
+++ b/app.py
@@ -0,0 +1,13 @@
 import fitz
 import re
 # Open the PDF and take its first page (used below as the index page).
 doc = fitz.open("test.pdf")
 index_page = doc[0]
 # Item [4] of each entry is read below as the block's text; PyMuPDF documents
 # "blocks" entries as (x0, y0, x1, y1, text, block_no, block_type).
 blocks = index_page.get_text("blocks")
 for block in blocks:
     text = block[4].strip()
     # int() raises ValueError for any block whose text is not a bare integer,
     # which previously aborted the script before the regex search below could
     # run for that block or any later one. Guard the conversion instead.
     try:
         number = int(text)
     except ValueError:
         number = None
     if number is not None:
         print(number)
     # Independently of the above, print the first run of digits in the block.
     match = re.search(r'(\d+)', text)
     if match:
         print(match.group(1))