File tree Expand file tree Collapse file tree 5 files changed +17
-7
lines changed Expand file tree Collapse file tree 5 files changed +17
-7
lines changed Original file line number Diff line number Diff line change 1
1
# Change Log
2
2
3
+ ## Changes in version 0.0.24
4
+
5
+ ### Fixes:
6
+
7
+ * [270](https://github.com/pymupdf/RAG/issues/270) - Fix UnboundLocalError for table_strategy in pymupdf_rag.py
8
+
9
+ ### Other Changes:
10
+
11
+
12
+
3
13
## Changes in version 0.0.23
4
14
5
15
### Fixes:
Original file line number Diff line number Diff line change 13
13
"Programming Language :: Python :: 3" ,
14
14
"Topic :: Utilities" ,
15
15
]
16
- requires = ["pymupdf4llm==0.0.23 " ]
16
+ requires = ["pymupdf4llm==0.0.24 " ]
17
17
18
18
setuptools .setup (
19
19
name = "pdf4llm" ,
20
- version = "0.0.23 " ,
20
+ version = "0.0.24 " ,
21
21
author = "Artifex" ,
22
22
author_email = "support@artifex.com" ,
23
23
description = "PyMuPDF Utilities for LLM/RAG" ,
Original file line number Diff line number Diff line change 1
1
from .helpers .pymupdf_rag import IdentifyHeaders , to_markdown
2
2
3
- __version__ = "0.0.23 "
3
+ __version__ = "0.0.24 "
4
4
version = __version__
5
5
version_tuple = tuple (map (int , version .split ("." )))
6
6
Original file line number Diff line number Diff line change @@ -988,12 +988,12 @@ def get_page_output(
988
988
graphics_count = len ([b for b in page .get_bboxlog () if "path" in b [0 ]])
989
989
if GRAPHICS_LIMIT and graphics_count > GRAPHICS_LIMIT :
990
990
IGNORE_GRAPHICS = True
991
- table_strategy = None
992
991
993
992
# Locate all tables on page
994
993
parms .written_tables = [] # stores already written tables
995
994
omitted_table_rects = []
996
- if table_strategy is None :
995
+ if IGNORE_GRAPHICS or not table_strategy :
996
+ # do not try to extract tables
997
997
parms .tabs = None
998
998
else :
999
999
parms .tabs = page .find_tables (clip = parms .clip , strategy = table_strategy )
@@ -1147,7 +1147,7 @@ def get_page_output(
1147
1147
toc = doc .get_toc ()
1148
1148
1149
1149
# Text extraction flags:
1150
- # omit invisible text, collect styles, use accurate bounding boxes
1150
+ # omit clipped text, collect styles, use accurate bounding boxes
1151
1151
textflags = (
1152
1152
0
1153
1153
| mupdf .FZ_STEXT_CLIP
Original file line number Diff line number Diff line change 17
17
18
18
setuptools .setup (
19
19
name = "pymupdf4llm" ,
20
- version = "0.0.23 " ,
20
+ version = "0.0.24 " ,
21
21
author = "Artifex" ,
22
22
author_email = "support@artifex.com" ,
23
23
description = "PyMuPDF Utilities for LLM/RAG" ,
You can’t perform that action at this time.
0 commit comments