docling
docling copied to clipboard
`22682 segmentation fault python main3.py`
Bug
/Users/nsviridenko/ws/nikita-ai/tsa-browser-worker/main3.py:14: LangChainDeprecationWarning: Importing get_openai_callback from /Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/langchain/callbacks/__init__.py is deprecated. Please replace deprecated imports:
>> from /Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/langchain/callbacks/__init__.py import get_openai_callback
with new imports of:
>> from langchain_community.callbacks.manager import get_openai_callback
You can use the langchain cli to **automatically** upgrade many imports. Please see documentation here <https://python.langchain.com/docs/versions/v0_2/>
from langchain.callbacks import get_openai_callback
Fatal Python error: Segmentation fault
Current thread 0x000000010ecd3e00 (most recent call first):
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 1233 in create_module
File "<frozen importlib._bootstrap>", line 573 in module_from_spec
File "<frozen importlib._bootstrap>", line 676 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/pyarrow/__init__.py", line 65 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/pandas/compat/pyarrow.py", line 8 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/pandas/compat/__init__.py", line 27 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/pandas/__init__.py", line 26 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/docling_core/types/doc/document.py", line 19 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/docling_core/types/doc/__init__.py", line 9 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap>", line 1126 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/docling_core/types/__init__.py", line 8 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap>", line 1126 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/docling/backend/abstract_backend.py", line 6 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/.local/share/virtualenvs/tsa-browser-worker-_ynmeLqu/lib/python3.11/site-packages/docling/document_converter.py", line 10 in <module>
File "<frozen importlib._bootstrap>", line 241 in _call_with_frames_removed
File "<frozen importlib._bootstrap_external>", line 940 in exec_module
File "<frozen importlib._bootstrap>", line 690 in _load_unlocked
File "<frozen importlib._bootstrap>", line 1147 in _find_and_load_unlocked
File "<frozen importlib._bootstrap>", line 1176 in _find_and_load
File "/Users/nsviridenko/ws/nikita-ai/tsa-browser-worker/main3.py", line 18 in <module>
Extension modules: markupsafe._speedups, charset_normalizer.md, requests.packages.charset_normalizer.md, requests.packages.chardet.md, google._upb._message, greenlet._greenlet, yaml._yaml, regex._regex, numpy.core._multiarray_umath, numpy.core._multiarray_tests, numpy.linalg._umath_linalg, numpy.fft._pocketfft_internal, numpy.random._common, numpy.random.bit_generator, numpy.random._bounded_integers, numpy.random._mt19937, numpy.random.mtrand, numpy.random._philox, numpy.random._pcg64, numpy.random._sfc64, numpy.random._generator (total: 21)
[1] 22682 segmentation fault python main3.py
Steps to reproduce
```python
from docling.document_converter import DocumentConverter
converter = DocumentConverter()
result = converter.convert(html_content)
markdown_content = result.document.export_to_markdown()
print(markdown_content)
```
Docling version
```json
"docling": {
    "hashes": [
        "sha256:47222067fcfe87dbe8875ebab53dcad87e7637aea87c854c4951455846ad5031",
        "sha256:993ac2d7024684c7bcec75169fc28a2f7f880b2c803608dc9da1db3cfbcae647"
    ],
    "index": "pypi",
    "markers": "python_version >= '3.9' and python_version < '4.0'",
    "version": "==2.7.0"
},
```
Python version
Python 3.11.5