feat(llm): Send images to model and enhance processing prompt

This commit is contained in:
2025-10-25 22:51:54 +11:00
parent 37d4facee3
commit 4f29d5c814
3 changed files with 94 additions and 45 deletions

38
uv.lock generated
View File

@@ -294,25 +294,6 @@ wheels = [
{ url = "https://files.pythonhosted.org/packages/31/f3/039520544492e4015703880df3475973bd9ed1b35d20674616f96fc07268/docling_parse-4.7.0-cp314-cp314-win_amd64.whl", hash = "sha256:c9add2fdd93cfc6ef14f82085af8d26444711255569e6fffb661a7f5f878f9a8", size = 16783637, upload-time = "2025-10-20T13:45:21.561Z" },
]
[[package]]
name = "docling-tool"
version = "0.1.0"
source = { virtual = "." }
dependencies = [
{ name = "docling" },
{ name = "langchain" },
{ name = "langchain-google-genai" },
{ name = "langchain-ollama" },
]
[package.metadata]
requires-dist = [
{ name = "docling", specifier = ">=2.57.0" },
{ name = "langchain", specifier = ">=1.0.2" },
{ name = "langchain-google-genai", specifier = ">=3.0.0" },
{ name = "langchain-ollama", specifier = ">=1.0.0" },
]
[[package]]
name = "et-xmlfile"
version = "2.0.0"
@@ -2148,6 +2129,25 @@ wheels = [
{ url = "https://files.pythonhosted.org/packages/b7/ce/149a00dd41f10bc29e5921b496af8b574d8413afcd5e30dfa0ed46c2cc5e/six-1.17.0-py2.py3-none-any.whl", hash = "sha256:4721f391ed90541fddacab5acf947aa0d3dc7d27b2e1e8eda2be8970586c3274", size = 11050, upload-time = "2024-12-04T17:35:26.475Z" },
]
[[package]]
name = "slide-translate"
version = "0.1.0"
source = { virtual = "." }
dependencies = [
{ name = "docling" },
{ name = "langchain" },
{ name = "langchain-google-genai" },
{ name = "langchain-ollama" },
]
[package.metadata]
requires-dist = [
{ name = "docling", specifier = ">=2.57.0" },
{ name = "langchain", specifier = ">=1.0.2" },
{ name = "langchain-google-genai", specifier = ">=3.0.0" },
{ name = "langchain-ollama", specifier = ">=1.0.0" },
]
[[package]]
name = "sniffio"
version = "1.3.1"