diff --git a/tamingllms/_build/.doctrees/environment.pickle b/tamingllms/_build/.doctrees/environment.pickle index ebb908a..9f32a87 100644 Binary files a/tamingllms/_build/.doctrees/environment.pickle and b/tamingllms/_build/.doctrees/environment.pickle differ diff --git a/tamingllms/_build/.doctrees/notebooks/input.doctree b/tamingllms/_build/.doctrees/notebooks/input.doctree index 3069486..8bdabeb 100644 Binary files a/tamingllms/_build/.doctrees/notebooks/input.doctree and b/tamingllms/_build/.doctrees/notebooks/input.doctree differ diff --git a/tamingllms/_build/html/_sources/notebooks/input.ipynb b/tamingllms/_build/html/_sources/notebooks/input.ipynb index b5ad6c5..66e5c30 100644 --- a/tamingllms/_build/html/_sources/notebooks/input.ipynb +++ b/tamingllms/_build/html/_sources/notebooks/input.ipynb @@ -171,7 +171,7 @@ "from docling.document_converter import DocumentConverter\n", "\n", "converter = DocumentConverter()\n", - "forecast_result_docling = converter.convert(source).document.export_to_markdown()" + "forecast_result_docling = converter.convert(FORECAST_FILE_PATH).document.export_to_markdown()" ] }, { diff --git a/tamingllms/_build/html/notebooks/input.html b/tamingllms/_build/html/notebooks/input.html index ce139f8..776c377 100644 --- a/tamingllms/_build/html/notebooks/input.html +++ b/tamingllms/_build/html/notebooks/input.html @@ -408,7 +408,7 @@

from docling.document_converter import DocumentConverter
 
 converter = DocumentConverter()
-forecast_result_docling = converter.convert(source).document.export_to_markdown()
+forecast_result_docling = converter.convert(FORECAST_FILE_PATH).document.export_to_markdown()
 
diff --git a/tamingllms/_build/jupyter_execute/markdown/intro.ipynb b/tamingllms/_build/jupyter_execute/markdown/intro.ipynb index a039551..a1ac36c 100644 --- a/tamingllms/_build/jupyter_execute/markdown/intro.ipynb +++ b/tamingllms/_build/jupyter_execute/markdown/intro.ipynb @@ -2,7 +2,7 @@ "cells": [ { "cell_type": "markdown", - "id": "8b162760", + "id": "54449f64", "metadata": {}, "source": [ "(intro)=\n", diff --git a/tamingllms/_build/jupyter_execute/notebooks/input.ipynb b/tamingllms/_build/jupyter_execute/notebooks/input.ipynb index a89a1c3..de692a5 100644 --- a/tamingllms/_build/jupyter_execute/notebooks/input.ipynb +++ b/tamingllms/_build/jupyter_execute/notebooks/input.ipynb @@ -171,7 +171,7 @@ "from docling.document_converter import DocumentConverter\n", "\n", "converter = DocumentConverter()\n", - "forecast_result_docling = converter.convert(source).document.export_to_markdown()" + "forecast_result_docling = converter.convert(FORECAST_FILE_PATH).document.export_to_markdown()" ] }, { diff --git a/tamingllms/latex/chapters/input.tex b/tamingllms/latex/chapters/input.tex index c279655..caf2277 100644 --- a/tamingllms/latex/chapters/input.tex +++ b/tamingllms/latex/chapters/input.tex @@ -117,7 +117,7 @@ \subsection{Structured Data Extraction\index{Structured output}} from docling.document_converter import DocumentConverter converter = DocumentConverter() -forecast_result_docling = converter.convert(source).document.export_to_markdown() +forecast_result_docling = converter.convert(FORECAST_FILE_PATH).document.export_to_markdown() \end{minted} How similar are the two results? We can use use Levenshtein distance\index{Levenshtein distance}~\sidecite{10.5555/1822502} to measure the similarity between the two results. We will also calculate a naive score using the \texttt{SequenceMatcher} from the \texttt{difflib} package, which is a simple measure of similarity between two strings based on the number of matches in the longest common subsequence. diff --git a/tamingllms/notebooks/input.ipynb b/tamingllms/notebooks/input.ipynb index b5ad6c5..66e5c30 100644 --- a/tamingllms/notebooks/input.ipynb +++ b/tamingllms/notebooks/input.ipynb @@ -171,7 +171,7 @@ "from docling.document_converter import DocumentConverter\n", "\n", "converter = DocumentConverter()\n", - "forecast_result_docling = converter.convert(source).document.export_to_markdown()" + "forecast_result_docling = converter.convert(FORECAST_FILE_PATH).document.export_to_markdown()" ] }, {