diff --git a/functions/import_pipeline/import_pipeline.py b/functions/import_pipeline/import_pipeline.py
index d58d2a6..a1d3720 100644
--- a/functions/import_pipeline/import_pipeline.py
+++ b/functions/import_pipeline/import_pipeline.py
@@ -103,7 +103,12 @@ def import_arxiv_latex_and_pdf(
         raise
 
     if len(latex_string) > MAX_LATEX_CHARACTER_COUNT:
-        raise ValueError(f"Document is too long")
+        raise ValueError(
+            f"Document is too long: {len(latex_string):,} characters "
+            f"(limit is {MAX_LATEX_CHARACTER_COUNT:,}). "
+            f"Consider using a shorter version of the paper or "
+            f"splitting it into sections."
+        )
 
     if existing_model_output_file:
         with open(existing_model_output_file, "r") as file: