validmind · johnwalz97 · Feb 11, 2025 · Feb 11, 2025 · Feb 11, 2025 · Feb 11, 2025
diff --git a/pyproject.toml b/pyproject.toml
@@ -10,7 +10,7 @@ description = "ValidMind Library"
 license = "Commercial License"
 name = "validmind"
 readme = "README.pypi.md"
-version = "2.7.7"
+version = "2.7.8"
 
 [tool.poetry.dependencies]
 aiohttp = {extras = ["speedups"], version = "*"}

diff --git a/validmind/__version__.py b/validmind/__version__.py
@@ -1 +1 @@
-__version__ = "2.7.7"
+__version__ = "2.7.8"
diff --git a/validmind/ai/test_descriptions.py b/validmind/ai/test_descriptions.py
@@ -8,6 +8,7 @@
 from concurrent.futures import ThreadPoolExecutor
 from typing import List, Optional, Union
 
+import tiktoken
 from jinja2 import Template
 
 from ..client_config import client_config
@@ -82,6 +83,29 @@ def _get_llm_global_context():
     return context if context_enabled and context else None
 
 
+def _truncate_summary(summary: str, test_id: str, max_tokens: int = 100_000):
+    if len(summary) < max_tokens:
+        # since string itself is less than max_tokens, definitely small enough
+        return summary
+
+    # TODO: better context length handling
+    encoding = tiktoken.encoding_for_model("gpt-4o")
+    summary_tokens = encoding.encode(summary)
+
+    if len(summary_tokens) > max_tokens:
+        logger.warning(
+            f"Truncating {test_id} due to context length restrictions..."
+            " Generated description may be innacurate"
+        )
+        summary = (
+            encoding.decode(summary_tokens[:max_tokens])
+            + "...[truncated]"
+            + encoding.decode(summary_tokens[-100:])
+        )
+
+    return summary
+
+
 def generate_description(
     test_id: str,
     test_description: str,
@@ -127,7 +151,7 @@ def generate_description(
         "test_name": test_name,
         "test_description": test_description,
         "title": title,
-        "summary": summary,
+        "summary": _truncate_summary(summary, test_id),
         "figures": [figure._get_b64_url() for figure in ([] if tables else figures)],
         "context": context,
     }
@@ -165,7 +189,13 @@ def wrapped():
                 title=title,
             )
         except Exception as e:
-            logger.error(f"Failed to generate description: {e}")
+            if "maximum context length" in str(e):
+                logger.warning(
+                    f"Test result {test_id} is too large to generate a description"
+                )
+            else:
+                logger.warning(f"Failed to generate description for {test_id}: {e}")
+            logger.warning(f"Using default description for {test_id}")
 
             return test_description
 

diff --git a/validmind/tests/run.py b/validmind/tests/run.py
@@ -3,11 +3,11 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 
 import platform
+import pprint
 import subprocess
 import time
 from datetime import datetime
 from inspect import getdoc
-import pprint
 from typing import Any, Callable, Dict, List, Optional, Tuple, Union
 from uuid import uuid4