PacificAI
diff --git a/.github/workflows/build_and_test.yml b/.github/workflows/build_and_test.yml
Lines changed: 2 additions & 2 deletions
diff --git a/.github/workflows/llm_tests_build.yml b/.github/workflows/llm_tests_build.yml
Lines changed: 1 addition & 1 deletion
diff --git a/.github/workflows/release.yaml b/.github/workflows/release.yaml
Lines changed: 1 addition & 1 deletion
diff --git a/langtest/datahandler/datasource.py b/langtest/datahandler/datasource.py
Lines changed: 1 addition & 1 deletion
diff --git a/langtest/langtest.py b/langtest/langtest.py
Lines changed: 1 addition & 1 deletion
diff --git a/langtest/metrics/llm_eval.py b/langtest/metrics/llm_eval.py
Lines changed: 16 additions & 19 deletions
diff --git a/langtest/modelhandler/__init__.py b/langtest/modelhandler/__init__.py
Lines changed: 2 additions & 2 deletions
diff --git a/langtest/modelhandler/llm_modelhandler.py b/langtest/modelhandler/llm_modelhandler.py
Lines changed: 2 additions & 2 deletions
diff --git a/langtest/modelhandler/modelhandler.py b/langtest/modelhandler/modelhandler.py
Lines changed: 3 additions & 3 deletions
diff --git a/langtest/transform/accuracy.py b/langtest/transform/accuracy.py
Lines changed: 11 additions & 4 deletions
@@ -17,7 +17,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: [ "3.9","3.10", "3.11" ]
+        python-version: ["3.12", "3.13" ]
 
     steps:
       - name: Free up disk space at start
@@ -53,7 +53,7 @@ jobs:
         if: steps.cached-poetry-dependencies.outputs.cache-hit != 'true'
         run: |
           poetry cache clear pypi --all -n > /dev/null
-          poetry install --with dev --all-extras --no-cache --quiet --no-interaction
+          poetry install --with dev --all-extras --no-cache --no-interaction
           source ./.venv/bin/activate && pip uninstall -y pyspark && rm -rf ./.venv/lib/python${{ matrix.python-version }}/site-packages/pyspark*/
           pip install pyspark==3.5.6
 
 
@@ -10,7 +10,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: [ "3.8", "3.9", "3.10" ]
+        python-version: [ "3.12", "3.13" ]
 
     steps:
       - uses: actions/checkout@v3
 
@@ -9,7 +9,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        python-version: [3.9]
+        python-version: [3.12]
         poetry-version: [2.1.3]
         os: [ubuntu-latest]
     runs-on: ${{ matrix.os }}
 
@@ -808,7 +808,7 @@ def load_raw_data(self, standardize_columns: bool = False) -> List[Dict]:
                 parsed CSV file into list of dicts
         """
 
-        if type(self._file_path) == dict:
+        if isinstance(self._file_path, dict):
             df = pd.read_csv(self._file_path["data_source"])
 
             if self.task == "text-classification":
 
@@ -286,7 +286,7 @@ def configure(self, config: Union[HarnessConfig, dict, str]) -> HarnessConfig:
         Returns:
             dict: Loaded configuration.
         """
-        if type(config) == dict:
+        if isinstance(config, dict):
             self._config = config
         else:
             with open(config, "r", encoding="utf-8") as yml:
 
@@ -66,25 +66,22 @@ def build_prompt(
                 f"""\n\nScore the student answer based on the following criteria:\n{eval_criteria}"""
             )
 
-        prompt += dedent(
-            f"""
-        Example Format:
-        QUESTION: question here
-        STUDENT ANSWER: student's answer here
-        TRUE ANSWER: true answer here
-        GRADE: {grade_list} here
-
-        {
-            ("Grade the student answers based ONLY on their factual accuracy. Ignore differences"
-             " in punctuation and phrasing between the student answer and true answer. It is OK "
-             "if the student answer contains more or relevant information than the true answer, as"
-             " long as it does not contain any conflicting statements. Begin!")
-        }
-
-        QUESTION: {{query}}
-        STUDENT ANSWER: {{result}}
-        TRUE ANSWER: {{answer}}
-        GRADE:"""
+        prompt += (
+            "Example Format:\n"
+            "QUESTION: question here\n"
+            "STUDENT ANSWER: student's answer here\n"
+            "TRUE ANSWER: true answer here\n"
+            f"GRADE: {grade_list} here"
+            "\n\n"
+            "Grade the student answers based ONLY on their factual accuracy. Ignore differences"
+            " in punctuation and phrasing between the student answer and true answer. It is OK "
+            "if the student answer contains more or relevant information than the true answer, as"
+            " long as it does not contain any conflicting statements. Begin!"
+            "\n\n"
+            "QUESTION: {{query}}\n"
+            "STUDENT ANSWER: {{result}}\n"
+            "TRUE ANSWER: {{answer}}\n"
+            "GRADE:\n"
         )
         return prompt
 
 
@@ -33,15 +33,15 @@
 
 
 if "langchain" in INSTALLED_HUBS:
-    import langchain
+    import langchain_classic
 
     LANGCHAIN_HUBS = {
         (
             RENAME_HUBS.get(hub.lower(), hub.lower())
             if hub.lower() in RENAME_HUBS
             else hub.lower()
         ): hub
-        for hub in langchain.llms.__all__
+        for hub in langchain_classic.llms.__all__
     }
     LANGCHAIN_HUBS["openrouter"] = "openrouter"
 
 
@@ -3,9 +3,9 @@
 
 import os
 from typing import Any, List, Type, Union, TypeVar
-import langchain.llms as lc
+import langchain_classic.llms as lc
 import langchain.chat_models as chat_models
-from langchain.chains.llm import LLMChain
+from langchain_classic.chains.llm import LLMChain
 from langchain_core.prompts import PromptTemplate
 from langchain_core.language_models.base import BaseLanguageModel
 from langchain_core.exceptions import OutputParserException
 
@@ -14,16 +14,16 @@
 }
 
 if try_import_lib("langchain"):
-    import langchain
-    import langchain.llms
+    import langchain_classic
+    import langchain_classic.llms
 
     LANGCHAIN_HUBS = {
         (
             RENAME_HUBS.get(hub.lower(), hub.lower())
             if hub.lower() in RENAME_HUBS
             else hub.lower()
         ): hub
-        for hub in langchain.llms.__all__
+        for hub in langchain_classic.llms.__all__
     }
     LANGCHAIN_HUBS["openrouter"] = "openrouter"
 else:
 
@@ -276,7 +276,8 @@ class BaseAccuracy(ABC):
 
     TestConfig = TypedDict(
         "TestConfig",
-        min_score=Union[Dict[str, float], float],
+        # min_score=Union[Dict[str, float], float],
+        {"min_score": Union[Dict[str, float], float]},
     )
 
     @classmethod
@@ -1029,9 +1030,15 @@ class LLMEval(BaseAccuracy):
 
     TestConfig = TypedDict(
         "TestConfig",
-        model=str,
-        hub=str,
-        min_score=float,
+        # model=str,
+        # hub=str,
+        # min_score=float,
+        {
+            "model": str,
+            "hub": str,
+            "model_parameters": dict,
+            "min_score": float,
+        },
     )
 
     @classmethod
Original file line number	Diff line number	Diff line change
`@@ -33,15 +33,15 @@`
`33`	`33`
`34`	`34`
`35`	`35`	`if "langchain" in INSTALLED_HUBS:`
`36`		`- import langchain`
	`36`	`+ import langchain_classic`
`37`	`37`
`38`	`38`	`LANGCHAIN_HUBS = {`
`39`	`39`	`(`
`40`	`40`	`RENAME_HUBS.get(hub.lower(), hub.lower())`
`41`	`41`	`if hub.lower() in RENAME_HUBS`
`42`	`42`	`else hub.lower()`
`43`	`43`	`): hub`
`44`		`- for hub in langchain.llms.__all__`
	`44`	`+ for hub in langchain_classic.llms.__all__`
`45`	`45`	`}`
`46`	`46`	`LANGCHAIN_HUBS["openrouter"] = "openrouter"`
`47`	`47`
Original file line number	Diff line number	Diff line change
`@@ -14,16 +14,16 @@`
`14`	`14`	`}`
`15`	`15`
`16`	`16`	`if try_import_lib("langchain"):`
`17`		`- import langchain`
`18`		`- import langchain.llms`
	`17`	`+ import langchain_classic`
	`18`	`+ import langchain_classic.llms`
`19`	`19`
`20`	`20`	`LANGCHAIN_HUBS = {`
`21`	`21`	`(`
`22`	`22`	`RENAME_HUBS.get(hub.lower(), hub.lower())`
`23`	`23`	`if hub.lower() in RENAME_HUBS`
`24`	`24`	`else hub.lower()`
`25`	`25`	`): hub`
`26`		`- for hub in langchain.llms.__all__`
	`26`	`+ for hub in langchain_classic.llms.__all__`
`27`	`27`	`}`
`28`	`28`	`LANGCHAIN_HUBS["openrouter"] = "openrouter"`
`29`	`29`	`else:`