Merged
39 changes: 20 additions & 19 deletions python-client/giskard/models/base/wrapper.py
@@ -6,10 +6,10 @@
from typing import Any, Callable, Iterable, Optional, Union

import cloudpickle
import mlflow
import numpy as np
import pandas as pd
import yaml
import mlflow

from ...core.core import ModelType
from ...core.validation import configured_validate_arguments
@@ -31,18 +31,18 @@ class WrapperModel(BaseModel, ABC):

@configured_validate_arguments
def __init__(
self,
model: Any,
model_type: ModelType,
data_preprocessing_function: Optional[Callable[[pd.DataFrame], Any]] = None,
model_postprocessing_function: Optional[Callable[[Any], Any]] = None,
name: Optional[str] = None,
feature_names: Optional[Iterable] = None,
classification_threshold: Optional[float] = 0.5,
classification_labels: Optional[Iterable] = None,
id: Optional[str] = None,
batch_size: Optional[int] = None,
**kwargs,
self,
model: Any,
model_type: ModelType,
data_preprocessing_function: Optional[Callable[[pd.DataFrame], Any]] = None,
model_postprocessing_function: Optional[Callable[[Any], Any]] = None,
name: Optional[str] = None,
feature_names: Optional[Iterable] = None,
classification_threshold: Optional[float] = 0.5,
classification_labels: Optional[Iterable] = None,
id: Optional[str] = None,
batch_size: Optional[int] = None,
**kwargs,
) -> None:
"""
Parameters
@@ -130,7 +130,12 @@ def predict_df(self, df: pd.DataFrame):
output = self._postprocess(output)
outputs.append(output)

return np.concatenate(outputs)
raw_prediction = np.concatenate(outputs)

if self.is_regression:
return raw_prediction.astype(float)

return raw_prediction

def _possibly_fix_predictions_shape(self, raw_predictions: np.ndarray):
if not self.is_classification:
@@ -292,15 +297,11 @@ def load_wrapper_meta(cls, local_dir):
# ensuring backward compatibility
return {"batch_size": None}

def to_mlflow(self,
artifact_path: str = "prediction-function-from-giskard",
**kwargs):

def to_mlflow(self, artifact_path: str = "prediction-function-from-giskard", **kwargs):
def _giskard_predict(df):
return self.predict(df)

class MLflowModel(mlflow.pyfunc.PythonModel):

def predict(self, df):
return _giskard_predict(df)

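The to_mlflow change above wraps the model's predict function in an mlflow.pyfunc.PythonModel subclass. Below is a minimal sketch of that wrapping pattern, not Giskard's exact implementation: my_predict and PredictionFunctionModel are placeholder names, and the classic (context, model_input) pyfunc signature is used for portability across MLflow versions.

import mlflow
import pandas as pd


def my_predict(df: pd.DataFrame) -> pd.Series:
    # Placeholder standing in for WrapperModel.predict: one value per row.
    return df.sum(axis=1)


class PredictionFunctionModel(mlflow.pyfunc.PythonModel):
    # pyfunc adapter: delegate MLflow's predict call to the wrapped function.
    def predict(self, context, model_input):
        return my_predict(model_input)


with mlflow.start_run():
    mlflow.pyfunc.log_model(
        artifact_path="prediction-function-from-giskard",  # default artifact path used in the diff above
        python_model=PredictionFunctionModel(),
    )
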
68 changes: 41 additions & 27 deletions python-client/giskard/models/cache/cache.py
@@ -1,14 +1,13 @@
import csv
import os
import uuid
from pathlib import Path
from typing import Dict, List, Any, Iterable, Optional
from typing import Any, Iterable, List, Optional

import numpy as np
import pandas as pd

from giskard.core.core import SupportedModelTypes
from giskard.settings import settings
from ...client.python_utils import warning
from ...core.core import SupportedModelTypes
from ...settings import settings

NaN = float("NaN")

@@ -24,43 +23,58 @@ def flatten(xs):


class ModelCache:
id: Optional[str] = None
prediction_cache: Dict[str, Any] = None
_default_cache_dir_prefix = Path(settings.home_dir / settings.cache_dir / "global" / "prediction_cache")

vectorized_get_cache_or_na = None

def __init__(self, model_type: SupportedModelTypes, id: Optional[str] = None, cache_dir: Path = None):
self.id = id or str(uuid.uuid4())
def __init__(self, model_type: SupportedModelTypes, id: Optional[str] = None, cache_dir: Optional[Path] = None):
self.id = id
self.prediction_cache = dict()
self.cache_dir = cache_dir or Path(settings.home_dir / settings.cache_dir / "global/prediction_cache" / self.id)

if id is not None:
if (self.cache_dir / CACHE_CSV_FILENAME).exists():
with open(self.cache_dir / CACHE_CSV_FILENAME, "r") as pred_f:
reader = csv.reader(pred_f)
for row in reader:
if model_type == SupportedModelTypes.TEXT_GENERATION:
self.prediction_cache[row[0]] = row[1:]
elif model_type == SupportedModelTypes.REGRESSION:
self.prediction_cache[row[0]] = float(row[1])
else:
self.prediction_cache[row[0]] = [float(i) for i in row[1:]]

if cache_dir is None and self.id:
cache_dir = self._default_cache_dir_prefix.joinpath(self.id)

self.cache_file = cache_dir / CACHE_CSV_FILENAME if cache_dir else None

self.vectorized_get_cache_or_na = np.vectorize(self.get_cache_or_na, otypes=[object])
self.model_type = model_type
self._warmed_up = False

def warm_up_from_disk(self):
Review thread on warm_up_from_disk (a usage sketch of this lazy warm-up follows the cache.py diff below):

Contributor: Why not warm up at creation time instead of read_from_cache?

Member Author (mattbit): Because I don't want to warm up if the cache is disabled. But it's still better to create the ModelCache object in the model, so that it can be used if the cache is enabled at a later time.

Contributor: I think in case the cache is disabled the cleanest will be not to initialize the _cache property at all and then warm it up in the ModelCache constructor depending on the cache type (in-memory only vs FS-backed), WDYT?

Member Author (mattbit, Aug 25, 2023): But the cache can be disabled temporarily. So if we don't initialize the _cache property at all, we would need to check if it exists at every prediction, initializing it there and possibly warming it up at prediction time, in addition to checking that the cache is enabled. That's because the cache could have been disabled when the model was initialized, but enabled later. In any case I would avoid doing expensive and persistent operations upon construction of the instance.

Contributor: ok, let's keep it this way

if self.cache_file is None or not self.cache_file.exists():
return

try:
with self.cache_file.open("r", newline="") as pred_f:
reader = csv.reader(pred_f)
for row in reader:
if self.model_type == SupportedModelTypes.TEXT_GENERATION:
# Text generation models output should be a single string
self.prediction_cache[row[0]] = row[1]
elif self.model_type == SupportedModelTypes.REGRESSION:
# Regression model output is always cast to float
self.prediction_cache[row[0]] = float(row[1])
else:
# Classification models return list of probabilities
self.prediction_cache[row[0]] = [float(i) for i in row[1:]]
except Exception as e:
warning(f"Failed to load cache from disk for model {self.id}: {e}")

def get_cache_or_na(self, key: str):
return self.prediction_cache.get(key, NaN)

def read_from_cache(self, keys: pd.Series):
if self.id and not self._warmed_up:
self.warm_up_from_disk()
self._warmed_up = True

return pd.Series(self.vectorized_get_cache_or_na(keys), index=keys.index)

def set_cache(self, keys: pd.Series, values: List[Any]):
for i in range(len(keys)):
self.prediction_cache[keys.iloc[i]] = values[i]

if self.id:
os.makedirs(self.cache_dir, exist_ok=True)
with open(self.cache_dir / CACHE_CSV_FILENAME, "a") as pred_f:
if self.cache_file is not None:
self.cache_file.parent.mkdir(parents=True, exist_ok=True)
with self.cache_file.open("a", newline="") as pred_f:
writer = csv.writer(pred_f)
for i in range(len(keys)):
writer.writerow(flatten([keys.iloc[i], values[i]]))
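The review thread above settles on lazy warm-up: the cache file is only read on the first read_from_cache call, not in the constructor. Here is a minimal usage sketch of that behavior, assuming the giskard python-client from this PR is installed; the id string and cached values are placeholders, and the default cache directory under the Giskard settings home is used.

import pandas as pd

from giskard.core.core import SupportedModelTypes
from giskard.models.cache import ModelCache

# Constructing the cache does no disk reads: warm_up_from_disk is deferred.
cache = ModelCache(SupportedModelTypes.REGRESSION, id="my-model-id")

keys = pd.Series(["key-1", "key-2"])
cache.set_cache(keys, [1.0, 2.0])  # kept in memory and appended to the CSV cache file

# The first read triggers warm_up_from_disk() once; later reads hit memory only.
print(cache.read_from_cache(keys).tolist())  # [1.0, 2.0]

# Unknown keys come back as NaN instead of raising.
print(cache.read_from_cache(pd.Series(["missing-key"])).tolist())  # [nan]
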
31 changes: 30 additions & 1 deletion python-client/tests/models/test_model_cache.py
@@ -4,13 +4,42 @@
import numpy as np
import pandas as pd
import xxhash
from langchain import LLMChain, PromptTemplate
from langchain.llms.fake import FakeListLLM

import giskard
from giskard import Model, Dataset
from giskard import Dataset, Model
from giskard.core.core import SupportedModelTypes
from giskard.models.cache import ModelCache


def test_model_prediction_is_cached_on_text_generation_model():
llm = FakeListLLM(responses=['This is my text with special chars" → ,.!? # and \n\nnewlines', "This is my text"])

prompt = PromptTemplate(template="{instruct}", input_variables=["instruct"])
chain = LLMChain(llm=llm, prompt=prompt)
model = Model(chain, model_type="text_generation")
dataset = Dataset(
pd.DataFrame({"instruct": ["Test 1", "Test 2"]}),
column_types={
"instruct": "text",
},
)
model.predict(dataset)

# Should load from cache
assert model.predict(dataset).raw_prediction.tolist() == llm.responses
assert model.predict(dataset).raw_prediction.tolist() == llm.responses

# Test cache persistence
model_id = model.id

del model
model = Model(chain, model_type="text_generation", id=model_id.hex)

assert model.predict(dataset).raw_prediction.tolist() == llm.responses


def test_model_prediction_is_cached_on_regression_model():
called_indexes = []
