Source code for ontolearn.verbalizer

# -----------------------------------------------------------------------------
# MIT License
#
# Copyright (c) 2024 Ontolearn Team
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
# -----------------------------------------------------------------------------

import requests
from openai import OpenAI
from ontolearn.utils.static_funcs import assert_class_expression_type
from typing import Optional, Union



[docs] class LLMVerbalizer: def __init__(self, model: str = "mixtral:8x7b", url: str = "http://tentris-ml.cs.upb.de:8000/api/generate", api_key: Optional[str] = None): self.model = model self.url = url self.api_key = api_key if api_key: self.client = OpenAI(base_url=self.url, api_key=self.api_key)
[docs] def __call__(self, text: str): """ :param text: String representation of an OWL Class Expression """ assert isinstance(text, str) or assert_class_expression_type(text), "Input must be a string or either of the family OWL class expression" prompt = f"<s> [INST] You are an expert in description logics. You are particularly good at explaining complex concepts with few sentences. [/INST] Model answer</s> [INST] Verbalize {text} in natural language with 1 sentence. Provide no explanations or write no notes.[/INST]" print("Waiting for the verbalization..") try: if not self.api_key: response = requests.get(url=self.url, headers={"accept": "application/json", "Content-Type": "application/json"}, json={"model": self.model, "prompt": prompt}, timeout=30) if response.ok: return response.json()["response"] else: return f"No verbalization due to the HTTP connection\t{response.text}" else: assert isinstance(self.api_key, str) and self.api_key != '', "Use a valid api key as string" response = self.client.chat.completions.create( model=self.model, messages=[ {"role": "system", "content": "You are a helpful assistant."}, {"role": "user", "content": prompt}] ) return (response.choices[0].message.content) except: return f"No verbalization. Error at HTTP connection"
[docs] def verbalize_learner_prediction(prediction: Union[str, object] = None, num_predictions: int = 3) -> None: """ Generate and print multiple verbalized versions of a learner's prediction using an LLM verbalizer. This function takes a prediction (either a string or object), uses an LLMVerbalizer to generate three verbalized responses, and prints them. This is useful for inspecting how the model might rephrase or interpret a given prediction. Parameters: prediction (Union[str, object]): The learner's prediction to verbalize. Must not be None. num_predictions (int): Number of prediction ouputs from the verbalizer with default value of 3 Raises: AssertionError: If the prediction is None. """ assert prediction is not None, "Learner prediction cannot be None" verbalizer = LLMVerbalizer() # Insert your access credentials if needed predictions = [verbalizer(text=prediction) for _ in range(num_predictions)] print(predictions)