You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
198 lines
6.9 KiB
198 lines
6.9 KiB
import os
|
|
|
|
import openai
|
|
|
|
# An enum of two modes, TOP_P or TEMPERATURE
|
|
class Mode:
|
|
TOP_P = "top_p"
|
|
TEMPERATURE = "temperature"
|
|
|
|
|
|
class Models:
|
|
DAVINCI = "text-davinci-003"
|
|
CURIE = "text-curie-001"
|
|
|
|
class Model:
|
|
def __init__(self, usage_service):
|
|
self._mode = Mode.TEMPERATURE
|
|
self._temp = 0.6 # Higher value means more random, lower value means more likely to be a coherent sentence
|
|
self._top_p = 0.9 # 1 is equivalent to greedy sampling, 0.1 means that the model will only consider the top 10% of the probability distribution
|
|
self._max_tokens = 4000 # The maximum number of tokens the model can generate
|
|
self._presence_penalty = 0 # Penalize new tokens based on whether they appear in the text so far
|
|
self._frequency_penalty = 0 # Penalize new tokens based on their existing frequency in the text so far. (Higher frequency = lower probability of being chosen.)
|
|
self._best_of = 1 # Number of responses to compare the loglikelihoods of
|
|
self._prompt_min_length = 20
|
|
self._max_conversation_length = 5
|
|
self._model = Models.DAVINCI
|
|
self._low_usage_mode = False
|
|
self.usage_service = usage_service
|
|
self.DAVINCI_ROLES = ["admin", "Admin", "GPT", "gpt"]
|
|
|
|
openai.api_key = os.getenv('OPENAI_TOKEN')
|
|
|
|
# Use the @property and @setter decorators for all the self fields to provide value checking
|
|
|
|
@property
|
|
def low_usage_mode(self):
|
|
return self._low_usage_mode
|
|
|
|
@low_usage_mode.setter
|
|
def low_usage_mode(self, value):
|
|
try:
|
|
value = bool(value)
|
|
except ValueError:
|
|
raise ValueError("low_usage_mode must be a boolean")
|
|
|
|
if value:
|
|
self._model = Models.CURIE
|
|
self.max_tokens = 1900
|
|
else:
|
|
self._model = Models.DAVINCI
|
|
self.max_tokens = 4000
|
|
|
|
@property
|
|
def model(self):
|
|
return self._model
|
|
|
|
@model.setter
|
|
def model(self, model):
|
|
if model not in [Models.DAVINCI, Models.CURIE]:
|
|
raise ValueError("Invalid model, must be text-davinci-003 or text-curie-001")
|
|
self._model = model
|
|
|
|
@property
|
|
def max_conversation_length(self):
|
|
return self._max_conversation_length
|
|
|
|
@max_conversation_length.setter
|
|
def max_conversation_length(self, value):
|
|
value = int(value)
|
|
if value < 1:
|
|
raise ValueError("Max conversation length must be greater than 1")
|
|
if value > 30:
|
|
raise ValueError("Max conversation length must be less than 30, this will start using credits quick.")
|
|
self._max_conversation_length = value
|
|
|
|
@property
|
|
def mode(self):
|
|
return self._mode
|
|
|
|
@mode.setter
|
|
def mode(self, value):
|
|
if value not in [Mode.TOP_P, Mode.TEMPERATURE]:
|
|
raise ValueError("mode must be either 'top_p' or 'temperature'")
|
|
if value == Mode.TOP_P:
|
|
self._top_p = 0.1
|
|
self._temp = 0.7
|
|
elif value == Mode.TEMPERATURE:
|
|
self._top_p = 0.9
|
|
self._temp = 0.6
|
|
|
|
self._mode = value
|
|
|
|
@property
|
|
def temp(self):
|
|
return self._temp
|
|
|
|
@temp.setter
|
|
def temp(self, value):
|
|
value = float(value)
|
|
if value < 0 or value > 1:
|
|
raise ValueError("temperature must be greater than 0 and less than 1, it is currently " + str(value))
|
|
|
|
self._temp = value
|
|
|
|
@property
|
|
def top_p(self):
|
|
return self._top_p
|
|
|
|
@top_p.setter
|
|
def top_p(self, value):
|
|
value = float(value)
|
|
if value < 0 or value > 1:
|
|
raise ValueError("top_p must be greater than 0 and less than 1, it is currently " + str(value))
|
|
self._top_p = value
|
|
|
|
@property
|
|
def max_tokens(self):
|
|
return self._max_tokens
|
|
|
|
@max_tokens.setter
|
|
def max_tokens(self, value):
|
|
value = int(value)
|
|
if value < 15 or value > 4096:
|
|
raise ValueError("max_tokens must be greater than 15 and less than 4096, it is currently " + str(value))
|
|
self._max_tokens = value
|
|
|
|
@property
|
|
def presence_penalty(self):
|
|
return self._presence_penalty
|
|
|
|
@presence_penalty.setter
|
|
def presence_penalty(self, value):
|
|
if int(value) < 0:
|
|
raise ValueError("presence_penalty must be greater than 0, it is currently " + str(value))
|
|
self._presence_penalty = value
|
|
|
|
@property
|
|
def frequency_penalty(self):
|
|
return self._frequency_penalty
|
|
|
|
@frequency_penalty.setter
|
|
def frequency_penalty(self, value):
|
|
if int(value) < 0:
|
|
raise ValueError("frequency_penalty must be greater than 0, it is currently " + str(value))
|
|
self._frequency_penalty = value
|
|
|
|
@property
|
|
def best_of(self):
|
|
return self._best_of
|
|
|
|
@best_of.setter
|
|
def best_of(self, value):
|
|
value = int(value)
|
|
if value < 1 or value > 3:
|
|
raise ValueError(
|
|
"best_of must be greater than 0 and ideally less than 3 to save tokens, it is currently " + str(value))
|
|
self._best_of = value
|
|
|
|
@property
|
|
def prompt_min_length(self):
|
|
return self._prompt_min_length
|
|
|
|
@prompt_min_length.setter
|
|
def prompt_min_length(self, value):
|
|
value = int(value)
|
|
if value < 10 or value > 4096:
|
|
raise ValueError(
|
|
"prompt_min_length must be greater than 10 and less than 4096, it is currently " + str(value))
|
|
self._prompt_min_length = value
|
|
|
|
def send_request(self, prompt, message):
|
|
# Validate that all the parameters are in a good state before we send the request
|
|
if len(prompt) < self.prompt_min_length:
|
|
raise ValueError("Prompt must be greater than 25 characters, it is currently " + str(len(prompt)))
|
|
|
|
|
|
print("The prompt about to be sent is " + prompt)
|
|
prompt_tokens = self.usage_service.count_tokens(prompt)
|
|
print(f"The prompt tokens will be {prompt_tokens}")
|
|
print(f"The total max tokens will then be {self.max_tokens - prompt_tokens}")
|
|
|
|
response = openai.Completion.create(
|
|
model=Models.DAVINCI if any(role.name in self.DAVINCI_ROLES for role in message.author.roles) else self.model, # Davinci override for admin users
|
|
prompt=prompt,
|
|
temperature=self.temp,
|
|
top_p=self.top_p,
|
|
max_tokens=self.max_tokens - prompt_tokens,
|
|
presence_penalty=self.presence_penalty,
|
|
frequency_penalty=self.frequency_penalty,
|
|
best_of=self.best_of,
|
|
)
|
|
print(response.__dict__)
|
|
|
|
# Parse the total tokens used for this request and response pair from the response
|
|
tokens_used = int(response['usage']['total_tokens'])
|
|
self.usage_service.update_usage(tokens_used)
|
|
|
|
return response |