"...composable_kernel.git" did not exist on "dd6a8de48c944e3243bef7db90ae9da07939450f"
Unverified Commit d5d4f473 authored by Haodong Duan's avatar Haodong Duan Committed by GitHub
Browse files

[API] Refine OpenAI (#175)

parent af436f59
...@@ -80,6 +80,7 @@ class OpenAI(BaseAPIModel): ...@@ -80,6 +80,7 @@ class OpenAI(BaseAPIModel):
self.orgs = org self.orgs = org
self.org_ctr = 0 self.org_ctr = 0
self.url = openai_api_base self.url = openai_api_base
self.path = path
def generate( def generate(
self, self,
...@@ -146,9 +147,17 @@ class OpenAI(BaseAPIModel): ...@@ -146,9 +147,17 @@ class OpenAI(BaseAPIModel):
messages.append(msg) messages.append(msg)
# max num token for gpt-3.5-turbo is 4097 # max num token for gpt-3.5-turbo is 4097
context_window = 4096
if '32k' in self.path:
context_window = 32768
elif '16k' in self.path:
context_window = 16384
elif 'gpt-4' in self.path:
context_window = 8192
# Hold out 100 tokens due to potential errors in tiktoken calculation
max_out_len = min( max_out_len = min(
max_out_len, max_out_len, context_window - self.get_token_len(str(input)) - 100)
self.max_seq_len - 50 - self.get_token_len(str(input)))
if max_out_len <= 0: if max_out_len <= 0:
return '' return ''
......
Markdown is supported
0% or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment