Quardo committed on
Commit
d89748a
1 Parent(s): 4b342a9

Updated space.

Browse files
Files changed (1) hide show
  1. app.py +40 -22
app.py CHANGED
@@ -296,25 +296,27 @@ async def streamChat(params):
296
  if message["role"] == "system":
297
  message["role"] = "user"
298
  message["content"] = f"[System: {message['content']}]"
299
- async with aiohttp.ClientSession() as session:
300
- try:
301
- async with session.post(f"{base_url}/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='api_key')}", "Content-Type": "application/json"}, json=params) as r:
302
- r.raise_for_status()
303
- async for line in r.content:
304
- if line:
305
- line_str = line.decode('utf-8')
306
- if line_str.startswith("data: "):
307
- line_str = line_str[6:].strip()
308
- if line_str == "[DONE]":
309
- continue
310
- try:
311
- message = json.loads(line_str)
312
- yield message
313
- except json.JSONDecodeError:
314
- continue
315
- except aiohttp.ClientError:
316
  try:
317
- async with session.post("https://api.openai.com/v1/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='oai_api_key')}", "Content-Type": "application/json"}, json=params) as r:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
318
  r.raise_for_status()
319
  async for line in r.content:
320
  if line:
@@ -329,7 +331,23 @@ async def streamChat(params):
329
  except json.JSONDecodeError:
330
  continue
331
  except aiohttp.ClientError:
332
- return
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
333
 
334
  def imagine(prompt):
335
  try:
@@ -594,15 +612,15 @@ async def respond(
594
 
595
 
596
  handleApiKeys();loadModels();checkModels();loadENV();
597
- lastUpdateMessage = "New API handling (the old one is shutdown)."
598
  demo = gr.ChatInterface(
599
  respond,
600
- title="GPT-4O-mini",
601
  description=f"A OpenAI API proxy!<br/>View API docs [here](/api/v1/docs) <strong>[Yes you can use this as an API in a simpler manner]</strong>.<br/><strong>[Last update: {lastUpdateMessage}]</strong> Also you can only submit images to vision models; txt/code/etc. to all models.",
602
  multimodal=True,
603
  additional_inputs=[
604
  gr.Textbox(value="You are a helpful assistant. You are an OpenAI GPT model. Please adhere to OpenAI's usage policies and guidelines. Ensure your responses are accurate, respectful, and within the scope of OpenAI's rules.", label="System message"),
605
- gr.Dropdown(choices=models, value="gpt-4o-mini-2024-07-18", label="Model"),
606
  gr.Slider(minimum=1, maximum=4096, value=4096, step=1, label="Max new tokens"),
607
  gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.05, label="Temperature"),
608
  gr.Slider(minimum=0.05, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),
 
296
  if message["role"] == "system":
297
  message["role"] = "user"
298
  message["content"] = f"[System: {message['content']}]"
299
+ params["stream"] = False;
300
+ async with aiohttp.ClientSession() as session:
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
301
  try:
302
+ async with session.post(f"{base_url}/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='api_key')}", "Content-Type": "application/json"}, json=params) as r:
303
+ r.raise_for_status()
304
+ response_data = await r.json()
305
+ yield {"choices": [{"delta": {"content": response_data["choices"][0]["message"]["content"]}}]}
306
+ yield {"choices": [{"delta": {"content": "[DONE]"}}]}
307
+ except aiohttp.ClientError:
308
+ try:
309
+ async with session.post("https://api.openai.com/v1/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='oai_api_key')}", "Content-Type": "application/json"}, json=params) as r:
310
+ r.raise_for_status()
311
+ response_data = await r.json()
312
+ yield {"choices": [{"delta": {"content": response_data["choices"][0]["message"]["content"]}}]}
313
+ yield {"choices": [{"delta": {"content": "[DONE]"}}]}
314
+ except aiohttp.ClientError:
315
+ return
316
+ else:
317
+ async with aiohttp.ClientSession() as session:
318
+ try:
319
+ async with session.post(f"{base_url}/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='api_key')}", "Content-Type": "application/json"}, json=params) as r:
320
  r.raise_for_status()
321
  async for line in r.content:
322
  if line:
 
331
  except json.JSONDecodeError:
332
  continue
333
  except aiohttp.ClientError:
334
+ try:
335
+ async with session.post("https://api.openai.com/v1/chat/completions", headers={"Authorization": f"Bearer {get_api_key(call='oai_api_key')}", "Content-Type": "application/json"}, json=params) as r:
336
+ r.raise_for_status()
337
+ async for line in r.content:
338
+ if line:
339
+ line_str = line.decode('utf-8')
340
+ if line_str.startswith("data: "):
341
+ line_str = line_str[6:].strip()
342
+ if line_str == "[DONE]":
343
+ continue
344
+ try:
345
+ message = json.loads(line_str)
346
+ yield message
347
+ except json.JSONDecodeError:
348
+ continue
349
+ except aiohttp.ClientError:
350
+ return
351
 
352
  def imagine(prompt):
353
  try:
 
612
 
613
 
614
  handleApiKeys();loadModels();checkModels();loadENV();
615
+ lastUpdateMessage = "New model support O1-* (no streaming/temp/top-p tho, and a bit edited system prompt thingies)"
616
  demo = gr.ChatInterface(
617
  respond,
618
+ title="O1-preview",
619
  description=f"A OpenAI API proxy!<br/>View API docs [here](/api/v1/docs) <strong>[Yes you can use this as an API in a simpler manner]</strong>.<br/><strong>[Last update: {lastUpdateMessage}]</strong> Also you can only submit images to vision models; txt/code/etc. to all models.",
620
  multimodal=True,
621
  additional_inputs=[
622
  gr.Textbox(value="You are a helpful assistant. You are an OpenAI GPT model. Please adhere to OpenAI's usage policies and guidelines. Ensure your responses are accurate, respectful, and within the scope of OpenAI's rules.", label="System message"),
623
+ gr.Dropdown(choices=models, value="o1-mini", label="Model"),
624
  gr.Slider(minimum=1, maximum=4096, value=4096, step=1, label="Max new tokens"),
625
  gr.Slider(minimum=0.1, maximum=2.0, value=0.7, step=0.05, label="Temperature"),
626
  gr.Slider(minimum=0.05, maximum=1.0, value=0.95, step=0.05, label="Top-p (nucleus sampling)"),