-
Notifications
You must be signed in to change notification settings - Fork 1.1k
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'master' into tohtana/offload_states
- Loading branch information
Showing
205 changed files
with
37,422 additions
and
39 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
57 changes: 57 additions & 0 deletions
57
benchmarks/inference/deepspeedometer/src/deepspeedometer/clients/openai_client.py
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,57 @@ | ||
import os | ||
import json | ||
import requests | ||
import subprocess | ||
import time | ||
from typing import Any, Dict | ||
|
||
from loguru import logger | ||
from pydantic import Field | ||
|
||
from .base import BaseClient | ||
from ..config import BaseConfigModel | ||
from ..prompt import Prompt | ||
|
||
|
||
# Client for benchmarking any OpenAI-compatible completions API | ||
class openaiClientConfig(BaseConfigModel):
    """Settings for the client that talks to an OpenAI-style completions endpoint."""

    # Model identifier; sent as the "model" field of each request payload.
    model: str = Field(..., description="HuggingFace.co model name")

    # Full URL of the completions endpoint that requests are POSTed to.
    url: str = "http://127.0.0.1:26500/v1/completions"
|
||
|
||
class openaiClient(BaseClient):
    """Benchmark client for an already-running OpenAI-style completions endpoint.

    This client does not launch or tear down a server: ``start_service`` and
    ``stop_service`` are no-ops, and requests are sent to ``config.url``.
    """

    def __init__(self, config: openaiClientConfig):
        # presumably the base class stores ``config`` as ``self.config``,
        # which the methods below read — confirm against BaseClient.
        super().__init__(config)

    def start_service(self) -> None:
        """Do nothing; the endpoint is expected to be running already."""
        pass

    def stop_service(self) -> None:
        """Do nothing; this client does not own the endpoint's lifecycle."""
        pass

    def prepare_request(self, prompt: Prompt) -> Dict[str, Any]:
        """Build the keyword arguments for ``requests.post`` for one prompt.

        Args:
            prompt: Supplies the prompt text (``prompt.text``) and the
                generation budget (``prompt.max_new_tokens``).

        Returns:
            A dict with ``url``, ``headers``, ``json`` and ``timeout`` keys,
            ready to be unpacked into ``requests.post``.
        """
        api_url = self.config.url
        headers = {
            "User-Agent": "Benchmark Client",
            "Content-Type": "application/json",
        }
        # Only attach credentials when a key is actually configured; formatting
        # a missing key into the header would send the literal "Bearer None".
        api_key = os.environ.get("OPENAI_API_KEY")
        if api_key:
            headers["Authorization"] = f"Bearer {api_key}"
        # NOTE(review): "use_beam_search" and "ignore_eos" do not appear to be
        # part of the standard OpenAI completions schema (they look like
        # server-specific extensions) — confirm the target server accepts them.
        pload = {
            "prompt": prompt.text,
            "model": self.config.model,
            "n": 1,
            "use_beam_search": False,
            "temperature": 1.0,
            "top_p": 0.9,
            "max_tokens": prompt.max_new_tokens,
            "ignore_eos": False,
        }
        return {"url": api_url, "headers": headers, "json": pload, "timeout": 180}

    def send_request(self, request_kwargs: Dict[str, Any]) -> Any:
        """POST the prepared request and return the decoded JSON body.

        Args:
            request_kwargs: Keyword arguments as produced by
                ``prepare_request``.

        Returns:
            The response body parsed from JSON.

        Raises:
            requests.HTTPError: If the server answers with a 4xx/5xx status.
            json.JSONDecodeError: If the response body is not valid JSON.
        """
        response = requests.post(**request_kwargs)
        # Surface HTTP failures here, with the status code, instead of letting
        # an error payload fail later with an opaque KeyError on "choices".
        response.raise_for_status()
        return json.loads(response.content)

    def process_response(self, raw_response: Any) -> str:
        """Return the generated text of the first choice in the response."""
        return raw_response["choices"][0]["text"]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.