Skip to content

Commit

Permalink
fix(models): chat ui
Browse files Browse the repository at this point in the history
  • Loading branch information
bojiang committed Jul 8, 2024
1 parent fa4f044 commit 32665a4
Show file tree
Hide file tree
Showing 2,017 changed files with 8,478 additions and 8,478 deletions.
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# gemma:2b-instruct-fp16-da36
# gemma:2b-instruct-fp16-26b3

[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1036,6 +1036,39 @@ paths:
tags:
- Service APIs
x-bentoml-name: generate
/chat/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/chat/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/healthz:
get:
description: Health check endpoint. Expecting an empty response with status
Expand Down Expand Up @@ -1076,39 +1109,6 @@ paths:
description: Successful Response
tags:
- Infrastructure
/ui/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/ui/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/v1/chat/completions:
post:
operationId: create_chat_completion_chat_completions_post
Expand Down
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
service: service:VLLM
name: gemma
version: 2b-instruct-fp16-da36
version: 2b-instruct-fp16-26b3
bentoml_version: 1.2.19
creation_time: '2024-07-05T07:31:05.934035+00:00'
creation_time: '2024-07-08T07:57:26.100524+00:00'
labels:
openllm_alias: 2b,2b-instruct
openllm_hf_model_id: google/gemma-2b-it
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -143,5 +143,5 @@ yarl==1.9.4
zipp==3.19.2

# The following packages are considered to be unsafe in a requirements file:
pip==24.1.1
pip==24.1.2
setuptools==70.2.0
Original file line number Diff line number Diff line change
Expand Up @@ -85,7 +85,7 @@ async def catch_all(full_path: str):


@bentoml.mount_asgi_app(openai_api_app, path="/v1")
@bentoml.mount_asgi_app(ui_app, path="/ui")
@bentoml.mount_asgi_app(ui_app, path="/chat")
@bentoml.service(**SERVICE_CONFIG)
class VLLM:
def __init__(self) -> None:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# gemma:7b-instruct-awq-4bit-6a74
# gemma:7b-instruct-awq-4bit-d670

[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1036,6 +1036,39 @@ paths:
tags:
- Service APIs
x-bentoml-name: generate
/chat/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/chat/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/healthz:
get:
description: Health check endpoint. Expecting an empty response with status
Expand Down Expand Up @@ -1076,39 +1109,6 @@ paths:
description: Successful Response
tags:
- Infrastructure
/ui/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/ui/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/v1/chat/completions:
post:
operationId: create_chat_completion_chat_completions_post
Expand Down
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
service: service:VLLM
name: gemma
version: 7b-instruct-awq-4bit-6a74
version: 7b-instruct-awq-4bit-d670
bentoml_version: 1.2.19
creation_time: '2024-07-05T07:32:14.773611+00:00'
creation_time: '2024-07-08T07:59:18.619602+00:00'
labels:
openllm_alias: 7b-4bit,7b-instruct-4bit
openllm_hf_model_id: casperhansen/gemma-7b-it-awq
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -143,5 +143,5 @@ yarl==1.9.4
zipp==3.19.2

# The following packages are considered to be unsafe in a requirements file:
pip==24.1.1
pip==24.1.2
setuptools==70.2.0
Original file line number Diff line number Diff line change
Expand Up @@ -85,7 +85,7 @@ async def catch_all(full_path: str):


@bentoml.mount_asgi_app(openai_api_app, path="/v1")
@bentoml.mount_asgi_app(ui_app, path="/ui")
@bentoml.mount_asgi_app(ui_app, path="/chat")
@bentoml.service(**SERVICE_CONFIG)
class VLLM:
def __init__(self) -> None:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# gemma:7b-instruct-fp16-dafc
# gemma:7b-instruct-fp16-ae3e

[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -1036,6 +1036,39 @@ paths:
tags:
- Service APIs
x-bentoml-name: generate
/chat/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/chat/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/healthz:
get:
description: Health check endpoint. Expecting an empty response with status
Expand Down Expand Up @@ -1076,39 +1109,6 @@ paths:
description: Successful Response
tags:
- Infrastructure
/ui/:
get:
operationId: serve_chat_html__get
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
summary: Serve Chat Html
/ui/{full_path}:
get:
operationId: catch_all__full_path__get
parameters:
- in: path
name: full_path
required: true
schema:
title: Full Path
type: string
responses:
'200':
content:
application/json:
schema: {}
description: Successful Response
'422':
content:
application/json:
schema:
$ref: '#/components/schemas/HTTPValidationError'
description: Validation Error
summary: Catch All
/v1/chat/completions:
post:
operationId: create_chat_completion_chat_completions_post
Expand Down
Original file line number Diff line number Diff line change
@@ -1,8 +1,8 @@
service: service:VLLM
name: gemma
version: 7b-instruct-fp16-dafc
version: 7b-instruct-fp16-ae3e
bentoml_version: 1.2.19
creation_time: '2024-07-05T07:31:38.255529+00:00'
creation_time: '2024-07-08T07:58:22.853090+00:00'
labels:
openllm_alias: 7b,7b-instruct
openllm_hf_model_id: google/gemma-7b-it
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -143,5 +143,5 @@ yarl==1.9.4
zipp==3.19.2

# The following packages are considered to be unsafe in a requirements file:
pip==24.1.1
pip==24.1.2
setuptools==70.2.0
Original file line number Diff line number Diff line change
Expand Up @@ -85,7 +85,7 @@ async def catch_all(full_path: str):


@bentoml.mount_asgi_app(openai_api_app, path="/v1")
@bentoml.mount_asgi_app(ui_app, path="/ui")
@bentoml.mount_asgi_app(ui_app, path="/chat")
@bentoml.service(**SERVICE_CONFIG)
class VLLM:
def __init__(self) -> None:
Expand Down
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# llama2:70b-chat-fp16-4512
# llama2:13b-chat-fp16-4059

[![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
[![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)
Expand Down
Loading

0 comments on commit 32665a4

Please sign in to comment.