add llamacpp

bentoml · Jul 5, 2024 · a3ced7c · a3ced7c
1 parent ddd7094
commit a3ced7c
Show file tree

Hide file tree

Showing 2,016 changed files with 9,654 additions and 8,487 deletions.
diff --git a/...tos/gemma/2b-instruct-fp16-ad2d/README.md → ...tos/gemma/2b-instruct-fp16-da36/README.md b/...tos/gemma/2b-instruct-fp16-ad2d/README.md → ...tos/gemma/2b-instruct-fp16-da36/README.md
@@ -1,4 +1,4 @@
-# gemma:2b-instruct-fp16-ad2d
+# gemma:2b-instruct-fp16-da36
 
 [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
 [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)

diff --git a/...a/2b-instruct-fp16-ad2d/apis/openapi.yaml → ...a/2b-instruct-fp16-da36/apis/openapi.yaml b/...a/2b-instruct-fp16-ad2d/apis/openapi.yaml → ...a/2b-instruct-fp16-da36/apis/openapi.yaml
@@ -1036,39 +1036,6 @@ paths:
       tags:
       - Service APIs
       x-bentoml-name: generate
-  /chat/:
-    get:
-      operationId: serve_chat_html__get
-      responses:
-        '200':
-          content:
-            application/json:
-              schema: {}
-          description: Successful Response
-      summary: Serve Chat Html
-  /chat/{full_path}:
-    get:
-      operationId: catch_all__full_path__get
-      parameters:
-      - in: path
-        name: full_path
-        required: true
-        schema:
-          title: Full Path
-          type: string
-      responses:
-        '200':
-          content:
-            application/json:
-              schema: {}
-          description: Successful Response
-        '422':
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/HTTPValidationError'
-          description: Validation Error
-      summary: Catch All
   /healthz:
     get:
       description: Health check endpoint. Expecting an empty response with status
@@ -1109,6 +1076,39 @@ paths:
           description: Successful Response
       tags:
       - Infrastructure
+  /ui/:
+    get:
+      operationId: serve_chat_html__get
+      responses:
+        '200':
+          content:
+            application/json:
+              schema: {}
+          description: Successful Response
+      summary: Serve Chat Html
+  /ui/{full_path}:
+    get:
+      operationId: catch_all__full_path__get
+      parameters:
+      - in: path
+        name: full_path
+        required: true
+        schema:
+          title: Full Path
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema: {}
+          description: Successful Response
+        '422':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/HTTPValidationError'
+          description: Validation Error
+      summary: Catch All
   /v1/chat/completions:
     post:
       operationId: create_chat_completion_chat_completions_post

diff --git a/...ma/2b-instruct-fp16-ad2d/apis/schema.json → ...ma/2b-instruct-fp16-da36/apis/schema.json b/...ma/2b-instruct-fp16-ad2d/apis/schema.json → ...ma/2b-instruct-fp16-da36/apis/schema.json
diff --git a/...os/gemma/2b-instruct-fp16-ad2d/bento.yaml → ...os/gemma/2b-instruct-fp16-da36/bento.yaml b/...os/gemma/2b-instruct-fp16-ad2d/bento.yaml → ...os/gemma/2b-instruct-fp16-da36/bento.yaml
@@ -1,14 +1,14 @@
 service: service:VLLM
 name: gemma
-version: 2b-instruct-fp16-ad2d
+version: 2b-instruct-fp16-da36
 bentoml_version: 1.2.19
-creation_time: '2024-07-03T09:42:28.113622+00:00'
+creation_time: '2024-07-05T07:31:05.934035+00:00'
 labels:
   openllm_alias: 2b,2b-instruct
   openllm_hf_model_id: google/gemma-2b-it
   owner: bentoml-team
   platforms: linux
-  source: https://github.com/bentoml/openllm-repo-recipe/tree/main/vllm-chat
+  source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat
 models: []
 runners: []
 entry_service: gemma

diff --git a/...-instruct-fp16-ad2d/env/docker/Dockerfile → ...-instruct-fp16-da36/env/docker/Dockerfile b/...-instruct-fp16-ad2d/env/docker/Dockerfile → ...-instruct-fp16-da36/env/docker/Dockerfile
diff --git a/...struct-fp16-ad2d/env/docker/entrypoint.sh → ...struct-fp16-da36/env/docker/entrypoint.sh b/...struct-fp16-ad2d/env/docker/entrypoint.sh → ...struct-fp16-da36/env/docker/entrypoint.sh
diff --git a/...-instruct-fp16-ad2d/env/python/install.sh → ...-instruct-fp16-da36/env/python/install.sh b/...-instruct-fp16-ad2d/env/python/install.sh → ...-instruct-fp16-da36/env/python/install.sh
diff --git a/...bit-5b23/env/python/requirements.lock.txt → ...p16-da36/env/python/requirements.lock.txt b/...bit-5b23/env/python/requirements.lock.txt → ...p16-da36/env/python/requirements.lock.txt
@@ -9,13 +9,13 @@ attrs==23.2.0
 bentoml==1.2.19
 build==1.2.1
 cattrs==23.1.2
-certifi==2024.6.2
+certifi==2024.7.4
 charset-normalizer==3.3.2
 circus==0.18.0
 click==8.1.7
 click-option-group==0.5.6
 cloudpickle==3.0.0
-cmake==3.29.6
+cmake==3.30.0
 deepmerge==1.1.1
 deprecated==1.2.14
 diskcache==5.6.3
@@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150
 nvidia-nccl-cu12==2.20.5
 nvidia-nvjitlink-cu12==12.5.82
 nvidia-nvtx-cu12==12.1.105
-openai==1.35.9
+openai==1.35.10
 opentelemetry-api==1.20.0
 opentelemetry-instrumentation==0.41b0
 opentelemetry-instrumentation-aiohttp-client==0.41b0
@@ -89,8 +89,8 @@ prometheus-fastapi-instrumentator==7.0.0
 protobuf==5.27.2
 psutil==6.0.0
 py-cpuinfo==9.0.0
-pydantic==2.8.0
-pydantic-core==2.20.0
+pydantic==2.8.2
+pydantic-core==2.20.1
 pygments==2.18.0
 pyparsing==3.1.2
 pyproject-hooks==1.1.0

diff --git a/...uct-fp16-ad2d/env/python/requirements.txt → ...uct-fp16-da36/env/python/requirements.txt b/...uct-fp16-ad2d/env/python/requirements.txt → ...uct-fp16-da36/env/python/requirements.txt
diff --git a/...instruct-fp16-ad2d/env/python/version.txt → ...instruct-fp16-da36/env/python/version.txt b/...instruct-fp16-ad2d/env/python/version.txt → ...instruct-fp16-da36/env/python/version.txt
diff --git a/...instruct-fp16-ad2d/src/bento_constants.py → ...instruct-fp16-da36/src/bento_constants.py b/...instruct-fp16-ad2d/src/bento_constants.py → ...instruct-fp16-da36/src/bento_constants.py
diff --git a/.../2b-instruct-fp16-ad2d/src/bentofile.yaml → .../2b-instruct-fp16-da36/src/bentofile.yaml b/.../2b-instruct-fp16-ad2d/src/bentofile.yaml → .../2b-instruct-fp16-da36/src/bentofile.yaml
@@ -32,7 +32,7 @@ labels:
   openllm_hf_model_id: google/gemma-2b-it
   owner: bentoml-team
   platforms: linux
-  source: https://github.com/bentoml/openllm-repo-recipe/tree/main/vllm-chat
+  source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat
 models: []
 name: null
 python:

diff --git a/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja b/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja
diff --git a/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja b/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja
diff --git a/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja b/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja
diff --git a/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja b/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja
diff --git a/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja b/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja
diff --git a/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja b/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja
diff --git a/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja b/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja
diff --git a/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja b/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja
diff --git a/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja b/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja
diff --git a/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja b/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja
diff --git a/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja b/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja
diff --git a/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja b/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja
diff --git a/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja b/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja
diff --git a/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja b/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja
diff --git a/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja b/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja
diff --git a/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json b/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json
diff --git a/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json b/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json
diff --git a/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json b/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json
diff --git a/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json b/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json
diff --git a/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json b/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json
diff --git a/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json b/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json
diff --git a/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json b/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json
diff --git a/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json b/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json
diff --git a/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json b/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json
diff --git a/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json b/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json
diff --git a/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json b/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json
diff --git a/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json b/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json
diff --git a/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json b/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json
diff --git a/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json b/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json
diff --git a/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json b/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json
diff --git a/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json b/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json
diff --git a/...emma/2b-instruct-fp16-ad2d/src/service.py → ...emma/2b-instruct-fp16-da36/src/service.py b/...emma/2b-instruct-fp16-ad2d/src/service.py → ...emma/2b-instruct-fp16-da36/src/service.py
@@ -85,7 +85,7 @@ async def catch_all(full_path: str):
 
 
 @bentoml.mount_asgi_app(openai_api_app, path="/v1")
-@bentoml.mount_asgi_app(ui_app, path="/chat")
+@bentoml.mount_asgi_app(ui_app, path="/ui")
 @bentoml.service(**SERVICE_CONFIG)
 class VLLM:
     def __init__(self) -> None:

diff --git a/...mma/2b-instruct-fp16-ad2d/src/ui/404.html → ...mma/2b-instruct-fp16-da36/src/ui/404.html b/...mma/2b-instruct-fp16-ad2d/src/ui/404.html → ...mma/2b-instruct-fp16-da36/src/ui/404.html
diff --git a/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js
diff --git a/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js
diff --git a/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js b/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js
diff --git a/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js b/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js
diff --git a/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js
diff --git a/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js b/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js
diff --git a/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js b/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js
diff --git a/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js b/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js
diff --git a/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js b/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js
diff --git a/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js b/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js
diff --git a/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js b/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js
diff --git a/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js b/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js
diff --git a/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js b/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js
diff --git a/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js b/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js
diff --git a/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js b/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js
diff --git a/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js b/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js
diff --git a/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js b/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js
diff --git a/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js b/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js
diff --git a/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js b/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js
diff --git a/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js b/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js
diff --git a/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js b/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js
diff --git a/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js b/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js
diff --git a/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js b/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js
diff --git a/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js b/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js
diff --git a/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js b/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js
diff --git a/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js b/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js
diff --git a/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js b/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js
diff --git a/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js b/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js
diff --git a/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css b/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css
diff --git a/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css b/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css
diff --git a/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css b/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css
diff --git a/...uct-fp16-ad2d/src/ui/apple-touch-icon.png → ...uct-fp16-da36/src/ui/apple-touch-icon.png b/...uct-fp16-ad2d/src/ui/apple-touch-icon.png → ...uct-fp16-da36/src/ui/apple-touch-icon.png
diff --git a/...ma/2b-instruct-fp16-ad2d/src/ui/chat.html → ...ma/2b-instruct-fp16-da36/src/ui/chat.html b/...ma/2b-instruct-fp16-ad2d/src/ui/chat.html → ...ma/2b-instruct-fp16-da36/src/ui/chat.html
diff --git a/...mma/2b-instruct-fp16-ad2d/src/ui/chat.txt → ...mma/2b-instruct-fp16-da36/src/ui/chat.txt b/...mma/2b-instruct-fp16-ad2d/src/ui/chat.txt → ...mma/2b-instruct-fp16-da36/src/ui/chat.txt
diff --git a/...struct-fp16-ad2d/src/ui/favicon-16x16.png → ...struct-fp16-da36/src/ui/favicon-16x16.png b/...struct-fp16-ad2d/src/ui/favicon-16x16.png → ...struct-fp16-da36/src/ui/favicon-16x16.png
diff --git a/.../2b-instruct-fp16-ad2d/src/ui/favicon.ico → .../2b-instruct-fp16-da36/src/ui/favicon.ico b/.../2b-instruct-fp16-ad2d/src/ui/favicon.ico → .../2b-instruct-fp16-da36/src/ui/favicon.ico
diff --git a/...a/2b-instruct-fp16-ad2d/src/ui/index.html → ...a/2b-instruct-fp16-da36/src/ui/index.html b/...a/2b-instruct-fp16-ad2d/src/ui/index.html → ...a/2b-instruct-fp16-da36/src/ui/index.html
diff --git a/...ma/2b-instruct-fp16-ad2d/src/ui/index.txt → ...ma/2b-instruct-fp16-da36/src/ui/index.txt b/...ma/2b-instruct-fp16-ad2d/src/ui/index.txt → ...ma/2b-instruct-fp16-da36/src/ui/index.txt
diff --git a/...gemma/7b-instruct-awq-4bit-5b23/README.md → ...gemma/7b-instruct-awq-4bit-6a74/README.md b/...gemma/7b-instruct-awq-4bit-5b23/README.md → ...gemma/7b-instruct-awq-4bit-6a74/README.md
@@ -1,4 +1,4 @@
-# gemma:7b-instruct-awq-4bit-5b23
+# gemma:7b-instruct-awq-4bit-6a74
 
 [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
 [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)

diff --git a/...-instruct-awq-4bit-5b23/apis/openapi.yaml → ...-instruct-awq-4bit-6a74/apis/openapi.yaml b/...-instruct-awq-4bit-5b23/apis/openapi.yaml → ...-instruct-awq-4bit-6a74/apis/openapi.yaml
@@ -1036,39 +1036,6 @@ paths:
       tags:
       - Service APIs
       x-bentoml-name: generate
-  /chat/:
-    get:
-      operationId: serve_chat_html__get
-      responses:
-        '200':
-          content:
-            application/json:
-              schema: {}
-          description: Successful Response
-      summary: Serve Chat Html
-  /chat/{full_path}:
-    get:
-      operationId: catch_all__full_path__get
-      parameters:
-      - in: path
-        name: full_path
-        required: true
-        schema:
-          title: Full Path
-          type: string
-      responses:
-        '200':
-          content:
-            application/json:
-              schema: {}
-          description: Successful Response
-        '422':
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/HTTPValidationError'
-          description: Validation Error
-      summary: Catch All
   /healthz:
     get:
       description: Health check endpoint. Expecting an empty response with status
@@ -1109,6 +1076,39 @@ paths:
           description: Successful Response
       tags:
       - Infrastructure
+  /ui/:
+    get:
+      operationId: serve_chat_html__get
+      responses:
+        '200':
+          content:
+            application/json:
+              schema: {}
+          description: Successful Response
+      summary: Serve Chat Html
+  /ui/{full_path}:
+    get:
+      operationId: catch_all__full_path__get
+      parameters:
+      - in: path
+        name: full_path
+        required: true
+        schema:
+          title: Full Path
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema: {}
+          description: Successful Response
+        '422':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/HTTPValidationError'
+          description: Validation Error
+      summary: Catch All
   /v1/chat/completions:
     post:
       operationId: create_chat_completion_chat_completions_post

diff --git a/...b-instruct-awq-4bit-5b23/apis/schema.json → ...b-instruct-awq-4bit-6a74/apis/schema.json b/...b-instruct-awq-4bit-5b23/apis/schema.json → ...b-instruct-awq-4bit-6a74/apis/schema.json
diff --git a/...emma/7b-instruct-awq-4bit-5b23/bento.yaml → ...emma/7b-instruct-awq-4bit-6a74/bento.yaml b/...emma/7b-instruct-awq-4bit-5b23/bento.yaml → ...emma/7b-instruct-awq-4bit-6a74/bento.yaml
@@ -1,14 +1,14 @@
 service: service:VLLM
 name: gemma
-version: 7b-instruct-awq-4bit-5b23
+version: 7b-instruct-awq-4bit-6a74
 bentoml_version: 1.2.19
-creation_time: '2024-07-03T09:43:50.470130+00:00'
+creation_time: '2024-07-05T07:32:14.773611+00:00'
 labels:
   openllm_alias: 7b-4bit,7b-instruct-4bit
   openllm_hf_model_id: casperhansen/gemma-7b-it-awq
   owner: bentoml-team
   platforms: linux
-  source: https://github.com/bentoml/openllm-repo-recipe/tree/main/vllm-chat
+  source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat
 models: []
 runners: []
 entry_service: gemma

diff --git a/...truct-awq-4bit-5b23/env/docker/Dockerfile → ...truct-awq-4bit-6a74/env/docker/Dockerfile b/...truct-awq-4bit-5b23/env/docker/Dockerfile → ...truct-awq-4bit-6a74/env/docker/Dockerfile
diff --git a/...ct-awq-4bit-5b23/env/docker/entrypoint.sh → ...ct-awq-4bit-6a74/env/docker/entrypoint.sh b/...ct-awq-4bit-5b23/env/docker/entrypoint.sh → ...ct-awq-4bit-6a74/env/docker/entrypoint.sh
diff --git a/...truct-awq-4bit-5b23/env/python/install.sh → ...truct-awq-4bit-6a74/env/python/install.sh b/...truct-awq-4bit-5b23/env/python/install.sh → ...truct-awq-4bit-6a74/env/python/install.sh
diff --git a/...p16-262a/env/python/requirements.lock.txt → ...bit-6a74/env/python/requirements.lock.txt b/...p16-262a/env/python/requirements.lock.txt → ...bit-6a74/env/python/requirements.lock.txt
@@ -9,13 +9,13 @@ attrs==23.2.0
 bentoml==1.2.19
 build==1.2.1
 cattrs==23.1.2
-certifi==2024.6.2
+certifi==2024.7.4
 charset-normalizer==3.3.2
 circus==0.18.0
 click==8.1.7
 click-option-group==0.5.6
 cloudpickle==3.0.0
-cmake==3.29.6
+cmake==3.30.0
 deepmerge==1.1.1
 deprecated==1.2.14
 diskcache==5.6.3
@@ -70,7 +70,7 @@ nvidia-ml-py==11.525.150
 nvidia-nccl-cu12==2.20.5
 nvidia-nvjitlink-cu12==12.5.82
 nvidia-nvtx-cu12==12.1.105
-openai==1.35.9
+openai==1.35.10
 opentelemetry-api==1.20.0
 opentelemetry-instrumentation==0.41b0
 opentelemetry-instrumentation-aiohttp-client==0.41b0
@@ -89,8 +89,8 @@ prometheus-fastapi-instrumentator==7.0.0
 protobuf==5.27.2
 psutil==6.0.0
 py-cpuinfo==9.0.0
-pydantic==2.8.0
-pydantic-core==2.20.0
+pydantic==2.8.2
+pydantic-core==2.20.1
 pygments==2.18.0
 pyparsing==3.1.2
 pyproject-hooks==1.1.0

diff --git a/...awq-4bit-5b23/env/python/requirements.txt → ...awq-4bit-6a74/env/python/requirements.txt b/...awq-4bit-5b23/env/python/requirements.txt → ...awq-4bit-6a74/env/python/requirements.txt
diff --git a/...ruct-awq-4bit-5b23/env/python/version.txt → ...ruct-awq-4bit-6a74/env/python/version.txt b/...ruct-awq-4bit-5b23/env/python/version.txt → ...ruct-awq-4bit-6a74/env/python/version.txt
diff --git a/...ruct-awq-4bit-5b23/src/bento_constants.py → ...ruct-awq-4bit-6a74/src/bento_constants.py b/...ruct-awq-4bit-5b23/src/bento_constants.py → ...ruct-awq-4bit-6a74/src/bento_constants.py
diff --git a/...instruct-awq-4bit-5b23/src/bentofile.yaml → ...instruct-awq-4bit-6a74/src/bentofile.yaml b/...instruct-awq-4bit-5b23/src/bentofile.yaml → ...instruct-awq-4bit-6a74/src/bentofile.yaml
@@ -32,7 +32,7 @@ labels:
   openllm_hf_model_id: casperhansen/gemma-7b-it-awq
   owner: bentoml-team
   platforms: linux
-  source: https://github.com/bentoml/openllm-repo-recipe/tree/main/vllm-chat
+  source: https://github.com/bentoml/openllm-models-feed/tree/main/source/vllm-chat
 models: []
 name: null
 python:

diff --git a/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja b/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja
diff --git a/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja b/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja
diff --git a/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja b/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja
diff --git a/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja b/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja
diff --git a/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja b/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja
diff --git a/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja b/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja
diff --git a/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja b/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja
diff --git a/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja b/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja
diff --git a/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja b/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja
diff --git a/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja b/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja
diff --git a/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja b/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja
diff --git a/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja b/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja
diff --git a/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja b/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja
diff --git a/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja b/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja
diff --git a/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja b/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja
diff --git a/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json b/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json
diff --git a/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json b/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json
diff --git a/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json b/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json
diff --git a/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json b/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json
diff --git a/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json b/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json
diff --git a/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json b/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json
diff --git a/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json b/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json
diff --git a/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json b/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json
diff --git a/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json b/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json
diff --git a/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json b/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json
diff --git a/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json b/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json
diff --git a/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json b/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json
diff --git a/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json b/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json
diff --git a/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json b/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json
diff --git a/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json b/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json
diff --git a/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json b/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json
diff --git a/.../7b-instruct-awq-4bit-5b23/src/service.py → .../7b-instruct-awq-4bit-6a74/src/service.py b/.../7b-instruct-awq-4bit-5b23/src/service.py → .../7b-instruct-awq-4bit-6a74/src/service.py
@@ -85,7 +85,7 @@ async def catch_all(full_path: str):
 
 
 @bentoml.mount_asgi_app(openai_api_app, path="/v1")
-@bentoml.mount_asgi_app(ui_app, path="/chat")
+@bentoml.mount_asgi_app(ui_app, path="/ui")
 @bentoml.service(**SERVICE_CONFIG)
 class VLLM:
     def __init__(self) -> None:

diff --git a/...7b-instruct-awq-4bit-5b23/src/ui/404.html → ...7b-instruct-awq-4bit-6a74/src/ui/404.html b/...7b-instruct-awq-4bit-5b23/src/ui/404.html → ...7b-instruct-awq-4bit-6a74/src/ui/404.html
diff --git a/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js
diff --git a/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js
diff --git a/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js b/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js
diff --git a/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js b/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js
diff --git a/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js
diff --git a/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js b/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js
diff --git a/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js b/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js
diff --git a/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js b/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js
diff --git a/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js b/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js
diff --git a/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js b/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js
diff --git a/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js b/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js
diff --git a/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js b/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js
diff --git a/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js b/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js
diff --git a/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js b/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js
diff --git a/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js b/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js
diff --git a/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js b/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js
diff --git a/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js b/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js
diff --git a/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js b/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js
diff --git a/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js b/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js
diff --git a/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js b/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js
diff --git a/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js b/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js
diff --git a/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js b/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js
diff --git a/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js b/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js
diff --git a/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js b/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js
diff --git a/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js b/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js
diff --git a/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js b/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js
diff --git a/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js b/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js
diff --git a/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js b/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js
diff --git a/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css b/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css
diff --git a/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css b/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css
diff --git a/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css b/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css
diff --git a/...awq-4bit-5b23/src/ui/apple-touch-icon.png → ...awq-4bit-6a74/src/ui/apple-touch-icon.png b/...awq-4bit-5b23/src/ui/apple-touch-icon.png → ...awq-4bit-6a74/src/ui/apple-touch-icon.png
diff --git a/...b-instruct-awq-4bit-5b23/src/ui/chat.html → ...b-instruct-awq-4bit-6a74/src/ui/chat.html b/...b-instruct-awq-4bit-5b23/src/ui/chat.html → ...b-instruct-awq-4bit-6a74/src/ui/chat.html
diff --git a/...7b-instruct-awq-4bit-5b23/src/ui/chat.txt → ...7b-instruct-awq-4bit-6a74/src/ui/chat.txt b/...7b-instruct-awq-4bit-5b23/src/ui/chat.txt → ...7b-instruct-awq-4bit-6a74/src/ui/chat.txt
diff --git a/...ct-awq-4bit-5b23/src/ui/favicon-16x16.png → ...ct-awq-4bit-6a74/src/ui/favicon-16x16.png b/...ct-awq-4bit-5b23/src/ui/favicon-16x16.png → ...ct-awq-4bit-6a74/src/ui/favicon-16x16.png
diff --git a/...instruct-awq-4bit-5b23/src/ui/favicon.ico → ...instruct-awq-4bit-6a74/src/ui/favicon.ico b/...instruct-awq-4bit-5b23/src/ui/favicon.ico → ...instruct-awq-4bit-6a74/src/ui/favicon.ico
diff --git a/...-instruct-awq-4bit-5b23/src/ui/index.html → ...-instruct-awq-4bit-6a74/src/ui/index.html b/...-instruct-awq-4bit-5b23/src/ui/index.html → ...-instruct-awq-4bit-6a74/src/ui/index.html
diff --git a/...b-instruct-awq-4bit-5b23/src/ui/index.txt → ...b-instruct-awq-4bit-6a74/src/ui/index.txt b/...b-instruct-awq-4bit-5b23/src/ui/index.txt → ...b-instruct-awq-4bit-6a74/src/ui/index.txt
diff --git a/...tos/gemma/7b-instruct-fp16-262a/README.md → ...tos/gemma/7b-instruct-fp16-dafc/README.md b/...tos/gemma/7b-instruct-fp16-262a/README.md → ...tos/gemma/7b-instruct-fp16-dafc/README.md
@@ -1,4 +1,4 @@
-# gemma:7b-instruct-fp16-262a
+# gemma:7b-instruct-fp16-dafc
 
 [![pypi_status](https://img.shields.io/badge/BentoML-1.2.19-informational)](https://pypi.org/project/BentoML)
 [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)