feat: Support llama-3.1 405B awq (#6)

bentoml · Jul 24, 2024 · c478576 · c478576
1 parent 5777664
commit c478576
Show file tree

Hide file tree

Showing 604 changed files with 2,879 additions and 40 deletions.
diff --git a/bentoml/bentos/gemma/2b-instruct-fp16-f020/bento.yaml b/bentoml/bentos/gemma/2b-instruct-fp16-f020/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: gemma
 version: 2b-instruct-fp16-f020
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:41:41.538750+00:00'
+creation_time: '2024-07-24T08:19:28.675802+00:00'
 labels:
   model_name: google/gemma-2b-it
   openllm_alias: 2b,2b-instruct

diff --git a/bentoml/bentos/gemma/7b-instruct-awq-4bit-2eed/bento.yaml b/bentoml/bentos/gemma/7b-instruct-awq-4bit-2eed/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: gemma
 version: 7b-instruct-awq-4bit-2eed
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:41:55.950169+00:00'
+creation_time: '2024-07-24T08:19:43.100369+00:00'
 labels:
   model_name: casperhansen/gemma-7b-it-awq
   openllm_alias: 7b-4bit,7b-instruct-4bit

diff --git a/bentoml/bentos/gemma/7b-instruct-fp16-1e96/bento.yaml b/bentoml/bentos/gemma/7b-instruct-fp16-1e96/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: gemma
 version: 7b-instruct-fp16-1e96
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:41:48.722559+00:00'
+creation_time: '2024-07-24T08:19:35.937782+00:00'
 labels:
   model_name: google/gemma-7b-it
   openllm_alias: 7b,7b-instruct

diff --git a/bentoml/bentos/llama2/13b-chat-fp16-603a/bento.yaml b/bentoml/bentos/llama2/13b-chat-fp16-603a/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: llama2
 version: 13b-chat-fp16-603a
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:40:08.002412+00:00'
+creation_time: '2024-07-24T08:17:48.252205+00:00'
 labels:
   model_name: meta-llama/Llama-2-13b-chat-hf
   openllm_alias: 13b,13b-chat

diff --git a/...entos/llama2/70b-chat-fp16-95c5/README.md → ...entos/llama2/70b-chat-fp16-11af/README.md b/...entos/llama2/70b-chat-fp16-95c5/README.md → ...entos/llama2/70b-chat-fp16-11af/README.md
@@ -1,4 +1,4 @@
-# llama2:70b-chat-fp16-95c5
+# llama2:70b-chat-fp16-11af
 
 [![pypi_status](https://img.shields.io/badge/BentoML-1.3.0-informational)](https://pypi.org/project/BentoML)
 [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)

diff --git a/...ama2/70b-chat-fp16-95c5/apis/openapi.yaml → ...ama2/70b-chat-fp16-11af/apis/openapi.yaml b/...ama2/70b-chat-fp16-95c5/apis/openapi.yaml → ...ama2/70b-chat-fp16-11af/apis/openapi.yaml
diff --git a/...lama2/70b-chat-fp16-95c5/apis/schema.json → ...lama2/70b-chat-fp16-11af/apis/schema.json b/...lama2/70b-chat-fp16-95c5/apis/schema.json → ...lama2/70b-chat-fp16-11af/apis/schema.json
diff --git a/...ntos/llama2/70b-chat-fp16-95c5/bento.yaml → ...ntos/llama2/70b-chat-fp16-11af/bento.yaml b/...ntos/llama2/70b-chat-fp16-95c5/bento.yaml → ...ntos/llama2/70b-chat-fp16-11af/bento.yaml
@@ -1,8 +1,8 @@
 service: service:VLLM
 name: llama2
-version: 70b-chat-fp16-95c5
+version: 70b-chat-fp16-11af
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:40:15.203387+00:00'
+creation_time: '2024-07-24T08:17:55.444721+00:00'
 labels:
   model_name: meta-llama/Llama-2-70b-chat-hf
   openllm_alias: 70b,70b-chat

diff --git a/.../70b-chat-fp16-95c5/env/docker/Dockerfile → .../70b-chat-fp16-11af/env/docker/Dockerfile b/.../70b-chat-fp16-95c5/env/docker/Dockerfile → .../70b-chat-fp16-11af/env/docker/Dockerfile
diff --git a/...b-chat-fp16-95c5/env/docker/entrypoint.sh → ...b-chat-fp16-11af/env/docker/entrypoint.sh b/...b-chat-fp16-95c5/env/docker/entrypoint.sh → ...b-chat-fp16-11af/env/docker/entrypoint.sh
diff --git a/.../70b-chat-fp16-95c5/env/python/install.sh → .../70b-chat-fp16-11af/env/python/install.sh b/.../70b-chat-fp16-95c5/env/python/install.sh → .../70b-chat-fp16-11af/env/python/install.sh
diff --git a/...p16-95c5/env/python/requirements.lock.txt → ...p16-11af/env/python/requirements.lock.txt b/...p16-95c5/env/python/requirements.lock.txt → ...p16-11af/env/python/requirements.lock.txt
diff --git a/...hat-fp16-95c5/env/python/requirements.txt → ...hat-fp16-11af/env/python/requirements.txt b/...hat-fp16-95c5/env/python/requirements.txt → ...hat-fp16-11af/env/python/requirements.txt
diff --git a/...70b-chat-fp16-95c5/env/python/version.txt → ...70b-chat-fp16-11af/env/python/version.txt b/...70b-chat-fp16-95c5/env/python/version.txt → ...70b-chat-fp16-11af/env/python/version.txt
diff --git a/...70b-chat-fp16-95c5/src/bento_constants.py → ...70b-chat-fp16-11af/src/bento_constants.py b/...70b-chat-fp16-95c5/src/bento_constants.py → ...70b-chat-fp16-11af/src/bento_constants.py
@@ -5,6 +5,7 @@
   dtype: half
   max_model_len: 1024
   model: meta-llama/Llama-2-70b-chat-hf
+  tensor_parallel_size: 2
 extra_labels:
   model_name: meta-llama/Llama-2-70b-chat-hf
   openllm_alias: 70b,70b-chat

diff --git a/...ma2/70b-chat-fp16-95c5/src/bentofile.yaml → ...ma2/70b-chat-fp16-11af/src/bentofile.yaml b/...ma2/70b-chat-fp16-95c5/src/bentofile.yaml → ...ma2/70b-chat-fp16-11af/src/bentofile.yaml
diff --git a/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja b/...hat_templates/chat_templates/alpaca.jinja → ...hat_templates/chat_templates/alpaca.jinja
diff --git a/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja b/..._templates/chat_templates/amberchat.jinja → ..._templates/chat_templates/amberchat.jinja
diff --git a/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja b/...hat_templates/chat_templates/chatml.jinja → ...hat_templates/chat_templates/chatml.jinja
diff --git a/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja b/...hat_templates/chat_templates/chatqa.jinja → ...hat_templates/chat_templates/chatqa.jinja
diff --git a/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja b/...ates/chat_templates/falcon-instruct.jinja → ...ates/chat_templates/falcon-instruct.jinja
diff --git a/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja b/...t_templates/chat_templates/gemma-it.jinja → ...t_templates/chat_templates/gemma-it.jinja
diff --git a/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja b/...mplates/chat_templates/llama-2-chat.jinja → ...mplates/chat_templates/llama-2-chat.jinja
diff --git a/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja b/...mplates/chat_templates/llama-3-chat.jinja → ...mplates/chat_templates/llama-3-chat.jinja
diff --git a/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja b/...tes/chat_templates/mistral-instruct.jinja → ...tes/chat_templates/mistral-instruct.jinja
diff --git a/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja b/...t_templates/chat_templates/openchat.jinja → ...t_templates/chat_templates/openchat.jinja
diff --git a/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja b/...chat_templates/chat_templates/phi-3.jinja → ...chat_templates/chat_templates/phi-3.jinja
diff --git a/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja b/...chat_templates/chat_templates/saiga.jinja → ...chat_templates/chat_templates/saiga.jinja
diff --git a/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja b/...lates/chat_templates/solar-instruct.jinja → ...lates/chat_templates/solar-instruct.jinja
diff --git a/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja b/...hat_templates/chat_templates/vicuna.jinja → ...hat_templates/chat_templates/vicuna.jinja
diff --git a/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja b/...hat_templates/chat_templates/zephyr.jinja → ...hat_templates/chat_templates/zephyr.jinja
diff --git a/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json b/..._templates/generation_configs/alpaca.json → ..._templates/generation_configs/alpaca.json
diff --git a/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json b/...mplates/generation_configs/amberchat.json → ...mplates/generation_configs/amberchat.json
diff --git a/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json b/..._templates/generation_configs/chatqa.json → ..._templates/generation_configs/chatqa.json
diff --git a/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json b/...emplates/generation_configs/gemma-it.json → ...emplates/generation_configs/gemma-it.json
diff --git a/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json b/...ates/generation_configs/llama-2-chat.json → ...ates/generation_configs/llama-2-chat.json
diff --git a/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json b/...ates/generation_configs/llama-3-chat.json → ...ates/generation_configs/llama-3-chat.json
diff --git a/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json b/.../generation_configs/mistral-instruct.json → .../generation_configs/mistral-instruct.json
diff --git a/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json b/...emplates/generation_configs/openchat.json → ...emplates/generation_configs/openchat.json
diff --git a/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json b/..._templates/generation_configs/orca-2.json → ..._templates/generation_configs/orca-2.json
diff --git a/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json b/...t_templates/generation_configs/phi-3.json → ...t_templates/generation_configs/phi-3.json
diff --git a/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json b/...plates/generation_configs/qwen2-chat.json → ...plates/generation_configs/qwen2-chat.json
diff --git a/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json b/...t_templates/generation_configs/saiga.json → ...t_templates/generation_configs/saiga.json
diff --git a/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json b/...es/generation_configs/solar-instruct.json → ...es/generation_configs/solar-instruct.json
diff --git a/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json b/..._templates/generation_configs/vicuna.json → ..._templates/generation_configs/vicuna.json
diff --git a/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json b/...templates/generation_configs/yi-chat.json → ...templates/generation_configs/yi-chat.json
diff --git a/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json b/..._templates/generation_configs/zephyr.json → ..._templates/generation_configs/zephyr.json
diff --git a/.../llama2/70b-chat-fp16-95c5/src/service.py → .../llama2/70b-chat-fp16-11af/src/service.py b/.../llama2/70b-chat-fp16-95c5/src/service.py → .../llama2/70b-chat-fp16-11af/src/service.py
diff --git a/...llama2/70b-chat-fp16-95c5/src/ui/404.html → ...llama2/70b-chat-fp16-11af/src/ui/404.html b/...llama2/70b-chat-fp16-95c5/src/ui/404.html → ...llama2/70b-chat-fp16-11af/src/ui/404.html
diff --git a/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js b/...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js → ...c/UFSnOXBHq5ysU6-5BuENB/_buildManifest.js
diff --git a/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js b/...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js → ...tic/UFSnOXBHq5ysU6-5BuENB/_ssgManifest.js
diff --git a/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js b/...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js → ...tatic/chunks/0e5ce63c-f5957df8d97fa48f.js
diff --git a/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js b/...tatic/chunks/370b0802-87e84e603248538e.js → ...tatic/chunks/370b0802-87e84e603248538e.js
diff --git a/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js b/...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js → ...tatic/chunks/3d47b92a-f8bda4b39f1e2d9d.js
diff --git a/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js b/...tatic/chunks/479ba886-0c92f49cb8e74e58.js → ...tatic/chunks/479ba886-0c92f49cb8e74e58.js
diff --git a/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js b/...tatic/chunks/59650de3-87b10f0662b51900.js → ...tatic/chunks/59650de3-87b10f0662b51900.js
diff --git a/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js b/...tatic/chunks/66ec4792-34336521b476aa45.js → ...tatic/chunks/66ec4792-34336521b476aa45.js
diff --git a/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js b/...ext/static/chunks/674-a1fcdac3696c5ed0.js → ...ext/static/chunks/674-a1fcdac3696c5ed0.js
diff --git a/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js b/...next/static/chunks/69-bf2efb63b1299e3b.js → ...next/static/chunks/69-bf2efb63b1299e3b.js
diff --git a/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js b/...ext/static/chunks/700-532b1fe2415e5859.js → ...ext/static/chunks/700-532b1fe2415e5859.js
diff --git a/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js b/...ext/static/chunks/899-fa939dd99dc7a1df.js → ...ext/static/chunks/899-fa939dd99dc7a1df.js
diff --git a/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js b/...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js → ...tatic/chunks/8e1d74a4-a6b9a2554f9153c0.js
diff --git a/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js b/...tatic/chunks/94730671-0f73873f7f5896de.js → ...tatic/chunks/94730671-0f73873f7f5896de.js
diff --git a/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js b/...ext/static/chunks/995-34374f39bb210839.js → ...ext/static/chunks/995-34374f39bb210839.js
diff --git a/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js b/...hunks/app/(site)/page-5b6e14439f55739b.js → ...hunks/app/(site)/page-5b6e14439f55739b.js
diff --git a/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js b/.../chunks/app/chat/page-9c8e223f40771eb6.js → .../chunks/app/chat/page-9c8e223f40771eb6.js
diff --git a/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js b/...tic/chunks/app/layout-df2dea9dba0ceb06.js → ...tic/chunks/app/layout-df2dea9dba0ceb06.js
diff --git a/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js b/.../chunks/app/not-found-c76dccfb8b88da53.js → .../chunks/app/not-found-c76dccfb8b88da53.js
diff --git a/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js b/...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js → ...tatic/chunks/d3ac728e-0c798b3b8aa3bf53.js
diff --git a/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js b/...tatic/chunks/fd9d1056-32c33f3919735051.js → ...tatic/chunks/fd9d1056-32c33f3919735051.js
diff --git a/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js b/...atic/chunks/framework-00a8ba1a63cfdc9e.js → ...atic/chunks/framework-00a8ba1a63cfdc9e.js
diff --git a/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js b/...tatic/chunks/main-app-e95f89b5006af8a8.js → ...tatic/chunks/main-app-e95f89b5006af8a8.js
diff --git a/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js b/...xt/static/chunks/main-bf1416cb53f2b4c0.js → ...xt/static/chunks/main-bf1416cb53f2b4c0.js
diff --git a/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js b/...tic/chunks/pages/_app-d21e88acd55d90f1.js → ...tic/chunks/pages/_app-d21e88acd55d90f1.js
diff --git a/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js b/...c/chunks/pages/_error-d6107f1aac0c574c.js → ...c/chunks/pages/_error-d6107f1aac0c574c.js
diff --git a/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js b/...atic/chunks/polyfills-c67a75d1b6f99dc8.js → ...atic/chunks/polyfills-c67a75d1b6f99dc8.js
diff --git a/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js b/...static/chunks/webpack-ee8b17d5a5297ccd.js → ...static/chunks/webpack-ee8b17d5a5297ccd.js
diff --git a/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css b/.../ui/_next/static/css/429544bd3cd8ce3a.css → .../ui/_next/static/css/429544bd3cd8ce3a.css
diff --git a/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css b/.../ui/_next/static/css/5b67f082b31cfc7b.css → .../ui/_next/static/css/5b67f082b31cfc7b.css
diff --git a/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css b/.../ui/_next/static/css/9e63023b20ddb15e.css → .../ui/_next/static/css/9e63023b20ddb15e.css
diff --git a/...hat-fp16-95c5/src/ui/apple-touch-icon.png → ...hat-fp16-11af/src/ui/apple-touch-icon.png b/...hat-fp16-95c5/src/ui/apple-touch-icon.png → ...hat-fp16-11af/src/ui/apple-touch-icon.png
diff --git a/...lama2/70b-chat-fp16-95c5/src/ui/chat.html → ...lama2/70b-chat-fp16-11af/src/ui/chat.html b/...lama2/70b-chat-fp16-95c5/src/ui/chat.html → ...lama2/70b-chat-fp16-11af/src/ui/chat.html
diff --git a/...llama2/70b-chat-fp16-95c5/src/ui/chat.txt → ...llama2/70b-chat-fp16-11af/src/ui/chat.txt b/...llama2/70b-chat-fp16-95c5/src/ui/chat.txt → ...llama2/70b-chat-fp16-11af/src/ui/chat.txt
diff --git a/...b-chat-fp16-95c5/src/ui/favicon-16x16.png → ...b-chat-fp16-11af/src/ui/favicon-16x16.png b/...b-chat-fp16-95c5/src/ui/favicon-16x16.png → ...b-chat-fp16-11af/src/ui/favicon-16x16.png
diff --git a/...ma2/70b-chat-fp16-95c5/src/ui/favicon.ico → ...ma2/70b-chat-fp16-11af/src/ui/favicon.ico b/...ma2/70b-chat-fp16-95c5/src/ui/favicon.ico → ...ma2/70b-chat-fp16-11af/src/ui/favicon.ico
diff --git a/...ama2/70b-chat-fp16-95c5/src/ui/index.html → ...ama2/70b-chat-fp16-11af/src/ui/index.html b/...ama2/70b-chat-fp16-95c5/src/ui/index.html → ...ama2/70b-chat-fp16-11af/src/ui/index.html
diff --git a/...lama2/70b-chat-fp16-95c5/src/ui/index.txt → ...lama2/70b-chat-fp16-11af/src/ui/index.txt b/...lama2/70b-chat-fp16-95c5/src/ui/index.txt → ...lama2/70b-chat-fp16-11af/src/ui/index.txt
diff --git a/bentoml/bentos/llama2/7b-chat-awq-4bit-c733/bento.yaml b/bentoml/bentos/llama2/7b-chat-awq-4bit-c733/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: llama2
 version: 7b-chat-awq-4bit-c733
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:40:22.459480+00:00'
+creation_time: '2024-07-24T08:18:02.586833+00:00'
 labels:
   model_name: TheBloke/Llama-2-7B-Chat-AWQ
   openllm_alias: 7b-4bit,7b-chat-4bit

diff --git a/bentoml/bentos/llama2/7b-chat-fp16-b8c6/bento.yaml b/bentoml/bentos/llama2/7b-chat-fp16-b8c6/bento.yaml
@@ -2,7 +2,7 @@ service: service:VLLM
 name: llama2
 version: 7b-chat-fp16-b8c6
 bentoml_version: 1.3.0
-creation_time: '2024-07-24T01:40:00.852316+00:00'
+creation_time: '2024-07-24T08:17:41.042045+00:00'
 labels:
   model_name: meta-llama/Llama-2-7b-chat-hf
   openllm_alias: 7b,7b-chat

diff --git a/...al/8x7b-instruct-v0.1-fp16-39ff/README.md → ...3.1/405b-instruct-awq-4bit-a733/README.md b/...al/8x7b-instruct-v0.1-fp16-39ff/README.md → ...3.1/405b-instruct-awq-4bit-a733/README.md
@@ -1,4 +1,4 @@
-# mixtral:8x7b-instruct-v0.1-fp16-39ff
+# llama3.1:405b-instruct-awq-4bit-a733
 
 [![pypi_status](https://img.shields.io/badge/BentoML-1.3.0-informational)](https://pypi.org/project/BentoML)
 [![documentation_status](https://readthedocs.org/projects/bentoml/badge/?version=latest)](https://docs.bentoml.com/)