Skip to content

Commit 32665a4

Browse files
committed
fix(models): chat ui
1 parent fa4f044 commit 32665a4

File tree

2,017 files changed

+8478
-8478
lines changed

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

2,017 files changed

+8478
-8478
lines changed

bentoml/bentos/gemma/2b-instruct-fp16-da36/README.md renamed to bentoml/bentos/gemma/2b-instruct-fp16-26b3/README.md

+1-1

bentoml/bentos/gemma/2b-instruct-fp16-da36/apis/openapi.yaml renamed to bentoml/bentos/gemma/2b-instruct-fp16-26b3/apis/openapi.yaml

+33-33
Original file line number | Diff line number | Diff line change
@@ -1036,6 +1036,39 @@ paths:
10361036
tags:
10371037
- Service APIs
10381038
x-bentoml-name: generate
1039+
/chat/:
1040+
get:
1041+
operationId: serve_chat_html__get
1042+
responses:
1043+
'200':
1044+
content:
1045+
application/json:
1046+
schema: {}
1047+
description: Successful Response
1048+
summary: Serve Chat Html
1049+
/chat/{full_path}:
1050+
get:
1051+
operationId: catch_all__full_path__get
1052+
parameters:
1053+
- in: path
1054+
name: full_path
1055+
required: true
1056+
schema:
1057+
title: Full Path
1058+
type: string
1059+
responses:
1060+
'200':
1061+
content:
1062+
application/json:
1063+
schema: {}
1064+
description: Successful Response
1065+
'422':
1066+
content:
1067+
application/json:
1068+
schema:
1069+
$ref: '#/components/schemas/HTTPValidationError'
1070+
description: Validation Error
1071+
summary: Catch All
10391072
/healthz:
10401073
get:
10411074
description: Health check endpoint. Expecting an empty response with status
@@ -1076,39 +1109,6 @@ paths:
10761109
description: Successful Response
10771110
tags:
10781111
- Infrastructure
1079-
/ui/:
1080-
get:
1081-
operationId: serve_chat_html__get
1082-
responses:
1083-
'200':
1084-
content:
1085-
application/json:
1086-
schema: {}
1087-
description: Successful Response
1088-
summary: Serve Chat Html
1089-
/ui/{full_path}:
1090-
get:
1091-
operationId: catch_all__full_path__get
1092-
parameters:
1093-
- in: path
1094-
name: full_path
1095-
required: true
1096-
schema:
1097-
title: Full Path
1098-
type: string
1099-
responses:
1100-
'200':
1101-
content:
1102-
application/json:
1103-
schema: {}
1104-
description: Successful Response
1105-
'422':
1106-
content:
1107-
application/json:
1108-
schema:
1109-
$ref: '#/components/schemas/HTTPValidationError'
1110-
description: Validation Error
1111-
summary: Catch All
11121112
/v1/chat/completions:
11131113
post:
11141114
operationId: create_chat_completion_chat_completions_post

bentoml/bentos/gemma/2b-instruct-fp16-da36/bento.yaml renamed to bentoml/bentos/gemma/2b-instruct-fp16-26b3/bento.yaml

+2-2
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
service: service:VLLM
22
name: gemma
3-
version: 2b-instruct-fp16-da36
3+
version: 2b-instruct-fp16-26b3
44
bentoml_version: 1.2.19
5-
creation_time: '2024-07-05T07:31:05.934035+00:00'
5+
creation_time: '2024-07-08T07:57:26.100524+00:00'
66
labels:
77
openllm_alias: 2b,2b-instruct
88
openllm_hf_model_id: google/gemma-2b-it

bentoml/bentos/gemma/7b-instruct-awq-4bit-6a74/env/python/requirements.lock.txt renamed to bentoml/bentos/gemma/2b-instruct-fp16-26b3/env/python/requirements.lock.txt

+1-1
Original file line number | Diff line number | Diff line change
@@ -143,5 +143,5 @@ yarl==1.9.4
143143
zipp==3.19.2
144144

145145
# The following packages are considered to be unsafe in a requirements file:
146-
pip==24.1.1
146+
pip==24.1.2
147147
setuptools==70.2.0

bentoml/bentos/gemma/2b-instruct-fp16-da36/src/service.py renamed to bentoml/bentos/gemma/2b-instruct-fp16-26b3/src/service.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -85,7 +85,7 @@ async def catch_all(full_path: str):
8585

8686

8787
@bentoml.mount_asgi_app(openai_api_app, path="/v1")
88-
@bentoml.mount_asgi_app(ui_app, path="/ui")
88+
@bentoml.mount_asgi_app(ui_app, path="/chat")
8989
@bentoml.service(**SERVICE_CONFIG)
9090
class VLLM:
9191
def __init__(self) -> None:

bentoml/bentos/gemma/7b-instruct-awq-4bit-6a74/README.md renamed to bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/README.md

+1-1

bentoml/bentos/gemma/7b-instruct-awq-4bit-6a74/apis/openapi.yaml renamed to bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/apis/openapi.yaml

+33-33
Original file line number | Diff line number | Diff line change
@@ -1036,6 +1036,39 @@ paths:
10361036
tags:
10371037
- Service APIs
10381038
x-bentoml-name: generate
1039+
/chat/:
1040+
get:
1041+
operationId: serve_chat_html__get
1042+
responses:
1043+
'200':
1044+
content:
1045+
application/json:
1046+
schema: {}
1047+
description: Successful Response
1048+
summary: Serve Chat Html
1049+
/chat/{full_path}:
1050+
get:
1051+
operationId: catch_all__full_path__get
1052+
parameters:
1053+
- in: path
1054+
name: full_path
1055+
required: true
1056+
schema:
1057+
title: Full Path
1058+
type: string
1059+
responses:
1060+
'200':
1061+
content:
1062+
application/json:
1063+
schema: {}
1064+
description: Successful Response
1065+
'422':
1066+
content:
1067+
application/json:
1068+
schema:
1069+
$ref: '#/components/schemas/HTTPValidationError'
1070+
description: Validation Error
1071+
summary: Catch All
10391072
/healthz:
10401073
get:
10411074
description: Health check endpoint. Expecting an empty response with status
@@ -1076,39 +1109,6 @@ paths:
10761109
description: Successful Response
10771110
tags:
10781111
- Infrastructure
1079-
/ui/:
1080-
get:
1081-
operationId: serve_chat_html__get
1082-
responses:
1083-
'200':
1084-
content:
1085-
application/json:
1086-
schema: {}
1087-
description: Successful Response
1088-
summary: Serve Chat Html
1089-
/ui/{full_path}:
1090-
get:
1091-
operationId: catch_all__full_path__get
1092-
parameters:
1093-
- in: path
1094-
name: full_path
1095-
required: true
1096-
schema:
1097-
title: Full Path
1098-
type: string
1099-
responses:
1100-
'200':
1101-
content:
1102-
application/json:
1103-
schema: {}
1104-
description: Successful Response
1105-
'422':
1106-
content:
1107-
application/json:
1108-
schema:
1109-
$ref: '#/components/schemas/HTTPValidationError'
1110-
description: Validation Error
1111-
summary: Catch All
11121112
/v1/chat/completions:
11131113
post:
11141114
operationId: create_chat_completion_chat_completions_post

bentoml/bentos/gemma/7b-instruct-awq-4bit-6a74/bento.yaml renamed to bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/bento.yaml

+2-2
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
service: service:VLLM
22
name: gemma
3-
version: 7b-instruct-awq-4bit-6a74
3+
version: 7b-instruct-awq-4bit-d670
44
bentoml_version: 1.2.19
5-
creation_time: '2024-07-05T07:32:14.773611+00:00'
5+
creation_time: '2024-07-08T07:59:18.619602+00:00'
66
labels:
77
openllm_alias: 7b-4bit,7b-instruct-4bit
88
openllm_hf_model_id: casperhansen/gemma-7b-it-awq

bentoml/bentos/gemma/7b-instruct-fp16-dafc/env/python/requirements.lock.txt renamed to bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/env/python/requirements.lock.txt

+1-1
Original file line number | Diff line number | Diff line change
@@ -143,5 +143,5 @@ yarl==1.9.4
143143
zipp==3.19.2
144144

145145
# The following packages are considered to be unsafe in a requirements file:
146-
pip==24.1.1
146+
pip==24.1.2
147147
setuptools==70.2.0

bentoml/bentos/gemma/7b-instruct-awq-4bit-6a74/src/service.py renamed to bentoml/bentos/gemma/7b-instruct-awq-4bit-d670/src/service.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -85,7 +85,7 @@ async def catch_all(full_path: str):
8585

8686

8787
@bentoml.mount_asgi_app(openai_api_app, path="/v1")
88-
@bentoml.mount_asgi_app(ui_app, path="/ui")
88+
@bentoml.mount_asgi_app(ui_app, path="/chat")
8989
@bentoml.service(**SERVICE_CONFIG)
9090
class VLLM:
9191
def __init__(self) -> None:

bentoml/bentos/gemma/7b-instruct-fp16-dafc/README.md renamed to bentoml/bentos/gemma/7b-instruct-fp16-ae3e/README.md

+1-1

bentoml/bentos/gemma/7b-instruct-fp16-dafc/apis/openapi.yaml renamed to bentoml/bentos/gemma/7b-instruct-fp16-ae3e/apis/openapi.yaml

+33-33
Original file line number | Diff line number | Diff line change
@@ -1036,6 +1036,39 @@ paths:
10361036
tags:
10371037
- Service APIs
10381038
x-bentoml-name: generate
1039+
/chat/:
1040+
get:
1041+
operationId: serve_chat_html__get
1042+
responses:
1043+
'200':
1044+
content:
1045+
application/json:
1046+
schema: {}
1047+
description: Successful Response
1048+
summary: Serve Chat Html
1049+
/chat/{full_path}:
1050+
get:
1051+
operationId: catch_all__full_path__get
1052+
parameters:
1053+
- in: path
1054+
name: full_path
1055+
required: true
1056+
schema:
1057+
title: Full Path
1058+
type: string
1059+
responses:
1060+
'200':
1061+
content:
1062+
application/json:
1063+
schema: {}
1064+
description: Successful Response
1065+
'422':
1066+
content:
1067+
application/json:
1068+
schema:
1069+
$ref: '#/components/schemas/HTTPValidationError'
1070+
description: Validation Error
1071+
summary: Catch All
10391072
/healthz:
10401073
get:
10411074
description: Health check endpoint. Expecting an empty response with status
@@ -1076,39 +1109,6 @@ paths:
10761109
description: Successful Response
10771110
tags:
10781111
- Infrastructure
1079-
/ui/:
1080-
get:
1081-
operationId: serve_chat_html__get
1082-
responses:
1083-
'200':
1084-
content:
1085-
application/json:
1086-
schema: {}
1087-
description: Successful Response
1088-
summary: Serve Chat Html
1089-
/ui/{full_path}:
1090-
get:
1091-
operationId: catch_all__full_path__get
1092-
parameters:
1093-
- in: path
1094-
name: full_path
1095-
required: true
1096-
schema:
1097-
title: Full Path
1098-
type: string
1099-
responses:
1100-
'200':
1101-
content:
1102-
application/json:
1103-
schema: {}
1104-
description: Successful Response
1105-
'422':
1106-
content:
1107-
application/json:
1108-
schema:
1109-
$ref: '#/components/schemas/HTTPValidationError'
1110-
description: Validation Error
1111-
summary: Catch All
11121112
/v1/chat/completions:
11131113
post:
11141114
operationId: create_chat_completion_chat_completions_post

bentoml/bentos/gemma/7b-instruct-fp16-dafc/bento.yaml renamed to bentoml/bentos/gemma/7b-instruct-fp16-ae3e/bento.yaml

+2-2
Original file line number | Diff line number | Diff line change
@@ -1,8 +1,8 @@
11
service: service:VLLM
22
name: gemma
3-
version: 7b-instruct-fp16-dafc
3+
version: 7b-instruct-fp16-ae3e
44
bentoml_version: 1.2.19
5-
creation_time: '2024-07-05T07:31:38.255529+00:00'
5+
creation_time: '2024-07-08T07:58:22.853090+00:00'
66
labels:
77
openllm_alias: 7b,7b-instruct
88
openllm_hf_model_id: google/gemma-7b-it

bentoml/bentos/llama2/13b-chat-fp16-0b04/env/python/requirements.lock.txt renamed to bentoml/bentos/gemma/7b-instruct-fp16-ae3e/env/python/requirements.lock.txt

+1-1
Original file line number | Diff line number | Diff line change
@@ -143,5 +143,5 @@ yarl==1.9.4
143143
zipp==3.19.2
144144

145145
# The following packages are considered to be unsafe in a requirements file:
146-
pip==24.1.1
146+
pip==24.1.2
147147
setuptools==70.2.0

bentoml/bentos/gemma/7b-instruct-fp16-dafc/src/service.py renamed to bentoml/bentos/gemma/7b-instruct-fp16-ae3e/src/service.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -85,7 +85,7 @@ async def catch_all(full_path: str):
8585

8686

8787
@bentoml.mount_asgi_app(openai_api_app, path="/v1")
88-
@bentoml.mount_asgi_app(ui_app, path="/ui")
88+
@bentoml.mount_asgi_app(ui_app, path="/chat")
8989
@bentoml.service(**SERVICE_CONFIG)
9090
class VLLM:
9191
def __init__(self) -> None:

bentoml/bentos/llama2/70b-chat-fp16-4512/README.md renamed to bentoml/bentos/llama2/13b-chat-fp16-4059/README.md

+1-1

0 commit comments

Comments
 (0)