|
51 | 51 | gpu_memory_utilization=orjson.loads(coreutils.getenv('gpu_memory_utilization', default=orjson.dumps({__gpu_memory_utilization__}), var=['GPU_MEMORY_UTILISATION'])) |
52 | 52 | services_config=orjson.loads(coreutils.getenv('services_config',"""{__services_config__}""")) |
53 | 53 | ''' |
54 | | -_DOCKERFILE_TEMPLATE = """\ |
55 | | -{% extends bento_base_template %} |
56 | | -{% block SETUP_BENTO_BASE_IMAGE %} |
57 | | -{{ super() }} |
58 | | -{% endblock %} |
59 | | -""" |
60 | 54 |
|
61 | 55 |
|
62 | 56 | class ItemState(enum.Enum): |
@@ -235,6 +229,7 @@ def start_command( |
235 | 229 | """ |
236 | 230 | import transformers |
237 | 231 |
|
| 232 | + from _bentoml_impl.server import serve_http |
238 | 233 | from bentoml._internal.service.loader import load |
239 | 234 | from bentoml._internal.log import configure_server_logging |
240 | 235 |
|
@@ -284,9 +279,8 @@ def start_command( |
284 | 279 | working_dir = os.path.abspath(os.path.dirname(__file__)) |
285 | 280 | if sys.path[0] != working_dir: |
286 | 281 | sys.path.insert(0, working_dir) |
287 | | - load('.', working_dir=working_dir).serve_http( |
288 | | - working_dir=working_dir, reload=check_bool_env('RELOAD', default=False), development_mode=DEBUG |
289 | | - ) |
| 282 | + load('.', working_dir=working_dir).inject_config() |
| 283 | + serve_http('.', working_dir=working_dir, reload=check_bool_env('RELOAD', default=False), development_mode=DEBUG) |
290 | 284 |
|
291 | 285 |
|
292 | 286 | def construct_python_options(llm_config, llm_fs): |
|
0 commit comments