Spaces:
Runtime error
Runtime error
Update app.py
Browse files
app.py
CHANGED
|
@@ -1,8 +1,8 @@
|
|
| 1 |
from lmdeploy.serve.gradio.turbomind_coupled import *
|
| 2 |
from lmdeploy.messages import TurbomindEngineConfig
|
| 3 |
|
| 4 |
-
backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05
|
| 5 |
-
model_path = 'internlm/internlm2-
|
| 6 |
|
| 7 |
InterFace.async_engine = AsyncEngine(
|
| 8 |
model_path=model_path,
|
|
@@ -80,13 +80,13 @@ with gr.Blocks(css=CSS, theme=THEME) as demo:
|
|
| 80 |
with gr.Row():
|
| 81 |
request_output_len = gr.Slider(1,
|
| 82 |
2048,
|
| 83 |
-
value=
|
| 84 |
step=1,
|
| 85 |
label='Maximum new tokens')
|
| 86 |
-
top_p = gr.Slider(0.01, 1, value=0
|
| 87 |
temperature = gr.Slider(0.01,
|
| 88 |
1.5,
|
| 89 |
-
value=0.
|
| 90 |
step=0.01,
|
| 91 |
label='Temperature')
|
| 92 |
|
|
|
|
| 1 |
from lmdeploy.serve.gradio.turbomind_coupled import *
|
| 2 |
from lmdeploy.messages import TurbomindEngineConfig
|
| 3 |
|
| 4 |
+
backend_config = TurbomindEngineConfig(max_batch_size=1, cache_max_entry_count=0.05)#, model_format='awq')
|
| 5 |
+
model_path = 'internlm/internlm2-math-7b'
|
| 6 |
|
| 7 |
InterFace.async_engine = AsyncEngine(
|
| 8 |
model_path=model_path,
|
|
|
|
| 80 |
with gr.Row():
|
| 81 |
request_output_len = gr.Slider(1,
|
| 82 |
2048,
|
| 83 |
+
value=1024,
|
| 84 |
step=1,
|
| 85 |
label='Maximum new tokens')
|
| 86 |
+
top_p = gr.Slider(0.01, 1, value=1.0, step=0.01, label='Top_p')
|
| 87 |
temperature = gr.Slider(0.01,
|
| 88 |
1.5,
|
| 89 |
+
value=0.01,
|
| 90 |
step=0.01,
|
| 91 |
label='Temperature')
|
| 92 |
|