File tree Expand file tree Collapse file tree
Expand file tree Collapse file tree Original file line number Diff line number Diff line change @@ -88,11 +88,13 @@ def parse_generation_response(
8888 # Extract routed_experts information if available
8989 routed_experts = meta_info .get ("routed_experts" , None )
9090 if routed_experts is not None :
91- num_sgl_token = meta_info ['prompt_tokens' ] + meta_info ['completion_tokens' ]- 1
91+ num_sgl_token = (
92+ meta_info ["prompt_tokens" ] + meta_info ["completion_tokens" ] - 1
93+ )
9294 # Extract expert_id and reshape to (num_sgl_token, num_layers*expert_top_k)
9395 routed_experts = np .frombuffer (
9496 pybase64 .b64decode (routed_experts .encode ("utf-8" )), dtype = np .int32
95- ).reshape (num_sgl_token ,- 1 )
97+ ).reshape (num_sgl_token , - 1 )
9698
9799 if stop_reason == "abort" and stop_message .startswith ("Abort before prefill" ):
98100 return HttpGenerationResult (
Original file line number Diff line number Diff line change 1212from areal .api .alloc_mode import AllocationMode
1313from areal .api .cli_args import (
1414 ClusterSpecConfig ,
15- GenerationHyperparameters ,
1615 NameResolveConfig ,
1716 SGLangConfig ,
1817 parse_cli_args ,
Original file line number Diff line number Diff line change @@ -575,6 +575,7 @@ https://github.com/sgl-project/sglang for detailed documentation.
575575| ` enable_metrics ` | boolean | ` True ` | - |
576576| ` decode_log_interval ` | integer | ` 1 ` | - |
577577| ` enable_multithread_load ` | boolean | ` False ` | - |
578+ | ` enable_return_routed_experts ` | boolean | ` False ` | - |
578579
579580(section-v-llm)=
580581
@@ -747,7 +748,7 @@ Configuration for SwanLab experiment tracking and monitoring.
747748| ` config ` | ` dict ` \| None | ` None ` | - |
748749| ` logdir ` | string \| None | ` None ` | - |
749750| ` mode ` | string \| None | ` "disabled" ` | - |
750- | ` api_key ` | string \| None | ` None ` | - |
751+ | ` api_key ` | string \| None | ` None ` | - |
751752
752753(section-tensor-board)=
753754
You can’t perform that action at this time.
0 commit comments