| .. |
|
configs
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
models
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
double-sparsity-config-Llama-3.1-8B-Instruct.json
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
experiment_runner.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
kv_cache_scales_llama3_1_8b.json
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
kv_cache_scales_llama3_8b.json
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
kv_cache_scales_qwen2_1_5b.json
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
run_suite.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_abort.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_awq.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_bench_one_batch.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_bench_serving.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_block_int8.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_cache_report.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_chunked_prefill.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_create_kvindices.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_custom_allreduce.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_data_parallelism.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_double_sparsity.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_dp_attention.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_eagle_infer.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_ebnf_constrained.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_embedding_openai_server.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_eval_accuracy_large.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_eval_fp8_accuracy.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_expert_distribution.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_fim_completion.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_fp8_kernel.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_fp8_kvcache.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_function_calling.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_fused_moe.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_get_weights_by_name.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_gguf.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_gptqmodel_dynamic.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_health_check.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_hicache.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_hicache_mla.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_hidden_states.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_input_embeddings.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_int8_kernel.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_json_constrained.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_large_max_new_tokens.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_matched_stop.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_metrics.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla_deepseek_v3.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla_flashinfer.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla_fp8.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla_int8_deepseek_v3.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_mla_tp.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_modelopt_fp8kvcache.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_models_from_modelscope.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_moe_deepep.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_moe_ep.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_moe_eval_accuracy_large.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_nightly_gsm8k_eval.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_nightly_human_eval.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_nightly_math_eval.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_no_chunked_prefill.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_no_overlap_scheduler.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_openai_server.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_page_size.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_patch_torch.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_penalty.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_pytorch_sampling_backend.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_radix_attention.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_reasoning_content.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_regex_constrained.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_release_memory_occupation.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_request_length_validation.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_retract_decode.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_sagemaker_server.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_schedule_policy.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_server_args.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_session_control.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_skip_tokenizer_init.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_srt_endpoint.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_srt_engine.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_srt_engine_with_quant_args.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_torch_compile.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_torch_compile_moe.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_torch_native_attention_backend.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_torch_tp.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_torchao.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_triton_attention_backend.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_triton_attention_kernels.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_triton_attention_rocm_mla.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_update_weights_from_disk.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_update_weights_from_distributed.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_update_weights_from_tensor.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_verl_engine.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_vertex_endpoint.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_vision_chunked_prefill.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_vision_openai_server.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_vllm_dependency.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_vlm_accuracy.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |
|
test_w8a8_quantization.py
|
first commit @ sglang v0.4.5.post1
|
2025-06-29 18:55:37 +08:00 |