Skip to content

Commit 1f0fa29

Browse files
committed
Remove unused imports in prefill.py, decode.py, and npu_graph_runner.py
- These unused imports were left over from resolving merge conflicts
1 parent 9b06d38 commit 1f0fa29

File tree

3 files changed

+4
-10
lines changed

3 files changed

+4
-10
lines changed

python/sglang/srt/disaggregation/decode.py

Lines changed: 2 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
from collections import deque
2626
from dataclasses import dataclass
2727
from http import HTTPStatus
28-
from typing import TYPE_CHECKING, Dict, List, Optional, Tuple, Type, Union
28+
from typing import TYPE_CHECKING, List, Optional, Tuple, Type, Union
2929

3030
import torch
3131
from torch.distributed import ProcessGroup
@@ -48,10 +48,7 @@
4848
)
4949
from sglang.srt.layers.dp_attention import get_attention_tp_size
5050
from sglang.srt.managers.schedule_batch import FINISH_ABORT, RequestStage, ScheduleBatch
51-
from sglang.srt.mem_cache.allocator import (
52-
BaseTokenToKVPoolAllocator,
53-
SWATokenToKVPoolAllocator,
54-
)
51+
from sglang.srt.mem_cache.allocator import BaseTokenToKVPoolAllocator
5552
from sglang.srt.mem_cache.base_prefix_cache import BasePrefixCache
5653
from sglang.srt.mem_cache.memory_pool import (
5754
HybridLinearKVPool,
@@ -61,7 +58,6 @@
6158
ReqToTokenPool,
6259
SWAKVPool,
6360
)
64-
from sglang.srt.model_executor.forward_batch_info import ForwardMode
6561
from sglang.srt.utils import get_int_env_var, require_mlp_sync
6662
from sglang.srt.utils.torch_memory_saver_adapter import TorchMemorySaverAdapter
6763

python/sglang/srt/disaggregation/prefill.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,7 +20,6 @@
2020
from __future__ import annotations
2121

2222
import logging
23-
import threading
2423
import time
2524
from collections import deque
2625
from http import HTTPStatus
@@ -54,7 +53,7 @@
5453
NSATokenToKVPool,
5554
SWAKVPool,
5655
)
57-
from sglang.srt.model_executor.forward_batch_info import ForwardMode, PPProxyTensors
56+
from sglang.srt.model_executor.forward_batch_info import PPProxyTensors
5857
from sglang.srt.utils import (
5958
DynamicGradMode,
6059
broadcast_pyobj,

python/sglang/srt/model_executor/npu_graph_runner.py

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -19,10 +19,9 @@
1919
import threading
2020
from typing import TYPE_CHECKING, Optional, Union
2121

22-
import numpy as np
2322
import torch
2423

25-
from sglang.srt.configs.model_config import AttentionArch, is_deepseek_nsa
24+
from sglang.srt.configs.model_config import is_deepseek_nsa
2625
from sglang.srt.model_executor.cuda_graph_runner import CudaGraphRunner
2726

2827
logger = logging.getLogger(__name__)

0 commit comments

Comments
 (0)