Skip to content

Commit

Permalink
Use SGLang imports for linear layer (sgl-project#1696)
Browse files Browse the repository at this point in the history
  • Loading branch information
janimo authored and qeternity committed Oct 27, 2024
1 parent e23bc9e commit e9cc2b7
Showing 1 changed file with 5 additions and 5 deletions.
10 changes: 5 additions & 5 deletions python/sglang/srt/models/olmo.py
Original file line number | Diff line number | Diff line change
Expand Up
@@ -22,11 +22,6 @@
 from torch import nn
 from transformers import OlmoConfig
 from vllm.distributed import get_tensor_model_parallel_world_size
-from vllm.model_executor.layers.linear import (
-    MergedColumnParallelLinear,
-    QKVParallelLinear,
-    RowParallelLinear,
-)
 from vllm.model_executor.layers.rotary_embedding import get_rope
 from vllm.model_executor.layers.vocab_parallel_embedding import (
     ParallelLMHead,
Expand All
@@ -35,6 +30,11 @@
 from vllm.model_executor.model_loader.weight_utils import default_weight_loader
 
 from sglang.srt.layers.activation import SiluAndMul
+from sglang.srt.layers.linear import (
+    MergedColumnParallelLinear,
+    QKVParallelLinear,
+    RowParallelLinear,
+)
 from sglang.srt.layers.logits_processor import LogitsProcessor
 from sglang.srt.layers.quantization.base_config import QuantizationConfig
 from sglang.srt.layers.radix_attention import RadixAttention
Expand Down

0 comments on commit e9cc2b7

Please sign in to comment.