File tree Expand file tree Collapse file tree 2 files changed +39
-0
lines changed
vllm/distributed/kv_transfer/kv_lookup_buffer Expand file tree Collapse file tree 2 files changed +39
-0
lines changed Original file line number Diff line number Diff line change 1+ # SPDX-License-Identifier: Apache-2.0
2+
3+ import os
4+ import random
5+
6+ import torch
7+ from tqdm import tqdm
8+
9+ from vllm .config import KVTransferConfig
10+ from vllm .config import VllmConfig
11+ from vllm .distributed .kv_transfer .kv_lookup_buffer .base import MooncakeStore
12+
13+
def main():
    """Smoke-test that a MooncakeStore can be constructed and shut down.

    Builds a ``VllmConfig`` with no arguments, constructs a
    ``MooncakeStore`` from it, prints ``Done`` on success, and always
    closes the store afterwards.
    """
    vllm_config = VllmConfig()
    mooncake = MooncakeStore("localhost", 0, vllm_config)
    try:
        print('Done')
    finally:
        # Close the store even if something after construction fails, so
        # the lookup buffer is not left open when the script exits.
        mooncake.close()


if __name__ == "__main__":
    main()
Original file line number Diff line number Diff line change 1414from vllm .distributed .kv_transfer .kv_pipe .mooncake_pipe import MooncakeTransferEngineConfig
1515
1616import torch
17+ from vllm .logger import init_logger
18+
19+ logger = init_logger (__name__ )
1720
1821
1922class KVLookupBufferBase (ABC ):
@@ -157,6 +160,9 @@ def drop_select(
157160 roi : Optional [torch .Tensor ]) -> List [Optional [torch .Tensor ]]:
158161 # V1 (get and unpack all tensors): consume tensors from MooncakeStore's buffer
159162 raise NotImplementedError ("Insert method is not implemented" )
163+
def close(self):
    """Close the lookup buffer; this implementation does nothing."""
    return None
160166
161167 def put (
162168 self ,
You can’t perform that action at this time.
0 commit comments