Skip to content

Commit 1dd2338

Browse files
authored
[Misc] Update usage with mooncake lib for kv transfer (vllm-project#16523)
Signed-off-by: Shangming Cai <[email protected]>
1 parent 7cbfc10 commit 1dd2338

File tree

2 files changed

+11
-11
lines changed

2 files changed

+11
-11
lines changed

vllm/distributed/kv_transfer/kv_lookup_buffer/mooncake_store.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -70,7 +70,7 @@ def __init__(
7070
):
7171

7272
try:
73-
from mooncake_vllm_adaptor import MooncakeDistributedStore
73+
from mooncake.store import MooncakeDistributedStore
7474
except ImportError as e:
7575
raise ImportError(
7676
"Please install mooncake by following the instructions at "

vllm/distributed/kv_transfer/kv_pipe/mooncake_pipe.py

Lines changed: 10 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -57,14 +57,14 @@ class MooncakeTransferEngine:
5757

5858
def __init__(self, kv_rank: int, local_rank: int):
5959
try:
60-
import mooncake_vllm_adaptor as mva
60+
from mooncake.engine import TransferEngine
6161
except ImportError as e:
6262
raise ImportError(
6363
"Please install mooncake by following the instructions at "
6464
"https://github.com/kvcache-ai/Mooncake/blob/main/doc/en/build.md " # noqa: E501
6565
"to run vLLM with MooncakeConnector.") from e
6666

67-
self.engine = mva.mooncake_vllm_adaptor()
67+
self.engine = TransferEngine()
6868
self.local_rank = local_rank
6969

7070
try:
@@ -140,26 +140,26 @@ def initialize(self, local_hostname: str, metadata_server: str,
140140
"Mooncake Configuration error. `metadata_backend`"
141141
f" should be one of {supported_backend}.")
142142

143-
self.engine.initializeExt(local_hostname, metadata_server,
144-
protocol, device_name, metadata_backend)
143+
self.engine.initialize_ext(local_hostname, metadata_server,
144+
protocol, device_name, metadata_backend)
145145

146146
def allocate_managed_buffer(self, length: int) -> int:
147147
"""Allocate a managed buffer of the specified length."""
148-
ret = self.engine.allocateManagedBuffer(length)
148+
ret = self.engine.allocate_managed_buffer(length)
149149
if ret <= 0:
150150
logger.error("Allocation Return Error")
151151
raise Exception("Allocation Return Error")
152152
return ret
153153

154154
def free_managed_buffer(self, buffer: int, length: int) -> int:
155155
"""Free a previously allocated managed buffer."""
156-
return self.engine.freeManagedBuffer(buffer, length)
156+
return self.engine.free_managed_buffer(buffer, length)
157157

158158
def transfer_sync(self, buffer: int, peer_buffer_address: int,
159159
length: int) -> int:
160160
"""Synchronously transfer data to the specified address."""
161-
ret = self.engine.transferSync(self.remote_url, buffer,
162-
peer_buffer_address, length)
161+
ret = self.engine.transfer_sync_read(self.remote_url, buffer,
162+
peer_buffer_address, length)
163163
if ret < 0:
164164
logger.error("Transfer Return Error")
165165
raise Exception("Transfer Return Error")
@@ -168,11 +168,11 @@ def transfer_sync(self, buffer: int, peer_buffer_address: int,
168168
def write_bytes_to_buffer(self, buffer: int, user_data: bytes,
169169
length: int) -> int:
170170
"""Write bytes to the allocated buffer."""
171-
return self.engine.writeBytesToBuffer(buffer, user_data, length)
171+
return self.engine.write_bytes_to_buffer(buffer, user_data, length)
172172

173173
def read_bytes_from_buffer(self, buffer: int, length: int) -> bytes:
174174
"""Read bytes from the allocated buffer."""
175-
return self.engine.readBytesFromBuffer(buffer, length)
175+
return self.engine.read_bytes_from_buffer(buffer, length)
176176

177177
def wait_for_ack(self, src_ptr: int, length: int) -> None:
178178
"""Asynchronously wait for ACK from the receiver."""

0 commit comments

Comments
 (0)