@@ -57,14 +57,14 @@ class MooncakeTransferEngine:
57
57
58
58
def __init__ (self , kv_rank : int , local_rank : int ):
59
59
try :
60
- import mooncake_vllm_adaptor as mva
60
+ from mooncake . engine import TransferEngine
61
61
except ImportError as e :
62
62
raise ImportError (
63
63
"Please install mooncake by following the instructions at "
64
64
"https://github.com/kvcache-ai/Mooncake/blob/main/doc/en/build.md " # noqa: E501
65
65
"to run vLLM with MooncakeConnector." ) from e
66
66
67
- self .engine = mva . mooncake_vllm_adaptor ()
67
+ self .engine = TransferEngine ()
68
68
self .local_rank = local_rank
69
69
70
70
try :
@@ -140,26 +140,26 @@ def initialize(self, local_hostname: str, metadata_server: str,
140
140
"Mooncake Configuration error. `metadata_backend`"
141
141
f" should be one of { supported_backend } ." )
142
142
143
- self .engine .initializeExt (local_hostname , metadata_server ,
144
- protocol , device_name , metadata_backend )
143
+ self .engine .initialize_ext (local_hostname , metadata_server ,
144
+ protocol , device_name , metadata_backend )
145
145
146
146
def allocate_managed_buffer (self , length : int ) -> int :
147
147
"""Allocate a managed buffer of the specified length."""
148
- ret = self .engine .allocateManagedBuffer (length )
148
+ ret = self .engine .allocate_managed_buffer (length )
149
149
if ret <= 0 :
150
150
logger .error ("Allocation Return Error" )
151
151
raise Exception ("Allocation Return Error" )
152
152
return ret
153
153
154
154
def free_managed_buffer (self , buffer : int , length : int ) -> int :
155
155
"""Free a previously allocated managed buffer."""
156
- return self .engine .freeManagedBuffer (buffer , length )
156
+ return self .engine .free_managed_buffer (buffer , length )
157
157
158
158
def transfer_sync (self , buffer : int , peer_buffer_address : int ,
159
159
length : int ) -> int :
160
160
"""Synchronously transfer data to the specified address."""
161
- ret = self .engine .transferSync (self .remote_url , buffer ,
162
- peer_buffer_address , length )
161
+ ret = self .engine .transfer_sync_read (self .remote_url , buffer ,
162
+ peer_buffer_address , length )
163
163
if ret < 0 :
164
164
logger .error ("Transfer Return Error" )
165
165
raise Exception ("Transfer Return Error" )
@@ -168,11 +168,11 @@ def transfer_sync(self, buffer: int, peer_buffer_address: int,
168
168
def write_bytes_to_buffer (self , buffer : int , user_data : bytes ,
169
169
length : int ) -> int :
170
170
"""Write bytes to the allocated buffer."""
171
- return self .engine .writeBytesToBuffer (buffer , user_data , length )
171
+ return self .engine .write_bytes_to_buffer (buffer , user_data , length )
172
172
173
173
def read_bytes_from_buffer (self , buffer : int , length : int ) -> bytes :
174
174
"""Read bytes from the allocated buffer."""
175
- return self .engine .readBytesFromBuffer (buffer , length )
175
+ return self .engine .read_bytes_from_buffer (buffer , length )
176
176
177
177
def wait_for_ack (self , src_ptr : int , length : int ) -> None :
178
178
"""Asynchronously wait for ACK from the receiver."""
0 commit comments