@@ -210,8 +210,8 @@ def __init__(
210210 model_name : Optional [str ] = None ,
211211 max_batch_size : Optional [int ] = None ,
212212 max_sequence_length : Optional [int ] = None ,
213- param_hosting_ratio : float = 0.65 ,
214- kv_cache_ratio : float = 0.25 ,
213+ param_mem_ratio : float = 0.65 ,
214+ kvcache_mem_ratio : float = 0.25 ,
215215 ):
216216 self .recv_from_peer_addr = recv_from_peer_addr
217217 self .send_to_peer_addr = send_to_peer_addr
@@ -230,8 +230,8 @@ def __init__(
230230 self .model_name = model_name
231231 self .max_batch_size = max_batch_size
232232 self .max_sequence_length = max_sequence_length
233- self .param_hosting_ratio = param_hosting_ratio
234- self .kv_cache_ratio = kv_cache_ratio
233+ self .param_mem_ratio = param_mem_ratio
234+ self .kvcache_mem_ratio = kvcache_mem_ratio
235235 self .prefix_id = f"{ dht_prefix } _announce"
236236 self .lattica = None
237237 self .routing_table = None
@@ -686,8 +686,8 @@ def get_node_info(self, is_update: bool = False):
686686 info = {
687687 "node_id" : self .lattica .peer_id (),
688688 "hardware" : detect_node_hardware (self .lattica .peer_id ()),
689- "kv_cache_ratio " : self .kv_cache_ratio ,
690- "param_hosting_ratio " : self .param_hosting_ratio ,
689+ "kvcache_mem_ratio " : self .kvcache_mem_ratio ,
690+ "param_mem_ratio " : self .param_mem_ratio ,
691691 "max_concurrent_requests" : self .max_batch_size ,
692692 "max_sequence_length" : (
693693 1024 if self .max_sequence_length is None else self .max_sequence_length
@@ -753,8 +753,8 @@ def launch_p2p_server(
753753 model_name : Optional [str ],
754754 max_batch_size : Optional [int ] = None ,
755755 max_sequence_length : Optional [int ] = None ,
756- param_hosting_ratio : float = 0.65 ,
757- kv_cache_ratio : float = 0.25 ,
756+ param_mem_ratio : float = 0.65 ,
757+ kvcache_mem_ratio : float = 0.25 ,
758758):
759759 server = GradientServer (
760760 recv_from_peer_addr = recv_from_peer_addr ,
@@ -774,8 +774,8 @@ def launch_p2p_server(
774774 model_name = model_name ,
775775 max_batch_size = max_batch_size ,
776776 max_sequence_length = max_sequence_length ,
777- param_hosting_ratio = param_hosting_ratio ,
778- kv_cache_ratio = kv_cache_ratio ,
777+ param_mem_ratio = param_mem_ratio ,
778+ kvcache_mem_ratio = kvcache_mem_ratio ,
779779 )
780780 # Start the server
781781 thread = threading .Thread (target = server .run , daemon = True )
0 commit comments