|
@@ -54,7 +54,7 @@ class StandardNode(Node):
|
|
|
is_finished = is_finished or len(self.buffered_token_output[request_id][0]) >= self.max_generate_tokens
|
|
|
if is_finished:
|
|
|
self.buffered_token_output[request_id] = (self.buffered_token_output[request_id][0], True)
|
|
|
- asyncio.create_task(self.broadcast_result(request_id, self.buffered_token_output[request_id][0], is_finished))
|
|
|
+ asyncio.create_task(self.broadcast_result(request_id, self.buffered_token_output[request_id][0], is_finished)) # TODO: this is n^2 communication complexity
|
|
|
|
|
|
if result.size == 1:
|
|
|
self.buffered_token_output[request_id][0].append(result.item())
|
|
@@ -79,7 +79,7 @@ class StandardNode(Node):
|
|
|
is_finished = is_finished or len(self.buffered_token_output[request_id][0]) >= self.max_generate_tokens
|
|
|
if is_finished:
|
|
|
self.buffered_token_output[request_id] = (self.buffered_token_output[request_id][0], True)
|
|
|
- asyncio.create_task(self.broadcast_result(request_id, self.buffered_token_output[request_id][0], is_finished))
|
|
|
+ asyncio.create_task(self.broadcast_result(request_id, self.buffered_token_output[request_id][0], is_finished)) # TODO: this is n^2 communication complexity
|
|
|
|
|
|
if result.size == 1: # we got a new token out
|
|
|
self.buffered_token_output[request_id][0].append(result.item())
|