Skip to content
This repository was archived by the owner on Oct 9, 2024. It is now read-only.

Commit abfc97f

Browse files
committed
use descriptive method names
1 parent 9d48dbf commit abfc97f

File tree

4 files changed

+25
-25
lines changed

4 files changed

+25
-25
lines changed

inference_server/model_handler/deployment.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -132,16 +132,16 @@ def _initialize_grpc_client(self):
132132
self.stubs.append(stub)
133133

134134
# runs task in parallel and return the result from the first task
135-
async def _query_in_tensor_parallel(self, text: List[str], generate_kwargs: dict):
135+
async def generate_in_tensor_parallel(self, text: List[str], generate_kwargs: dict):
136136
responses = []
137137
for i in range(self.num_gpus):
138-
responses.append(self.asyncio_loop.create_task(self._request_async_response(i, text, generate_kwargs)))
138+
responses.append(self.asyncio_loop.create_task(self.generate_async(i, text, generate_kwargs)))
139139

140140
await responses[0]
141141
return responses[0]
142142

143-
async def _request_async_response(self, stub_id: int, text: List[str], generate_kwargs: dict):
144-
req = generation_pb2.GenerationRequest(texts=text, generate_kwargs=generate_kwargs)
143+
async def generate_async(self, stub_id: int, text: List[str], generate_kwargs: dict):
144+
req = generation_pb2.GenerationRequestProto(texts=text, generate_kwargs=generate_kwargs)
145145
response = await self.stubs[stub_id].Generate(req)
146146
return response
147147

@@ -157,7 +157,7 @@ def generate(self, **kwargs) -> GenerateResponse:
157157
generate_kwargs = self.dict_to_proto(generate_kwargs)
158158

159159
response = self.asyncio_loop.run_until_complete(
160-
self._query_in_tensor_parallel(text, generate_kwargs)
160+
self.generate_in_tensor_parallel(text, generate_kwargs)
161161
).result()
162162

163163
if response.error:

inference_server/model_handler/grpc_utils/pb/generation_pb2.py

Lines changed: 11 additions & 11 deletions
Some generated files are not rendered by default. Learn more about customizing how changed files appear on GitHub.

inference_server/model_handler/grpc_utils/pb/generation_pb2_grpc.py

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -16,8 +16,8 @@ def __init__(self, channel):
1616
"""
1717
self.Generate = channel.unary_unary(
1818
"/generation.GenerationService/Generate",
19-
request_serializer=generation__pb2.GenerationRequest.SerializeToString,
20-
response_deserializer=generation__pb2.GenerationResponse.FromString,
19+
request_serializer=generation__pb2.GenerationRequestProto.SerializeToString,
20+
response_deserializer=generation__pb2.GenerationResponseProto.FromString,
2121
)
2222

2323

@@ -35,8 +35,8 @@ def add_GenerationServiceServicer_to_server(servicer, server):
3535
rpc_method_handlers = {
3636
"Generate": grpc.unary_unary_rpc_method_handler(
3737
servicer.Generate,
38-
request_deserializer=generation__pb2.GenerationRequest.FromString,
39-
response_serializer=generation__pb2.GenerationResponse.SerializeToString,
38+
request_deserializer=generation__pb2.GenerationRequestProto.FromString,
39+
response_serializer=generation__pb2.GenerationResponseProto.SerializeToString,
4040
),
4141
}
4242
generic_handler = grpc.method_handlers_generic_handler("generation.GenerationService", rpc_method_handlers)
@@ -64,8 +64,8 @@ def Generate(
6464
request,
6565
target,
6666
"/generation.GenerationService/Generate",
67-
generation__pb2.GenerationRequest.SerializeToString,
68-
generation__pb2.GenerationResponse.FromString,
67+
generation__pb2.GenerationRequestProto.SerializeToString,
68+
generation__pb2.GenerationResponseProto.FromString,
6969
options,
7070
channel_credentials,
7171
insecure,

inference_server/model_handler/grpc_utils/proto/generation.proto

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -2,7 +2,7 @@ syntax = "proto3";
22
package generation;
33

44
service GenerationService {
5-
rpc Generate (GenerationRequest) returns (GenerationResponse) {}
5+
rpc Generate (GenerationRequestProto) returns (GenerationResponseProto) {}
66
}
77

88
message Value {
@@ -14,12 +14,12 @@ message Value {
1414
}
1515
}
1616

17-
message GenerationRequest {
17+
message GenerationRequestProto {
1818
repeated string texts = 1;
1919
map<string,Value> generate_kwargs = 2;
2020
}
2121

22-
message GenerationResponse {
22+
message GenerationResponseProto {
2323
repeated string texts = 1;
2424
repeated int32 num_generated_tokens = 2;
2525
string error = 3;

0 commit comments

Comments
 (0)