// Schema for the GPT inference gRPC API: the service definition plus its
// request and response messages.
syntax = "proto3";

// The package name is part of every fully-qualified type and RPC name
// generated from this file, so changing it breaks existing clients.
package runtime.aot.machine_learning.parents.gpt;

// Inference entry points. Both RPCs accept the same Request message and
// produce Response messages; they differ only in how the reply is delivered.
service GPTInferenceService {
  // Unary call: one Request in, exactly one Response out.
  rpc Predict(Request) returns (Response);

  // Server-streaming call: one Request in, a stream of Response messages out.
  // NOTE(review): how a reply is divided across the streamed messages is not
  // specified by this schema - confirm against the server implementation.
  rpc PredictWithStream(Request) returns (stream Response);
}

// A single message, used both as an element of Request.messages and as the
// payload carried by MessageWarpper.message.
message Message {
  // Numeric identifier of the message's role.
  // NOTE(review): the mapping from number to role is not defined anywhere in
  // this file - confirm the valid values with the server implementation.
  uint64 role = 1;

  // Message text. Must be valid UTF-8, as for every proto3 string field.
  string message = 2;
}

// Input to both GPTInferenceService.Predict and
// GPTInferenceService.PredictWithStream.
message Request {
  // A single string despite the plural field name.
  // NOTE(review): presumably the identifier of the model to run - confirm the
  // expected format.
  string models = 1;

  // Messages supplied with the request, in the order given by the caller.
  repeated Message messages = 2;

  // NOTE(review): presumably the sampling temperature - confirm. The field has
  // no explicit presence, so a receiver cannot distinguish 0.0 from "not set".
  double temperature = 3;

  // NOTE(review): presumably the nucleus-sampling threshold - confirm. As with
  // temperature, 0.0 and "not set" are indistinguishable on the wire.
  double top_p = 4;
}

// Output of both RPCs: returned once by Predict and zero or more times on the
// PredictWithStream stream.
//
// NOTE(review): field numbers 1 and 3 are not used by this message. If they
// belonged to fields that were removed, add `reserved 1, 3;` so they can never
// be reused with a different meaning.
message Response {
  // Numeric result code.
  // NOTE(review): the meaning of individual values is not defined in this
  // file - confirm with the server implementation.
  uint64 response_code = 2;

  // Result payload. Declared `optional`, so the generated code can report
  // whether it was set at all.
  optional Body body = 4;
}

// Payload carried in Response.body.
message Body {
  // Identifier string. NOTE(review): scope and format are not defined here.
  string id = 1;

  // NOTE(review): presumably a type tag for the payload - confirm the values.
  string object = 2;

  // NOTE(review): presumably a timestamp; the unit and epoch are not defined
  // in this file - confirm before interpreting the value.
  uint64 time = 3;

  // Wrapper holding the returned Message together with one integer.
  MessageWarpper message_warpper = 4;

  // Three integers whose meaning this schema does not define; see Unknown.
  Unknown unknown = 5;
}

// Pairs a Message with one integer. Used by Body.message_warpper.
//
// The spelling "Warpper" is part of the generated API (type and accessor
// names), so it is kept as-is; renaming would break existing callers.
message MessageWarpper {
  // NOTE(review): meaning not defined in this file - confirm with the server.
  int64 arg1 = 1;

  // The wrapped message.
  Message message = 2;
}

// Three integer values carried in Body.unknown.
// NOTE(review): neither the message name nor the field names say what these
// values represent - confirm with the server implementation and document them.
message Unknown {
  int64 arg1 = 1;
  int64 arg2 = 2;
  int64 arg3 = 3;
}