ake.jlama-net.0.4.0.source-code.JlamaService.proto Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of jlama-net Show documentation
Show all versions of jlama-net Show documentation
Jlama: A modern LLM inference engine for Java
syntax = "proto3";
option java_multiple_files = true;
package com.github.tjake.jlama.net;
message CombineRequest {
bytes workerid = 1;
bytes uuid = 2;
int32 layer = 3;
repeated bytes tensor = 4;
}
message CombineResponse {
repeated bytes tensor = 1;
}
message GenerateRequest {
bytes workerid = 1;
bytes session = 2;
bytes tensor = 3;
}
message GenerateResponse {
bytes session = 1;
int32 startPosition = 2;
repeated int32 tokens = 3;
}
/**
* Register a worker with the server
*/
message RegisterRequest {
bytes workerid = 1;
}
message RegisterResponse {
int32 modelShard = 1;
int32 numModelShards = 2;
int32 layerShard = 3;
int32 numLayerShards = 4;
}
service JlamaService {
rpc register(RegisterRequest) returns (RegisterResponse);
rpc generate(stream GenerateRequest) returns (stream GenerateResponse);
rpc combine(stream CombineRequest) returns (stream CombineResponse);
}