runtime.proto 777 B

123456789101112131415161718192021222324252627282930313233343536373839404142434445
  1. syntax = "proto3";
  // gRPC service that listens to incoming requests for expert computation.
  service ConnectionHandler {
    // Takes an ExpertUID and returns the matching ExpertInfo.
    rpc info(ExpertUID) returns (ExpertInfo);

    // Takes an ExpertRequest and returns an ExpertResponse.
    // NOTE(review): presumably runs the expert's forward pass -- confirm
    // against the server implementation.
    rpc forward(ExpertRequest) returns (ExpertResponse);

    // Same request/response types as `forward`.
    // NOTE(review): presumably runs the expert's backward pass -- confirm
    // against the server implementation.
    rpc backward(ExpertRequest) returns (ExpertResponse);
  }
  // Request payload of the `info` RPC: identifies a single expert.
  message ExpertUID {
    // String identifier of the expert being queried.
    string uid = 1;
  }
  // Response payload of the `info` RPC.
  message ExpertInfo {
    // Opaque byte blob describing the expert.
    // NOTE(review): the serialization format is not defined in this file --
    // confirm it with the producer/consumer code.
    bytes serialized_info = 1;
  }
  // Request payload shared by the `forward` and `backward` RPCs.
  message ExpertRequest {
    // String identifier of the expert the request is addressed to.
    string uid = 1;

    // Tensors sent along with the request (zero or more).
    repeated Tensor tensors = 2;
  }
  // Response payload shared by the `forward` and `backward` RPCs.
  message ExpertResponse {
    // Tensors returned to the caller (zero or more).
    // Field number 1 is unused here; 2 is the same number that
    // ExpertRequest.tensors uses.
    // NOTE(review): confirm whether that is intentional. Do not renumber:
    // changing the field number breaks wire compatibility.
    repeated Tensor tensors = 2;
  }
  // Compression scheme tag carried by Tensor.compression.
  // NOTE(review): the exact encoding behind each value is implemented outside
  // this file; the descriptions below are inferred from the names only.
  enum CompressionType {
    NONE = 0;           // Zero value, i.e. the proto3 default when unset.
    MEANSTD_16BIT = 1;  // presumably mean/std normalization + 16-bit values
    FLOAT16 = 2;        // presumably a plain half-precision cast
    QUANTILE_8BIT = 3;  // presumably 8-bit quantile-based quantization
    UNIFORM_8BIT = 4;   // presumably 8-bit uniform quantization
  }
  // A single tensor as it travels over the wire.
  message Tensor {
    // Raw tensor payload bytes.
    // NOTE(review): layout presumably depends on `dtype` and `compression` --
    // confirm against the serializer.
    bytes buffer = 1;

    // Sequence of unsigned sizes.
    // NOTE(review): presumably one entry per tensor dimension -- confirm.
    repeated uint32 size = 2;

    // Flag telling the receiver whether the tensor requires gradients.
    bool requires_grad = 3;

    // Element type name, transmitted as a string.
    // NOTE(review): the set of accepted names is not defined in this file.
    string dtype = 4;

    // Compression scheme applied to the tensor; defaults to NONE (0).
    CompressionType compression = 5;

    // NOTE(review): presumably the number of chunks the tensor was split
    // into for transfer -- confirm with the sender/receiver code.
    int32 chunks = 6;
  }