// runtime.proto

  // Selects the proto3 language version; must be the first non-comment
  // statement in the file.
  syntax = "proto3";
  // Wrapper message holding a single expert identifier.
  message ExpertUID {
    // Identifier of the expert, as a string.
    string uid = 1;
  }
  // Wrapper message holding expert information as an opaque byte string.
  message ExpertInfo {
    // Serialized payload. The serialization format is not defined by this
    // schema. NOTE(review): confirm the encoding with the producer/consumer code.
    bytes serialized_info = 1;
  }
  // Request message: an expert identifier plus a list of tensors and an
  // opaque metadata blob.
  message ExpertRequest {
    // Identifier of the expert, as a string.
    string uid = 1;
    // Zero or more Tensor messages carried by the request.
    repeated Tensor tensors = 2;
    // Opaque bytes; the format is not defined by this schema.
    // NOTE(review): confirm the encoding against the caller.
    bytes metadata = 3;
  }
  // Response message: a list of tensors and an opaque metadata blob.
  //
  // Field number 1 is not used here; numbering starts at 2. Keep the
  // existing numbers unchanged, since they define the wire format.
  message ExpertResponse {
    // Zero or more Tensor messages carried by the response.
    repeated Tensor tensors = 2;
    // Opaque bytes; the format is not defined by this schema.
    // NOTE(review): confirm the encoding against the caller.
    bytes metadata = 3;
  }
  // Enumerates the compression schemes a Tensor can be tagged with.
  // The exact algorithm behind each value is not defined in this file;
  // NOTE(review): confirm against the (de)serialization code.
  enum CompressionType {
    // Zero value, and therefore the proto3 default when the field is unset.
    NONE = 0;
    MEANSTD_16BIT = 1;
    FLOAT16 = 2;
    QUANTILE_8BIT = 3;
    UNIFORM_8BIT = 4;
  }
  // Serialized tensor: a raw byte buffer plus the descriptive fields that
  // accompany it.
  message Tensor {
    // Raw tensor bytes. Presumably encoded according to `dtype` and
    // `compression` -- TODO confirm against the serializer.
    bytes buffer = 1;
    // List of unsigned 32-bit sizes. Presumably one entry per tensor
    // dimension (i.e. the shape) -- TODO confirm.
    repeated uint32 size = 2;
    // Boolean flag stored with the tensor; how the receiver uses it is not
    // shown in this schema.
    bool requires_grad = 3;
    // Element type name as a string; the set of accepted values is not
    // defined in this schema.
    string dtype = 4;
    // Compression scheme tag; defaults to NONE (value 0) when unset.
    CompressionType compression = 5;
    // Integer chunk count. NOTE(review): looks like the number of pieces
    // the tensor is split into for transfer -- confirm with the caller.
    int32 chunks = 6;
  }