config.yml 202 B

# Flat key/value settings, one `key: value` entry per line.
listen_on: 0.0.0.0:*
num_experts: 16
expert_cls: ffn
hidden_dim: 1024
# NOTE(review): the bracketed [0:4] parts look like index ranges to be
# expanded by the consumer -- confirm before editing the pattern.
expert_pattern: expert.[0:4].[0:4]
max_batch_size: 16384
optimizer: adam
no_dht: true
# Quoted, so this is the two-character string "[]" rather than an empty YAML
# sequence; keep the quotes unless the consumer expects a real list.
initial_peers: "[]"
increase_file_limit: true