|
Tools for converting transformer blocks, applying quantization and/or tensor parallelism
|
|
Tools for converting transformer blocks, applying quantization and/or tensor parallelism
|
|
from typing import List, Optional, Sequence
|
|
from typing import List, Optional, Sequence
|