3 years ago · 0f5c427969
--- a/cli/run_server.py
+++ b/cli/run_server.py
@@ -2,26 +2,13 @@ import configargparse
 
															 from hivemind.proto.runtime_pb2 import CompressionType
														
 
															 from hivemind.utils.limits import increase_file_limit
														
 
															 from hivemind.utils.logging import get_logger, use_hivemind_log_handler
														
 
															+from humanfriendly import parse_size
														
 
															 from src.server.server import Server
														
 
															 use_hivemind_log_handler("in_root_logger")
														
 
															 logger = get_logger(__file__)
														
 
															-import re
														
 
															-
														
 
															-
														
 
															-def parse_size_as_bytes(size: str) -> int:
														
 
															-    """parse human-readable data size e.g. 1.5GB, based on https://stackoverflow.com/a/42865957/2002471"""
														
 
															-    units = {"B": 1, "KB": 2**10, "MB": 2**20, "GB": 2**30, "TB": 2**40, "PB": 2**50}
														
 
															-    size = size.strip().upper().replace("IB", "B")
														
 
															-    if not size.endswith("B"):
														
 
															-        size += "B"
														
 
															-    if not re.match(r" ", size):
														
 
															-        size = re.sub(r"([KMGT]?B)", r" \1", size)
														
 
															-    number, unit = [string.strip() for string in size.split()]
														
 
															-    return int(float(number) * units[unit])
														
 
															-
														
 
															 def main():
														
 
															     # fmt:off
														
@@ -58,7 +45,7 @@ def main():
 
															                              "By default, respect the dtypes in the pre-trained state dict.")
														
 
															     parser.add_argument('--attn_cache_size', type=str, default=None,
														
 
															                         help='The size of GPU memory allocated for storing past attention keys/values between inference'
														
 
															-                             ' steps; examples: 500MB or 1.2GB or 1073741824 (bytes); assumes 1KB = 1kB = 1024 bytes')
														
 
															+                             ' steps; examples: 500MB or 1.2GB or 1073741824 (bytes); be warned: 1KB != 1KiB')
														
 
															     parser.add_argument('--revision', type=str, default='main',
														
 
															                         help="The specific model version to use. It can be a branch name, a tag name, or a commit id, since we use a git-based system for storing models"
														
 
															                              "and other artifacts on huggingface.co, so `revision` can be any identifier allowed by git.")
														
@@ -100,7 +87,7 @@ def main():
 
															     attn_cache_size = args.pop("attn_cache_size")
														
 
															     if attn_cache_size is not None:
														
 
															-        attn_cache_size = parse_size_as_bytes(attn_cache_size)
														
 
															+        attn_cache_size = parse_size(attn_cache_size)
														
 
															     assert isinstance(
														
 
															         attn_cache_size, (int, type(None))
														
 
															     ), "unrecognized value for attention_cache_bytes, examples: 1.5GB or 1500MB or 1572864000 (bytes)"
														
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,5 +1,6 @@
 
															 torch==1.12.0
														
 
															 accelerate==0.10.0
														
 
															 huggingface-hub==0.7.0
														
 
															+humanfriendly
														
 
															 https://github.com/learning-at-home/hivemind/archive/20b3b3d5f225ed525515a5383a008a8f9fad8173.zip
														
 
															 https://github.com/huggingface/transformers/archive/6589e510fa4e6c442059de2fab84752535de9b23.zip