Auto-assign GPU memory when --auto-devices is used alone

2024-10-01 01:26:03 -04:00 · 2023-02-10 16:36:06 -03:00 · 2023-02-10 16:36:06 -03:00 · 316e07f06a
commit 316e07f06a
parent 76d3d7ddb3
1 changed file with 1 addition and 1 deletion
--- a/server.py
+++ b/server.py
@@ -130,7 +130,7 @@ def load_model(model_name):
            if args.gpu_memory:
                params.append(f"max_memory={{0: '{args.gpu_memory or '99'}GiB', 'cpu': '{args.cpu_memory or '99'}GiB'}}")
-            elif (args.gpu_memory or args.cpu_memory) and not args.load_in_8bit:
+            elif not args.load_in_8bit:
                total_mem = (torch.cuda.get_device_properties(0).total_memory/(1024*1024))
                suggestion = round((total_mem-1000)/1000)*1000
                if total_mem-suggestion < 800: