Make the default of ngl be -1 #707

Open · wants to merge 1 commit into base: main
docs/ramalama.1.md (1 addition, 1 deletion)

@@ -115,7 +115,7 @@ pass --group-add keep-groups to podman (default: False)
 Needed to access the gpu on some systems, but has an impact on security, use with caution.

 #### **--ngl**
-number of gpu layers (default: 999)
+number of gpu layers (default: -1)
Contributor (comment on lines 115 to +118):
suggestion: Clarify the meaning of -1 for ngl.

The documentation should explicitly state what a value of -1 means for the number of GPU layers. Does it mean "use all available layers" or something else? Also, "gpu" should be "GPU".

Suggested change:
-Needed to access the gpu on some systems, but has an impact on security, use with caution.
-#### **--ngl**
-number of gpu layers (default: -1)
+Needed to access the GPU on some systems, but has an impact on security, use with caution.
+#### **--ngl**
+number of GPU layers (default: -1). A value of -1 means use all available GPU layers

Member:

I agree with Sourcery; you need to explain the value of -1.

Contributor:

Thanks @rhatdan! I'm glad you agree. It's important to make this clear in the documentation so users understand how to use this option. Please update the documentation to explain the meaning of -1, as suggested in my previous comment. Let me know if you have any questions about how to best phrase this.

Collaborator:

+1, magic numbers are bad.

Contributor:

Thank you for your feedback; we will generate more comments like this in the future.


#### **--nocontainer**
do not run RamaLama in the default container (default: False)
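The "use all available layers" semantics requested for -1 in the thread above could be resolved by the runtime roughly as follows. This is a hypothetical sketch, not code from the PR; `resolve_ngl` and `total_layers` are invented names for illustration:

```python
def resolve_ngl(ngl: int, total_layers: int) -> int:
    """Map the CLI sentinel to a concrete layer count.

    A negative value (the new default, -1) means "offload every layer",
    so it resolves to the model's total layer count; any non-negative
    value is passed through unchanged.
    """
    return total_layers if ngl < 0 else ngl

print(resolve_ngl(-1, 32))  # 32: -1 resolves to all layers
print(resolve_ngl(10, 32))  # 10: explicit request honored
print(resolve_ngl(0, 32))   # 0: no layers offloaded (CPU-only)
```

Centralizing the sentinel in one helper like this keeps the magic number out of the rest of the code, which is the concern raised in the review.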
docs/ramalama.conf (1 addition, 1 deletion)

@@ -51,7 +51,7 @@

 # Default number of layers offloaded to the gpu
 #
-#ngl = 999
+#ngl = -1
Member:

Explain -1 above.


# Specify default port for services to listen on
#
docs/ramalama.conf.5.md (1 addition, 1 deletion)

@@ -92,7 +92,7 @@ RAMALAMA_IMAGE environment variable overrides this field.
 Pass `--group-add keep-groups` to podman, when using podman.
 In some cases this is needed to access the gpu from a rootless container

-**ngl**=999
+**ngl**=-1
Member:

Please explain the meaning of -1.


Default number of layers to offload to the gpu

ramalama/cli.py (1 addition, 1 deletion)

@@ -196,7 +196,7 @@ def configure_arguments(parser):
         "--ngl",
         dest="ngl",
         type=int,
-        default=config.get("ngl", 999),
+        default=config.get("ngl", -1),
         help="Number of layers to offload to the gpu, if available"
     )
     parser.add_argument(
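The changed argparse default can be exercised in isolation. This is a minimal sketch mirroring the hunk above; the `config` dict is a stand-in for ramalama's parsed config file, not the real object:

```python
import argparse

config = {}  # stand-in for the parsed ramalama.conf settings

parser = argparse.ArgumentParser()
parser.add_argument(
    "--ngl",
    dest="ngl",
    type=int,
    default=config.get("ngl", -1),  # fallback is now -1 instead of 999
    help="Number of layers to offload to the gpu, if available",
)

print(parser.parse_args([]).ngl)              # -1 (new default)
print(parser.parse_args(["--ngl", "8"]).ngl)  # 8 (explicit value wins)
```

Note the precedence this gives: an explicit `--ngl` on the command line beats a value from the config file, which in turn beats the built-in -1 fallback.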
ramalama/model.py (1 addition, 1 deletion)

@@ -193,7 +193,7 @@ def setup_container(self, args):
     def gpu_args(self, args, runner=False):
         gpu_args = []
         if (
-            args.gpu
+            args.gpu > 0
             or os.getenv("HIP_VISIBLE_DEVICES")
             or os.getenv("ASAHI_VISIBLE_DEVICES")
             or os.getenv("CUDA_VISIBLE_DEVICES")