You signed in with another tab or window. Reload to refresh your session. You signed out in another tab or window. Reload to refresh your session. You switched accounts on another tab or window. Reload to refresh your session. Dismiss alert
inputs.max_context_length=maxctx#initial value to use for ctx, can be overwritten
152
153
inputs.threads=args.threads
154
+
inputs.low_vram=args.lowvram
153
155
inputs.blasthreads=args.blasthreads
154
156
inputs.f16_kv=True
155
157
inputs.use_mmap= (notargs.nommap)
@@ -646,7 +648,7 @@ def onDropdownChange(event):
646
648
#load all the vars
647
649
args.threads=int(threads_var.get())
648
650
args.gpulayers=int(gpu_layers_var.get())
649
-
651
+
650
652
args.stream= (stream.get()==1)
651
653
args.smartcontext= (smartcontext.get()==1)
652
654
args.launch= (launchbrowser.get()==1)
@@ -861,6 +863,7 @@ def main(args):
861
863
parser.add_argument("--hordeconfig", help="Sets the display model name to something else, for easy use on AI Horde. Optional additional parameters set the horde max genlength and max ctxlen.",metavar=('[hordename]', '[hordelength] [hordectx]'), nargs='+')
862
864
compatgroup=parser.add_mutually_exclusive_group()
863
865
compatgroup.add_argument("--noblas", help="Do not use OpenBLAS for accelerated prompt ingestion", action='store_true')
866
+
parser.add_argument("--lowvram", help="Do not keep scratch memory in VRAM for CUDA", action='store_true')
864
867
compatgroup.add_argument("--useclblast", help="Use CLBlast instead of OpenBLAS for prompt ingestion. Must specify exactly 2 arguments, platform ID and device ID (e.g. --useclblast 1 0).", type=int, choices=range(0,9), nargs=2)
865
868
parser.add_argument("--gpulayers", help="Set number of layers to offload to GPU when using CLBlast. Requires CLBlast.",metavar=('[GPU layers]'), type=int, default=0)
0 commit comments