--cpu-memory CPU_MEMORY Maximum CPU memory in GiB to allocate for offloaded weights. Same as above. --disk If the model is too large for your GPU(s) and CPU combined, send the remaining layers to the disk. --dis
import multiprocessing import time #example worker, where you would put your stuff and report back def worker_func(input_queue, output_queue): while True: task = input_queue.get() if task["command"] == "exit": break elif task["command"] == "input": result = task["data"] #whatever...