# Disable the Exllama code path when HAS_EXLLAMA is falsy, warning first if
# CAN_EXLLAMA indicates the kernels could otherwise have been used.
if not HAS_EXLLAMA:
    if CAN_EXLLAMA:
        # Single call: log_once receives logger.warning as the logging
        # callable plus the message. The stray `logger.warning(` opener that
        # preceded this call left the parentheses unbalanced and is removed.
        log_once(
            logger.warning,
            "Exllama GPTQ cuda kernels (which are faster) could have been used, but are not currently installed, try using BUILD_EXTENSIONS=True",
        )
    # NOTE(review): the flattened original lost its indentation; this
    # assignment is placed at the `if not HAS_EXLLAMA` level so the flag is
    # cleared whenever the kernels are unavailable -- confirm against the
    # full file.
    use_exllama = False
# Placeholder kept from the original excerpt (code elided there).
...