2022-10-19 05:58:55 +02:00
""" task_manager.py: manage tasks dispatching and render threads.
Notes :
render_threads should be the only hard reference held by the manager to the threads .
Use weak_thread_data to store all other data using weak keys .
This will allow for garbage collection after the thread dies .
"""
2022-10-15 09:28:20 +02:00
import json
import traceback
2022-10-20 13:52:01 +02:00
# Lifetime, in seconds, granted to a cached task each time it is stored or refreshed in the task cache.
TASK_TTL = 15 * 60 # seconds, Discard last session's task timeout
2022-10-15 09:28:20 +02:00
2022-11-09 14:47:44 +01:00
import torch
2022-10-18 19:21:15 +02:00
import queue , threading , time , weakref
2022-10-15 09:28:20 +02:00
from typing import Any , Generator , Hashable , Optional , Union
from pydantic import BaseModel
2022-11-14 06:53:22 +01:00
from sd_internal import Request , Response , runtime , device_manager
2022-10-15 09:28:20 +02:00
2022-10-17 05:06:41 +02:00
# Prefix of every render thread's name; the device id is appended to it.
THREAD_NAME_PREFIX = ' Runtime-Render/ '

# Common tail of the exception message raised when a lock cannot be acquired in time.
ERR_LOCK_FAILED = ' failed to acquire lock within timeout. '

# Maximum locking time in seconds before failing a task.
# It's better to get an exception than a deadlock... ALWAYS use timeout in critical paths.
LOCK_TIMEOUT = 15

# seconds - Maximum time to wait for a render device to init.
DEVICE_START_TIMEOUT = 60

# seconds - Idle time before CPU unload resource when GPUs are present.
CPU_UNLOAD_TIMEOUT = 4 * 60
2022-10-28 02:27:21 +02:00
2022-10-15 09:28:20 +02:00
class SymbolClass(type):  # Print nicely formatted Symbol names.
    """Metaclass whose classes print as their own names."""

    def __repr__(cls):
        # Qualified name: includes any enclosing class.
        return cls.__qualname__

    def __str__(cls):
        # Short name only.
        return cls.__name__


class Symbol(metaclass=SymbolClass):
    """Base class for marker classes that are used as values themselves."""
class ServerStates:
    """Namespace holding the possible values of the module-level current_state."""

    class Init(Symbol):
        """Initial value of current_state."""

    class LoadingModel(Symbol):
        """Set while a model is being loaded."""

    class Online(Symbol):
        """Set once a model is loaded and after a task finishes."""

    class Rendering(Symbol):
        """Set while a task's results are being produced."""

    class Unavailable(Symbol):
        """Set when model loading fails or shutdown has been signalled."""
class RenderTask():  # Task with output queue and completion lock.
    """A queued request together with its latest response, error and output buffers."""

    def __init__(self, req: Request):
        # One image slot per output, doubled unless only the filtered image is shown.
        slots_per_output = 1 if req.show_only_filtered_image else 2

        self.request: Request = req  # Initial Request
        self.response: Any = None  # Copy of the last response
        self.render_device = None  # Select the task affinity. (Not used to change active devices).
        self.temp_images: list = [None] * req.num_outputs * slots_per_output
        self.error: Exception = None
        # Locks at task start and unlocks when task is completed
        self.lock: threading.Lock = threading.Lock()
        # Queue of JSON string segments
        self.buffer_queue: queue.Queue = queue.Queue()

    async def read_buffer_generator(self):
        """Yield, one by one, the segments currently waiting in buffer_queue.

        Iteration ends as soon as the queue reports empty. If a non-blocking
        read still finds nothing, a single None is yielded instead.
        """
        try:
            while not self.buffer_queue.empty():
                segment = self.buffer_queue.get_nowait()
                self.buffer_queue.task_done()
                yield segment
        except queue.Empty:
            yield
# defaults from https://huggingface.co/blog/stable_diffusion
class ImageRequest(BaseModel):
    # Incoming image-generation request. render() copies most of these fields
    # onto the internal Request object before queueing a task.

    # -- session and prompt --
    session_id: str = " session "
    prompt: str = " "
    negative_prompt: str = " "

    # -- optional source images --
    init_image: str = None  # base64
    mask: str = None  # base64

    # -- generation parameters --
    num_outputs: int = 1
    num_inference_steps: int = 50
    guidance_scale: float = 7.5
    width: int = 512
    height: int = 512
    seed: int = 42
    prompt_strength: float = 0.8
    sampler: str = None  # "ddim", "plms", "heun", "euler", "euler_a", "dpm2", "dpm2_a", "lms"
    # allow_nsfw: bool = False
    save_to_disk_path: str = None

    # -- device and precision --
    turbo: bool = True
    use_cpu: bool = False  ##TODO Remove after UI and plugins transition.
    render_device: str = None
    use_full_precision: bool = False

    # -- models and filters --
    use_face_correction: str = None  # or "GFPGANv1.3"
    use_upscale: str = None  # or "RealESRGAN_x4plus" or "RealESRGAN_x4plus_anime_6B"
    use_stable_diffusion_model: str = " sd-v1-4 "
    use_vae_model: str = None

    # -- output and streaming --
    show_only_filtered_image: bool = False
    output_format: str = " jpeg "  # or "png"
    stream_progress_updates: bool = False
    stream_image_progress: bool = False
2022-10-17 03:41:39 +02:00
class FilterRequest(BaseModel):
    # Incoming request to apply a named filter model to an existing image.

    # -- session and filter selection --
    session_id: str = " session "
    model: str = None
    name: str = " "

    # -- source image --
    init_image: str = None  # base64
    width: int = 512
    height: int = 512
    save_to_disk_path: str = None

    # -- device and precision --
    turbo: bool = True
    render_device: str = None
    use_full_precision: bool = False

    # -- output --
    output_format: str = " jpeg "  # or "png"
2022-10-15 09:28:20 +02:00
# Temporary cache to allow to query tasks results for a short time after they are completed.
class TaskCache():
    """Lock-protected dictionary whose entries expire.

    Every key of ``_base`` maps to an ``(expiry_timestamp, value)`` tuple.
    Each public method takes ``_lock`` first and raises an Exception when the
    lock cannot be obtained within LOCK_TIMEOUT seconds.
    """

    def __init__(self):
        self._base = dict()
        self._lock: threading.Lock = threading.Lock()

    def _acquire(self, caller: str) -> None:
        """Take the cache lock, or raise an Exception whose message starts with *caller*."""
        if not self._lock.acquire(blocking=True, timeout=LOCK_TIMEOUT):
            raise Exception(caller + ERR_LOCK_FAILED)

    def _get_ttl_time(self, ttl: int) -> int:
        """Return the timestamp (whole seconds) that lies *ttl* seconds from now."""
        now = int(time.time())
        return now + ttl

    def _is_expired(self, timestamp: int) -> bool:
        """Tell whether *timestamp* has been reached."""
        now = int(time.time())
        return now >= timestamp

    def clean(self) -> None:
        """Drop every expired entry, printing one line per removed key."""
        self._acquire(' TaskCache.clean ')
        try:
            # Collect first: the dictionary must not change size while being iterated.
            expired_keys = [
                key for key, (expiry, _) in self._base.items()
                if self._is_expired(expiry)
            ]
            for key in expired_keys:
                del self._base[key]
                print(f' Session { key } expired. Data removed. ')
        finally:
            self._lock.release()

    def clear(self) -> None:
        """Remove all entries."""
        self._acquire(' TaskCache.clear ')
        try:
            self._base.clear()
        finally:
            self._lock.release()

    def delete(self, key: Hashable) -> bool:
        """Remove *key*; return True if it was present, False otherwise."""
        self._acquire(' TaskCache.delete ')
        try:
            if key in self._base:
                del self._base[key]
                return True
            return False
        finally:
            self._lock.release()

    def keep(self, key: Hashable, ttl: int) -> bool:
        """Give an existing entry a fresh expiry *ttl* seconds from now.

        Returns False, without creating anything, when *key* is not stored.
        """
        self._acquire(' TaskCache.keep ')
        try:
            if key not in self._base:
                return False
            _, value = self._base[key]
            self._base[key] = (self._get_ttl_time(ttl), value)
            return True
        finally:
            self._lock.release()

    def put(self, key: Hashable, value: Any, ttl: int) -> bool:
        """Store *value* under *key* for *ttl* seconds.

        Returns True on success. A failure while storing is printed together
        with its traceback and reported as False.
        """
        self._acquire(' TaskCache.put ')
        stored = False
        try:
            self._base[key] = (self._get_ttl_time(ttl), value)
            stored = True
        except Exception as e:
            print(str(e))
            print(traceback.format_exc())
        finally:
            self._lock.release()
        return stored

    def tryGet(self, key: Hashable) -> Any:
        """Return the value stored under *key*, or None when missing or expired.

        An expired entry is deleted on the way out.
        """
        self._acquire(' TaskCache.tryGet ')
        try:
            expiry, value = self._base.get(key, (None, None))
            if expiry is None or not self._is_expired(expiry):
                return value
            print(f' Session { key } expired. Discarding data. ')
            del self._base[key]
            return None
        finally:
            self._lock.release()
2022-10-17 07:05:27 +02:00
# Re-entrant lock taken before render_threads or tasks_queue is read or changed.
manager_lock = threading.RLock()

# The render threads; per the module notes, the only hard references to them.
render_threads: list = []

# Server-wide status, the last error behind it, and the model / VAE recorded as loaded.
current_state = ServerStates.Init
current_state_error: Exception = None
current_model_path = None
current_vae_path = None

# Tasks waiting to be picked up by a render thread.
tasks_queue: list = []

# Tasks stored by session id, each with a time-to-live.
task_cache = TaskCache()

# Model / VAE used by preload_model() when it is called without arguments.
default_model_to_load = None
default_vae_to_load = None

# Per-thread data keyed weakly by thread object, so it goes away with the thread.
weak_thread_data = weakref.WeakKeyDictionary()
2022-10-15 09:28:20 +02:00
2022-10-28 16:36:44 +02:00
def preload_model(ckpt_file_path=None, vae_file_path=None):
    """Load a model checkpoint (and VAE) and record the outcome in the module state.

    Args:
        ckpt_file_path: checkpoint to load; None selects default_model_to_load.
        vae_file_path: VAE to load; None selects default_vae_to_load.

    Nothing happens when the requested pair equals the one already recorded as
    current. Otherwise current_state becomes LoadingModel for the duration of
    the load and ends as Online on success. On failure the exception is stored
    in current_state_error, the current paths are reset to None, the state
    becomes Unavailable and the traceback is printed; nothing is raised.
    """
    global current_state, current_state_error, current_model_path, current_vae_path
    # Identity test: None is a singleton and must not go through __eq__.
    if ckpt_file_path is None:
        ckpt_file_path = default_model_to_load
    if vae_file_path is None:
        vae_file_path = default_vae_to_load
    if ckpt_file_path == current_model_path and vae_file_path == current_vae_path:
        return  # Already loaded, nothing to do.
    current_state = ServerStates.LoadingModel
    try:
        from . import runtime
        runtime.thread_data.ckpt_file = ckpt_file_path
        runtime.thread_data.vae_file = vae_file_path
        runtime.load_model_ckpt()
        current_model_path = ckpt_file_path
        current_vae_path = vae_file_path
        current_state_error = None
        current_state = ServerStates.Online
    except Exception as e:
        current_model_path = None
        current_vae_path = None
        current_state_error = e
        current_state = ServerStates.Unavailable
        print(traceback.format_exc())
2022-10-22 04:45:19 +02:00
def thread_get_next_task():
    """Pick, remove and return the first queued task the calling render thread may take.

    Returns None when the manager lock cannot be acquired, when the queue is
    empty, or when every queued task has to be left for another device.
    A returned task may already carry an ``error``; the caller is expected to
    report it instead of rendering.
    """
    from . import runtime
    if not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT):
        print(' Render thread on device ', runtime.thread_data.device, ' failed to acquire manager lock. ')
        return None
    try:
        if len(tasks_queue) <= 0:
            return None
        selected = None
        for candidate in tasks_queue:
            if candidate.request.use_face_correction and runtime.thread_data.device == ' cpu ' and is_alive() == 1:
                # Face correction was requested while the CPU is the only live device: fail the task.
                candidate.error = Exception(' The CPU cannot be used to run this task currently. Please remove " Fix incorrect faces " from Image Settings and try again. ')
                selected = candidate
                break
            if candidate.render_device and runtime.thread_data.device != candidate.render_device:
                # Is asking for a specific render device.
                if is_alive(candidate.render_device) > 0:
                    continue  # requested device alive, skip current one.
                # Requested device is not active, return error to UI.
                candidate.error = Exception(candidate.render_device + ' is not currently active. ')
                selected = candidate
                break
            if not candidate.render_device and runtime.thread_data.device == ' cpu ' and is_alive() > 1:
                # not asking for any specific devices, cpu want to grab task but other render devices are alive.
                continue  # Skip Tasks, don't run on CPU unless there is nothing else or user asked for it.
            selected = candidate
            break
        if selected is not None:
            tasks_queue.remove(selected)
        return selected
    finally:
        manager_lock.release()
2022-10-17 03:41:39 +02:00
def thread_render(device):
    """Body of a render thread: initialise *device*, then serve queued tasks until told to stop.

    Start-up:
        runtime.thread_init(device) is called first. If it raises, the
        exception is stored under the ' error ' key of this thread's
        weak_thread_data entry and the thread ends. Otherwise the entry
        receives the device, its name and an ' alive ' flag. The default model
        is preloaded unless this is the CPU thread and other render threads
        are alive.

    Main loop, once per iteration:
        * expired cache entries are cleaned;
        * the thread exits when its ' alive ' flag was cleared (models and
          filters are unloaded first) or when current_state_error is a
          SystemExit;
        * a task is fetched; with none available the thread sleeps one second;
        * a task that already has an error, or any task while
          current_state_error is set, is answered with a failed response;
        * otherwise the task lock is held while results of runtime.mk_img()
          are consumed, forwarded to the task's buffer queue and mirrored into
          task.response / task.temp_images.

    When rendering raises, the exception is stored in task.error and the
    traceback printed. The completion bookkeeping below the try block then
    still runs, so the failure is logged and current_state returns to Online.

    Raises:
        Exception: if a task taken from the queue is already locked.
    """
    global current_state, current_state_error, current_model_path, current_vae_path
    from . import runtime
    try:
        runtime.thread_init(device)
    except Exception as e:
        print(traceback.format_exc())
        # Publish the failure for whoever is waiting on this thread to come up.
        weak_thread_data[threading.current_thread()] = {
            ' error ': e
        }
        return
    weak_thread_data[threading.current_thread()] = {
        ' device ': runtime.thread_data.device,
        ' device_name ': runtime.thread_data.device_name,
        ' alive ': True
    }
    if runtime.thread_data.device != ' cpu ' or is_alive() == 1:
        preload_model()
        current_state = ServerStates.Online
    while True:
        task_cache.clean()
        if not weak_thread_data[threading.current_thread()][' alive ']:
            print(f' Shutting down thread for device { runtime.thread_data.device } ')
            runtime.unload_models()
            runtime.unload_filters()
            return
        if isinstance(current_state_error, SystemExit):
            current_state = ServerStates.Unavailable
            return
        task = thread_get_next_task()
        if task is None:
            time.sleep(1)
            continue
        if task.error is not None:
            # The task was rejected while being selected: report and move on.
            print(task.error)
            task.response = {" status ": ' failed ', " detail ": str(task.error)}
            task.buffer_queue.put(json.dumps(task.response))
            continue
        if current_state_error:
            # A server-wide error is pending: fail the task with it.
            task.error = current_state_error
            task.response = {" status ": ' failed ', " detail ": str(task.error)}
            task.buffer_queue.put(json.dumps(task.response))
            continue
        print(f' Session { task.request.session_id } starting task { id(task) } on { runtime.thread_data.device_name } ')
        if not task.lock.acquire(blocking=False): raise Exception(' Got locked task from queue. ')
        try:
            if runtime.thread_data.device == ' cpu ' and is_alive() > 1:
                # CPU is not the only device. Keep track of active time to unload resources later.
                runtime.thread_data.lastActive = time.time()
            # Open data generator.
            res = runtime.mk_img(task.request)
            if current_model_path == task.request.use_stable_diffusion_model:
                current_state = ServerStates.Rendering
            else:
                current_state = ServerStates.LoadingModel
            # Start reading from generator.
            dataQueue = None
            if task.request.stream_progress_updates:
                dataQueue = task.buffer_queue
            for result in res:
                if current_state == ServerStates.LoadingModel:
                    # First result after a model switch: record the new model as current.
                    current_state = ServerStates.Rendering
                    current_model_path = task.request.use_stable_diffusion_model
                    current_vae_path = task.request.use_vae_model
                if isinstance(current_state_error, SystemExit) or isinstance(current_state_error, StopAsyncIteration) or isinstance(task.error, StopAsyncIteration):
                    runtime.thread_data.stop_processing = True
                    if isinstance(current_state_error, StopAsyncIteration):
                        # Move the cancel signal from the server state onto the task.
                        task.error = current_state_error
                        current_state_error = None
                        print(f' Session { task.request.session_id } sent cancel signal for task { id(task) } ')
                if dataQueue:
                    dataQueue.put(result)
                if isinstance(result, str):
                    result = json.loads(result)
                task.response = result
                if ' output ' in result:
                    for out_obj in result[' output ']:
                        if ' path ' in out_obj:
                            # The image id is whatever follows the last separator of the path.
                            img_id = out_obj[' path '][out_obj[' path '].rindex(' / ') + 1:]
                            task.temp_images[int(img_id)] = runtime.thread_data.temp_images[out_obj[' path '][11:]]
                        elif ' data ' in out_obj:
                            buf = runtime.base64_str_to_buffer(out_obj[' data '])
                            task.temp_images[result[' output '].index(out_obj)] = buf
                # Before looping back to the generator, mark cache as still alive.
                task_cache.keep(task.request.session_id, TASK_TTL)
        except Exception as e:
            # Record the failure and fall through, so that the completion
            # bookkeeping below still runs and the server state is reset.
            task.error = e
            print(traceback.format_exc())
        finally:
            # Task completed
            task.lock.release()
        task_cache.keep(task.request.session_id, TASK_TTL)
        if isinstance(task.error, StopAsyncIteration):
            print(f' Session { task.request.session_id } task { id(task) } cancelled! ')
        elif task.error is not None:
            print(f' Session { task.request.session_id } task { id(task) } failed! ')
        else:
            print(f' Session { task.request.session_id } task { id(task) } completed by { runtime.thread_data.device_name }. ')
        current_state = ServerStates.Online
2022-10-22 19:52:13 +02:00
def get_cached_task(session_id: str, update_ttl: bool = False):
    """Return the task cached for *session_id*, or None if there is none.

    With *update_ttl* set, the entry's time-to-live is renewed first; when
    that renewal fails the task is already gone and None is returned.
    """
    if update_ttl:
        # By calling keep before tryGet, wont discard if was expired.
        refreshed = task_cache.keep(session_id, TASK_TTL)
        if not refreshed:
            # Failed to keep task, already gone.
            return None
    return task_cache.tryGet(session_id)
2022-10-29 23:33:44 +02:00
def get_devices():
    """Describe the usable render devices and the ones currently served by a live thread.

    Returns a dict with two sub-dicts keyed by device id: one for every
    compatible CUDA device plus the CPU, one for the devices of live render
    threads. Each value carries a name and, for CUDA devices, free and total
    memory divided by 10**9.

    Raises:
        Exception: if the manager lock cannot be acquired within LOCK_TIMEOUT.
    """
    def get_device_info(device):
        if device == ' cpu ':
            return {' name ': device_manager.get_processor_name()}
        free_bytes, total_bytes = torch.cuda.mem_get_info(device)
        unit = float(10 ** 9)
        free_scaled = free_bytes / unit
        total_scaled = total_bytes / unit
        return {
            ' name ': torch.cuda.get_device_name(device),
            ' mem_free ': free_scaled,
            ' mem_total ': total_scaled,
        }

    compatible = {}
    active = {}

    # list the compatible devices
    for index in range(torch.cuda.device_count()):
        cuda_id = f' cuda: { index } '
        if device_manager.is_device_compatible(cuda_id):
            compatible[cuda_id] = get_device_info(cuda_id)
    compatible[' cpu '] = get_device_info(' cpu ')

    # list the activated devices
    if not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT): raise Exception(' get_devices ' + ERR_LOCK_FAILED)
    try:
        for rthread in render_threads:
            if not rthread.is_alive():
                continue
            weak_data = weak_thread_data.get(rthread)
            if not weak_data or ' device ' not in weak_data or ' device_name ' not in weak_data:
                continue
            thread_device = weak_data[' device ']
            active[thread_device] = get_device_info(thread_device)
    finally:
        manager_lock.release()

    return {
        ' all ': compatible,
        ' active ': active,
    }
2022-11-10 15:33:11 +01:00
def is_alive(device=None):
    """Count the render threads that are alive.

    Args:
        device: when given, only threads whose recorded device equals it are
            counted; threads without a recorded device are ignored.

    Raises:
        Exception: if the manager lock cannot be acquired within LOCK_TIMEOUT.
    """
    if not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT): raise Exception(' is_alive ' + ERR_LOCK_FAILED)
    try:
        def runs_on_requested_device(rthread):
            # Without a device filter every thread qualifies.
            if device is None:
                return True
            weak_data = weak_thread_data.get(rthread)
            if weak_data is None or ' device ' not in weak_data or weak_data[' device '] is None:
                return False
            return weak_data[' device '] == device

        return sum(
            1 for rthread in render_threads
            if runs_on_requested_device(rthread) and rthread.is_alive()
        )
    finally:
        manager_lock.release()
2022-10-15 09:28:20 +02:00
2022-11-14 06:53:22 +01:00
def start_render_thread(device):
    """Start a daemon render thread for *device* and wait until it has come up.

    The thread is registered in render_threads under the manager lock. The
    caller is then blocked, polling once per second for at most
    DEVICE_START_TIMEOUT seconds, until the thread is alive and has recorded
    its device in weak_thread_data.

    Returns:
        True once the thread has published its device; False if it published
        an error instead or the wait timed out.

    Raises:
        Exception: if the manager lock cannot be acquired within LOCK_TIMEOUT.
    """
    if not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT): raise Exception(' start_render_thread ' + ERR_LOCK_FAILED)
    try:
        print(' Start new Rendering Thread on device ', device)
        # The device is handed over positionally, so the call cannot break on a
        # keyword that does not match thread_render's parameter name.
        rthread = threading.Thread(target=thread_render, args=(device,))
        rthread.daemon = True
        rthread.name = THREAD_NAME_PREFIX + device
        rthread.start()
        render_threads.append(rthread)
    finally:
        manager_lock.release()
    timeout = DEVICE_START_TIMEOUT
    while not rthread.is_alive() or rthread not in weak_thread_data or ' device ' not in weak_thread_data[rthread]:
        if rthread in weak_thread_data and ' error ' in weak_thread_data[rthread]:
            # The thread gave up during initialisation and left its exception behind.
            print(rthread, device, ' error: ', weak_thread_data[rthread][' error '])
            return False
        if timeout <= 0:
            return False
        timeout -= 1
        time.sleep(1)
    return True
2022-10-15 09:28:20 +02:00
2022-11-14 06:53:22 +01:00
def stop_render_thread(device):
    """Ask the render thread serving *device* to stop and unregister it.

    The thread's ' alive ' flag in weak_thread_data is cleared and the thread
    is removed from render_threads; the thread itself is not joined here.

    Returns:
        True if a matching thread was found and unregistered. False if the
        device id fails validation (the traceback is printed) or no registered
        thread has recorded that device.

    Raises:
        Exception: if the manager lock cannot be acquired within LOCK_TIMEOUT.
    """
    try:
        device_manager.validate_device_id(device, log_prefix=' stop_render_thread ')
    except Exception:
        # traceback.format_exc() is the real API; the misspelt call used here
        # before raised AttributeError instead of reporting the failure.
        print(traceback.format_exc())
        return False
    if not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT): raise Exception(' stop_render_thread ' + ERR_LOCK_FAILED)
    try:
        print(' Stopping Rendering Thread on device ', device)
        thread_to_remove = None
        for rthread in render_threads:
            weak_data = weak_thread_data.get(rthread)
            if weak_data is None or ' device ' not in weak_data or weak_data[' device '] is None:
                continue
            if weak_data[' device '] == device:
                weak_data[' alive '] = False
                thread_to_remove = rthread
                break
        if thread_to_remove is not None:
            # Remove the thread that was matched, not whatever the loop variable holds.
            render_threads.remove(thread_to_remove)
            return True
    finally:
        manager_lock.release()
    return False
def update_render_threads(render_devices, active_devices):
    """Stop and start render threads to move from *active_devices* to *render_devices*.

    The lists of devices to start and to stop come from
    device_manager.get_device_delta(). Individual failures are only printed.

    Raises:
        EnvironmentError: if no render thread is alive afterwards.
    """
    devices_to_start, devices_to_stop = device_manager.get_device_delta(render_devices, active_devices)
    print(' devices_to_start ', devices_to_start)
    print(' devices_to_stop ', devices_to_stop)

    for device in devices_to_stop:
        if is_alive(device) > 0:
            stopped = stop_render_thread(device)
            if not stopped:
                print(device, ' could not stop render thread ')
        else:
            print(device, ' is not alive ')

    for device in devices_to_start:
        if is_alive(device) < 1:
            started = start_render_thread(device)
            if not started:
                print(device, ' failed to start. ')
        else:
            print(device, ' already registered. ')

    if is_alive() <= 0:  # No running devices, probably invalid user config.
        raise EnvironmentError(' ERROR: No active render devices! Please verify the " render_devices " value in config.json ')

    print(' active devices ', get_devices()[' active '])
2022-10-15 09:28:20 +02:00
def shutdown_event():  # Signal render thread to close on shutdown
    """Store a SystemExit in current_state_error, which render threads check in their loop."""
    global current_state_error
    shutdown_signal = SystemExit(' Application shutting down. ')
    current_state_error = shutdown_signal
def render(req: ImageRequest):
    """Turn *req* into a RenderTask, cache it under its session id and queue it.

    Returns:
        The newly queued RenderTask.

    Raises:
        ChildProcessError: if no render thread is alive.
        ConnectionRefusedError: if the session already has a task that has
            neither started, responded nor failed.
        RuntimeError: if the task could not be cached or the manager lock
            could not be acquired to queue it.
    """
    if is_alive() <= 0:  # Render thread is dead
        raise ChildProcessError(' Rendering thread has died. ')

    # Alive, check if task in cache
    task = task_cache.tryGet(req.session_id)
    if task and not task.response and not task.error and not task.lock.locked():
        # Unstarted task pending, deny queueing more than one.
        raise ConnectionRefusedError(f' Session { req.session_id } has an already pending task. ')

    from . import runtime

    # Fields copied unchanged from the incoming request, in this order.
    # (allow_nsfw is intentionally not forwarded.)
    copied_fields = (
        'session_id', 'prompt', 'negative_prompt', 'init_image', 'mask',
        'num_outputs', 'num_inference_steps', 'guidance_scale',
        'width', 'height', 'seed', 'prompt_strength', 'sampler',
        'turbo', 'use_full_precision', 'save_to_disk_path',
        'use_upscale', 'use_face_correction',
        'use_stable_diffusion_model', 'use_vae_model',
        'show_only_filtered_image', 'output_format',
    )
    r = Request()
    for field_name in copied_fields:
        setattr(r, field_name, getattr(req, field_name))

    r.stream_progress_updates = True  # the underlying implementation only supports streaming
    # Image previews are only streamed when the caller asked for progress updates at all.
    r.stream_image_progress = req.stream_image_progress if req.stream_progress_updates else False

    new_task = RenderTask(r)

    # Use twice the normal timeout for adding user requests.
    # Tries to force task_cache.put to fail before tasks_queue.put would.
    if not task_cache.put(r.session_id, new_task, TASK_TTL) or not manager_lock.acquire(blocking=True, timeout=LOCK_TIMEOUT * 2):
        raise RuntimeError(' Failed to add task to cache. ')
    try:
        tasks_queue.append(new_task)
        return new_task
    finally:
        manager_lock.release()