stable-diffusion-webui/modules/call_queue.py

from functools import wraps
import html
import threading
import time

from modules import shared, progress, errors, devices

# Module-wide lock. The wrappers in this file that acquire it run their wrapped
# call while holding it, so those calls execute one at a time.
queue_lock = threading.Lock()


def wrap_queued_call(func):
    """Return a callable that runs ``func`` while holding ``queue_lock``.

    Positional and keyword arguments are forwarded unchanged and the return
    value of ``func`` is passed back to the caller. The lock is released when
    ``func`` returns or raises.
    """

    # The inner function is intentionally left without functools.wraps and
    # without a docstring so its visible metadata stays exactly as before.
    def f(*args, **kwargs):
        with queue_lock:
            return func(*args, **kwargs)

    return f


def wrap_gradio_gpu_call(func, extra_outputs=None):
    """Wrap ``func`` so it runs under ``queue_lock`` with task/progress bookkeeping.

    The returned callable is additionally passed through ``wrap_gradio_call``
    with ``add_stats=True``; ``extra_outputs`` is forwarded to that wrapper.

    Args:
        func: The callable to run. All positional and keyword arguments are
            forwarded to it unchanged, including a leading task id if present.
        extra_outputs: Forwarded to ``wrap_gradio_call``.

    Returns:
        The result of ``wrap_gradio_call`` applied to the locking wrapper.
    """

    @wraps(func)
    def f(*args, **kwargs):
        # A first positional argument that is a plain str of the form
        # "task(...)" is treated as the job id; otherwise there is no job id.
        id_task = None
        if args:
            candidate = args[0]
            if type(candidate) is str and candidate.startswith("task(") and candidate.endswith(")"):
                id_task = candidate
                # Registered before waiting for the lock.
                progress.add_task_to_queue(id_task)

        with queue_lock:
            shared.state.begin(job=id_task)
            progress.start_task(id_task)

            try:
                res = func(*args, **kwargs)
                progress.record_results(id_task, res)
            finally:
                # Runs whether or not func (or record_results) raised.
                progress.finish_task(id_task)

            # Only reached when no exception escaped the try block above.
            shared.state.end()

        return res

    return wrap_gradio_call(f, extra_outputs=extra_outputs, add_stats=True)


def wrap_gradio_call(func, extra_outputs=None, add_stats=False):
    """Wrap ``func`` so that a failure becomes an HTML error output.

    The returned callable runs ``func``, converts its result to a list and
    returns it as a tuple. If ``func`` raises an ``Exception``, the error is
    reported through ``errors.report`` together with a length-capped dump of
    the call arguments, ``shared.state.job`` / ``job_count`` are cleared, and
    the result becomes the extra outputs followed by a
    ``<div class='error'>`` element holding the HTML-escaped exception text.

    In both cases ``devices.torch_gc()`` is called and the ``skipped``,
    ``interrupted`` and ``job_count`` fields of ``shared.state`` are reset.

    Args:
        func: Callable returning an iterable of outputs. When ``add_stats``
            is true, the last output must support ``+=`` with a string,
            because the performance HTML is appended to it.
        extra_outputs: Outputs placed before the error HTML when ``func``
            fails. ``None`` means ``[None, '']``.
        add_stats: When true, append a "Time taken" block to the last output,
            plus memory figures if the memory monitor is enabled.

    Returns:
        The wrapping callable. Besides the arguments forwarded to ``func`` it
        accepts the keyword-only ``extra_outputs_array``, which defaults to
        ``extra_outputs`` and is not forwarded to ``func``.
    """

    @wraps(func)
    def f(*args, extra_outputs_array=extra_outputs, **kwargs):
        # Memory monitoring is only used when stats were requested.
        run_memmon = shared.opts.memmon_poll_rate > 0 and not shared.mem_mon.disabled and add_stats
        if run_memmon:
            shared.mem_mon.monitor()
        t = time.perf_counter()

        try:
            res = list(func(*args, **kwargs))
        except Exception as e:
            # When logging the debug argument list, cap it at
            # 131072 (128 Ki) characters.
            max_debug_str_len = 131072
            message = "Error completing request"
            arg_str = f"Arguments: {args} {kwargs}"
            full_len = len(arg_str)
            if full_len > max_debug_str_len:
                # Measure before slicing: a sliced string can never be longer
                # than the limit, so checking afterwards would never report
                # the truncation.
                arg_str = (
                    f"{arg_str[:max_debug_str_len]}"
                    f" (Argument list truncated at {max_debug_str_len}/{full_len} characters)"
                )
            errors.report(f"{message}\n{arg_str}", exc_info=True)

            shared.state.job = ""
            shared.state.job_count = 0

            if extra_outputs_array is None:
                extra_outputs_array = [None, '']

            error_message = f'{type(e).__name__}: {e}'
            # list(...) copies the extra outputs and also accepts a tuple, so
            # the error path itself cannot fail on concatenation.
            res = list(extra_outputs_array) + [f"<div class='error'>{html.escape(error_message)}</div>"]

        devices.torch_gc()

        shared.state.skipped = False
        shared.state.interrupted = False
        shared.state.job_count = 0

        if not add_stats:
            return tuple(res)

        # Split the elapsed wall time into whole minutes and remaining seconds.
        elapsed = time.perf_counter() - t
        elapsed_m = int(elapsed // 60)
        elapsed_s = elapsed % 60
        elapsed_text = f"{elapsed_s:.1f} sec."
        if elapsed_m > 0:
            elapsed_text = f"{elapsed_m} min. " + elapsed_text

        if run_memmon:
            # -(v // -d) is ceiling division: each raw value is divided by
            # 1024*1024 and rounded up (presumably bytes -> MiB; confirm
            # against the memory monitor). The later /1024 is labelled GB.
            mem_stats = {k: -(v//-(1024*1024)) for k, v in shared.mem_mon.stop().items()}
            active_peak = mem_stats['active_peak']
            reserved_peak = mem_stats['reserved_peak']
            sys_peak = mem_stats['system_peak']
            sys_total = mem_stats['total']
            # max(..., 1) guards against division by zero when total is 0.
            sys_pct = sys_peak/max(sys_total, 1) * 100

            # Tooltip texts are user-visible and kept byte-for-byte.
            tooltip_a = "Active: peak amount of video memory used during generation (excluding cached data)"
            tooltip_r = "Reserved: total amout of video memory allocated by the Torch library "
            tooltip_sys = "System: peak amout of video memory allocated by all running programs, out of total capacity"

            text_a = f"<abbr title='{tooltip_a}'>A</abbr>: <span class='measurement'>{active_peak/1024:.2f} GB</span>"
            text_r = f"<abbr title='{tooltip_r}'>R</abbr>: <span class='measurement'>{reserved_peak/1024:.2f} GB</span>"
            text_sys = f"<abbr title='{tooltip_sys}'>Sys</abbr>: <span class='measurement'>{sys_peak/1024:.1f}/{sys_total/1024:g} GB</span> ({sys_pct:.1f}%)"

            vram_html = f"<p class='vram'>{text_a}, <wbr>{text_r}, <wbr>{text_sys}</p>"
        else:
            vram_html = ''

        # last item is always HTML
        res[-1] += f"<div class='performance'><p class='time'>Time taken: <wbr><span class='measurement'>{elapsed_text}</span></p>{vram_html}</div>"

        return tuple(res)

    return f
Fix gradio special args in the call queue 2023-06-14 21:53:13 +03:00			`from functools import wraps`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`import html`
			`import threading`
			`import time`

fix memory leak when generation fails 2023-07-31 22:01:53 +03:00			`from modules import shared, progress, errors, devices`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`queue_lock = threading.Lock()`

replace with #wrap_session_call 2023-04-17 06:50:08 +03:00
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`def wrap_queued_call(func):`
			`def f(*args, **kwargs):`
			`with queue_lock:`
			`res = func(*args, **kwargs)`

			`return res`

			`return f`


			`def wrap_gradio_gpu_call(func, extra_outputs=None):`
Fix gradio special args in the call queue 2023-06-14 21:53:13 +03:00			`@wraps(func)`
Revert "Merge pull request #7595 from siutin/feature/restore-progress" This reverts commit 80987c36f9bfa33092ac7c75624b25d839cb2a06, reversing changes made to 2e78e65a22bfa6b116ae18d12fdcb85ec8acd727. 2023-04-29 22:15:20 +03:00			`def f(*args, **kwargs):`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00			`# if the first argument is a string that says "task(...)", it is treated as a job id`
Simplify a bunch of `len(x) > 0`/`len(x) == 0` style expressions 2023-06-02 14:58:10 +03:00			`if args and type(args[0]) == str and args[0].startswith("task(") and args[0].endswith(")"):`
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00			`id_task = args[0]`
Revert "Merge pull request #7595 from siutin/feature/restore-progress" This reverts commit 80987c36f9bfa33092ac7c75624b25d839cb2a06, reversing changes made to 2e78e65a22bfa6b116ae18d12fdcb85ec8acd727. 2023-04-29 22:15:20 +03:00			`progress.add_task_to_queue(id_task)`
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00			`else:`
			`id_task = None`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`with queue_lock:`
Add job argument to State.begin() 2023-06-30 13:11:31 +03:00			`shared.state.begin(job=id_task)`
Revert "Merge pull request #7595 from siutin/feature/restore-progress" This reverts commit 80987c36f9bfa33092ac7c75624b25d839cb2a06, reversing changes made to 2e78e65a22bfa6b116ae18d12fdcb85ec8acd727. 2023-04-29 22:15:20 +03:00			`progress.start_task(id_task)`
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00
			`try:`
			`res = func(*args, **kwargs)`
alternate restore progress button implementation 2023-04-29 22:16:54 +03:00			`progress.record_results(id_task, res)`
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00			`finally:`
Revert "Merge pull request #7595 from siutin/feature/restore-progress" This reverts commit 80987c36f9bfa33092ac7c75624b25d839cb2a06, reversing changes made to 2e78e65a22bfa6b116ae18d12fdcb85ec8acd727. 2023-04-29 22:15:20 +03:00			`progress.finish_task(id_task)`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
big rework of progressbar/preview system to allow multiple users to prompts at the same time and do not get previews of each other 2023-01-15 18:50:56 +03:00			`shared.state.end()`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`return res`

Revert "Merge pull request #7595 from siutin/feature/restore-progress" This reverts commit 80987c36f9bfa33092ac7c75624b25d839cb2a06, reversing changes made to 2e78e65a22bfa6b116ae18d12fdcb85ec8acd727. 2023-04-29 22:15:20 +03:00			`return wrap_gradio_call(f, extra_outputs=extra_outputs, add_stats=True)`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00

replace with #wrap_session_call 2023-04-17 06:50:08 +03:00			`def wrap_gradio_call(func, extra_outputs=None, add_stats=False):`
Fix gradio special args in the call queue 2023-06-14 21:53:13 +03:00			`@wraps(func)`
replace with #wrap_session_call 2023-04-17 06:50:08 +03:00			`def f(*args, extra_outputs_array=extra_outputs, **kwargs):`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`run_memmon = shared.opts.memmon_poll_rate > 0 and not shared.mem_mon.disabled and add_stats`
			`if run_memmon:`
			`shared.mem_mon.monitor()`
			`t = time.perf_counter()`

			`try:`
replace with #wrap_session_call 2023-04-17 06:50:08 +03:00			`res = list(func(*args, **kwargs))`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`except Exception as e:`
Add & use modules.errors.print_error where currently printing exception info by hand 2023-05-29 08:54:13 +03:00			`# When printing out our debug argument list,`
			`# do not print out more than a 100 KB of text`
			`max_debug_str_len = 131072`
			`message = "Error completing request"`
			`arg_str = f"Arguments: {args} {kwargs}"[:max_debug_str_len]`
			`if len(arg_str) > max_debug_str_len:`
			`arg_str += f" (Argument list truncated at {max_debug_str_len}/{len(arg_str)} characters)"`
rename print_error to report, use it with together with package name 2023-05-31 19:56:37 +03:00			`errors.report(f"{message}\n{arg_str}", exc_info=True)`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`shared.state.job = ""`
			`shared.state.job_count = 0`

			`if extra_outputs_array is None:`
			`extra_outputs_array = [None, '']`

Fix up string formatting/concatenation to f-strings where feasible 2023-05-09 22:17:58 +03:00			`error_message = f'{type(e).__name__}: {e}'`
			`res = extra_outputs_array + [f"<div class='error'>{html.escape(error_message)}</div>"]`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
fix memory leak when generation fails 2023-07-31 22:01:53 +03:00			`devices.torch_gc()`

fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`shared.state.skipped = False`
			`shared.state.interrupted = False`
			`shared.state.job_count = 0`

			`if not add_stats:`
			`return tuple(res)`

			`elapsed = time.perf_counter() - t`
			`elapsed_m = int(elapsed // 60)`
			`elapsed_s = elapsed % 60`
restyle time taken/VRAM display 2023-07-14 22:51:58 +03:00			`elapsed_text = f"{elapsed_s:.1f} sec."`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`if elapsed_m > 0:`
restyle time taken/VRAM display 2023-07-14 22:51:58 +03:00			`elapsed_text = f"{elapsed_m} min. "+elapsed_text`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`if run_memmon:`
			`mem_stats = {k: -(v//-(1024*1024)) for k, v in shared.mem_mon.stop().items()}`
			`active_peak = mem_stats['active_peak']`
			`reserved_peak = mem_stats['reserved_peak']`
			`sys_peak = mem_stats['system_peak']`
			`sys_total = mem_stats['total']`
restyle time taken/VRAM display 2023-07-14 22:51:58 +03:00			`sys_pct = sys_peak/max(sys_total, 1) * 100`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
restyle time taken/VRAM display 2023-07-14 22:51:58 +03:00			`toltip_a = "Active: peak amount of video memory used during generation (excluding cached data)"`
			`toltip_r = "Reserved: total amout of video memory allocated by the Torch library "`
			`toltip_sys = "System: peak amout of video memory allocated by all running programs, out of total capacity"`

			`text_a = f"<abbr title='{toltip_a}'>A</abbr>: <span class='measurement'>{active_peak/1024:.2f} GB</span>"`
			`text_r = f"<abbr title='{toltip_r}'>R</abbr>: <span class='measurement'>{reserved_peak/1024:.2f} GB</span>"`
			`text_sys = f"<abbr title='{toltip_sys}'>Sys</abbr>: <span class='measurement'>{sys_peak/1024:.1f}/{sys_total/1024:g} GB</span> ({sys_pct:.1f}%)"`

			`vram_html = f"<p class='vram'>{text_a}, <wbr>{text_r}, <wbr>{text_sys}</p>"`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00			`else:`
			`vram_html = ''`

			`# last item is always HTML`
restyle time taken/VRAM display 2023-07-14 22:51:58 +03:00			`res[-1] += f"<div class='performance'><p class='time'>Time taken: <wbr><span class='measurement'>{elapsed_text}</span></p>{vram_html}</div>"`
fix an error that happens when you type into prompt while switching model, put queue stuff into separate file 2022-11-28 09:00:10 +03:00
			`return tuple(res)`

			`return f`