import html
import threading
import time
import cProfile
from modules import shared, progress, errors, timer


# Single module-wide lock: every wrapped call below runs while holding it,
# so wrapped functions execute one at a time.
queue_lock = threading.Lock()


def wrap_queued_call(func):
    """Return a wrapper that calls ``func`` while holding ``queue_lock``.

    Arguments and the return value are passed through unchanged.
    """
    def f(*args, **kwargs):
        with queue_lock:
            return func(*args, **kwargs)
    return f


def wrap_gradio_gpu_call(func, extra_outputs=None, name=None):
    """Wrap ``func`` with queueing, progress tracking and error reporting.

    The returned callable registers the call with ``progress`` (when the first
    positional argument looks like ``"task(...)"``), runs ``func`` under
    ``queue_lock`` and is itself wrapped by ``wrap_gradio_call`` with
    ``add_stats=True``.

    Args:
        func: callable to run.
        extra_outputs: forwarded to ``wrap_gradio_call``.
        name: job name; defaults to ``func.__name__``.
    """
    name = name or func.__name__

    def f(*args, **kwargs):
        # if the first argument is a string that says "task(...)", it is treated as a job id
        first = args[0] if args else None
        if isinstance(first, str) and first.startswith("task(") and first.endswith(")"):
            id_task = first
            progress.add_task_to_queue(id_task)
        else:
            id_task = None
        with queue_lock:
            progress.start_task(id_task)
            res = [None, '', '', '']
            try:
                res = func(*args, **kwargs)
                progress.record_results(id_task, res)
            except Exception as e:
                shared.log.error(f"Exception: {e}")
                shared.log.error(f"Arguments: args={str(args)[:10240]} kwargs={str(kwargs)[:10240]}")
                errors.display(e, 'gradio call')
                # func may already have returned a tuple/None/empty result before
                # record_results failed; make sure there is a mutable last slot
                # so reporting the error cannot raise a second exception.
                if not isinstance(res, list) or not res:
                    res = list(res) if isinstance(res, tuple) and res else [None, '', '', '']
                res[-1] = f"\n{html.escape(str(e))}\n"
            finally:
                progress.finish_task(id_task)
        return res

    return wrap_gradio_call(f, extra_outputs=extra_outputs, add_stats=True, name=name)


def wrap_gradio_call(func, extra_outputs=None, add_stats=False, name=None):
    """Wrap ``func`` with job-state bookkeeping, error capture and optional stats.

    The returned callable resets the memory monitor, marks the job as started
    and ended on ``shared.state``, optionally profiles the call, and converts
    any exception into an escaped error message placed in the last output.

    Args:
        func: callable to run; its result is converted to a list and returned
            as a tuple. A ``None`` result is replaced by a warning message.
        extra_outputs: outputs placed before the error message when ``func``
            raises; defaults to ``[None, '']``.
        add_stats: when true, append timing and memory statistics to the last
            output.
        name: job name; defaults to ``func.__name__``.

    Returns:
        A callable returning a tuple of outputs.
    """
    job_name = name if name is not None else func.__name__

    def f(*args, extra_outputs_array=extra_outputs, **kwargs):
        t = time.perf_counter()
        shared.mem_mon.reset()
        shared.state.begin(job_name)
        try:
            pr = None
            if shared.cmd_opts.profile:
                pr = cProfile.Profile()
                pr.enable()
            try:
                res = func(*args, **kwargs)
                if res is None:
                    msg = "No result returned from function"
                    shared.log.warning(msg)
                    res = [None, '', '', f"\n{html.escape(msg)}\n"]
                else:
                    res = list(res)
            finally:
                # Always stop the profiler, including when func raises; a
                # profiler left enabled would keep collecting after this call.
                if pr is not None:
                    pr.disable()
            if pr is not None:
                errors.profile(pr, 'Wrap')
        except Exception as e:
            errors.display(e, 'gradio call')
            if extra_outputs_array is None:
                extra_outputs_array = [None, '']
            # list(...) so a tuple of extra outputs can be concatenated as well
            res = list(extra_outputs_array) + [f"\n{html.escape(type(e).__name__+': '+str(e))}\n"]
        shared.state.end()
        if not add_stats:
            return tuple(res)

        elapsed = time.perf_counter() - t
        elapsed_m = int(elapsed // 60)
        elapsed_s = elapsed % 60
        elapsed_text = f"{elapsed_m}m {elapsed_s:.2f}s" if elapsed_m > 0 else f"{elapsed_s:.2f}s"
        summary = timer.process.summary(min_time=0.25, total=False).replace('=', ' ')
        gpu = ''
        cpu = ''
        if not shared.mem_mon.disabled:
            mem_mon_read = shared.mem_mon.read()
            # counters are removed before the byte -> MB conversion below;
            # default to 0 when the monitor does not report them
            ooms = mem_mon_read.pop("oom", 0)
            retries = mem_mon_read.pop("retries", 0)
            vram = {k: v//1048576 for k, v in mem_mon_read.items()}
            if 'active_peak' in vram:
                peak = max(vram['active_peak'], vram.get('reserved_peak', 0), vram.get('used', 0))
                total = vram.get('total', 0)
                used = round(100.0 * peak / total) if total > 0 else 0
            else:
                peak = 0
                used = 0
            if peak > 0:
                gpu += f"| GPU {peak} MB"
                gpu += f" {used}%" if used > 0 else ''
                gpu += f" | retries {retries} oom {ooms}" if retries > 0 or ooms > 0 else ''
            # NOTE(review): RAM stats are gathered only when memory monitoring
            # is enabled - confirm this nesting is the intended one.
            ram = shared.ram_stats()
            if ram['used'] > 0:
                cpu += f"| RAM {ram['used']} GB"
                cpu += f" {round(100.0 * ram['used'] / ram['total'])}%" if ram['total'] > 0 else ''
        # Only append when there is a textual last output to append to; an
        # empty result or a non-string last element is returned untouched.
        if isinstance(res, list) and res and isinstance(res[-1], str):
            res[-1] += f"\n\nTime: {elapsed_text} | {summary} {gpu} {cpu}\n\n"
        return tuple(res)

    return f