diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml
new file mode 100644
index 00000000000..bdac41941cb
--- /dev/null
+++ b/.github/workflows/build.yaml
@@ -0,0 +1,58 @@
+# Builds the sd-web-ui image and pushes it to GHCR when a pull request gets the
+# `release` label, unless the pull request also carries `skip-cancel`.
+name: Deploy Images to GHCR
+
+on:
+  pull_request:
+    types: [labeled]
+
+jobs:
+  cancel_outstanding:
+    name: Detect and cancel outstanding runs of this workflow
+    runs-on: ubuntu-latest
+    timeout-minutes: 10
+    steps:
+      - name: Cancel Previous Runs
+        if: ${{ (github.event.label.name == 'release') && !contains(github.event.pull_request.labels.*.name, 'skip-cancel') }}
+        uses: styfle/cancel-workflow-action@0.11.0
+        with:
+          access_token: ${{ secrets.GITHUB_TOKEN }}
+
+  push-store-image:
+    # Least privilege: read the repository, write packages to GHCR.
+    permissions:
+      contents: read
+      packages: write
+    runs-on: ubuntu-latest
+    if: ${{ (github.event.label.name == 'release') && !contains(github.event.pull_request.labels.*.name, 'skip-cancel') }}
+    steps:
+      - name: Checkout GitHub Action
+        uses: actions/checkout@v4
+
+      - name: envvars
+        run: |
+          echo "RELEASE=$(cat build/vars/BUILD_TAG)" >> "$GITHUB_ENV"
+          echo "REGISTRY=$(cat build/vars/REGISTRY)" >> "$GITHUB_ENV"
+
+      - name: Login to GitHub Container Registry
+        uses: docker/login-action@v2
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: free space
+        run: |
+          bash .github/workflows/freespace.sh
+
+      # https://github.com/orgs/community/discussions/25678
+      - name: free up space
+        run: |
+          rm -rf /opt/hostedtoolcache
+
+      - name: Build sd-web-ui image
+        working-directory: build
+        run: |
+          # RELEASE and REGISTRY are already in the environment (written to
+          # GITHUB_ENV by the envvars step); docker-bake.hcl reads them from there.
+          docker buildx bake sd-web-ui -f docker-bake.hcl --push
diff --git a/.gitignore b/.gitignore
index 09734267ff5..2ed62f7e797 100644
--- a/.gitignore
+++ b/.gitignore
@@ -37,3 +37,7 @@ notification.mp3
 /node_modules
 /package-lock.json
 /.coverage*
+
+sd-data
+modules/api/raypi2.py
+modules/api/raypi3.py
diff --git a/build/docker-bake.hcl b/build/docker-bake.hcl
new file mode 100644
index 00000000000..5646e08e787
--- /dev/null
+++ b/build/docker-bake.hcl
@@ -0,0 +1,25 @@
+# Image tag suffix; CI overrides it with the contents of build/vars/BUILD_TAG.
+variable "RELEASE" {
+  default = "v1.0.0"
+}
+
+# Registry prefix, concatenated directly in front of the image name (so it must end with "/" when set).
+variable "REGISTRY" {
+  default = ""
+}
+
+group "default" {
+  targets = ["sd-web-ui"]
+}
+
+target "sd-web-ui" {
+  dockerfile = "sd.Dockerfile"
+  tags       = ["${REGISTRY}${target.sd-web-ui.name}:${RELEASE}"]
+  context    = "."
+  labels = {
+    "org.opencontainers.image.source" = "https://github.com/webcoderz/stable-diffusion-webui"
+  }
+}
+
+# Preview the resolved build without running it:
+# RELEASE=$(cat build/vars/BUILD_TAG) REGISTRY=$(cat build/vars/REGISTRY) docker buildx bake --print
\ No newline at end of file
diff --git a/build/sd.Dockerfile b/build/sd.Dockerfile
new file mode 100644
index 00000000000..d5183f227a1
--- /dev/null
+++ b/build/sd.Dockerfile
@@ -0,0 +1,53 @@
+# Image that clones stable-diffusion-webui, prepares its Python venv at build
+# time and starts the web UI with the API flag enabled.
+FROM nvidia/cuda:12.2.0-base-ubuntu22.04
+SHELL ["/bin/bash", "-o", "pipefail", "-c"]
+
+# Keep apt from prompting during the build.
+ENV DEBIAN_FRONTEND=noninteractive
+
+# Install and clean up in one layer so the apt caches never land in the image.
+RUN apt-get update -y \
+    && apt-get upgrade -y \
+    && apt-get install -y --no-install-recommends \
+        curl \
+        git \
+        git-lfs \
+        python3.10 \
+        python3.10-venv \
+        python3-pip \
+        libgl1 \
+        libglib2.0-0 \
+    && apt-get clean -y \
+    && rm -rf /var/lib/apt/lists/*
+
+# user and workdir
+RUN useradd -m user \
+    && mkdir /work \
+    && chown -R user:user /work
+USER user
+WORKDIR /work
+
+################################
+# setup
+################################
+
+RUN git clone https://github.com/webcoderz/stable-diffusion-webui.git
+WORKDIR /work/stable-diffusion-webui
+
+# Create the venv and run launch.prepare_environment() inside it at build time.
+RUN python3 -m venv venv \
+    && /work/stable-diffusion-webui/venv/bin/python -c "from launch import *; prepare_environment()" --skip-torch-cuda-test --no-download-sd-model
+
+################################
+# entrypoint
+################################
+
+EXPOSE 7860
+EXPOSE 8000
+EXPOSE 8265
+EXPOSE 6388
+EXPOSE 10001
+
+# Exec form: each flag is its own array element; a single string would reach webui.sh as one argument.
+CMD ["./webui.sh", "--xformers", "--cors-allow-origins=*", "--api"]
\ No newline at end of file
diff --git a/build/vars/BUILD_TAG b/build/vars/BUILD_TAG
new file mode 100644
index 00000000000..95e94cdd37f
--- /dev/null
+++ b/build/vars/BUILD_TAG
@@ -0,0 +1 @@
+v0.0.1
\ No newline at end of file
diff --git a/build/vars/REGISTRY b/build/vars/REGISTRY
new file mode 100644
index 00000000000..bfda55613df
--- /dev/null
+++ b/build/vars/REGISTRY
@@ -0,0 +1 @@
+ghcr.io/webcoderz/stable-diffusion-webui/
\ No newline at end of file
diff --git a/extensions-builtin/LDSR/sd_hijack_ddpm_v1.py b/extensions-builtin/LDSR/sd_hijack_ddpm_v1.py
index 04adc5eb2cf..21e6c61c85c 100644
--- a/extensions-builtin/LDSR/sd_hijack_ddpm_v1.py
+++ b/extensions-builtin/LDSR/sd_hijack_ddpm_v1.py
@@ -14,7 +14,7 @@
 from functools import partial
 from tqdm import tqdm
 from torchvision.utils import make_grid
-from pytorch_lightning.utilities.distributed import rank_zero_only
+from pytorch_lightning.utilities.rank_zero import rank_zero_only
 
 from ldm.util import log_txt_as_img, exists, default, ismap, isimage, mean_flat, count_params, instantiate_from_config
 from ldm.modules.ema import LitEma
diff --git a/extensions-builtin/Lora/networks.py b/extensions-builtin/Lora/networks.py
index 96f935b236f..64c4512386e 100644
--- a/extensions-builtin/Lora/networks.py
+++ b/extensions-builtin/Lora/networks.py
@@ -15,6 +15,7 @@
 from typing import Union
 
 from modules import shared, devices, sd_models, errors, scripts, sd_hijack
+from modules.shared import shared_instance
 
 module_types = [
     network_lora.ModuleTypeLora(),
@@ -112,8 +113,10 @@ def match(match_list, regex_text):
 def assign_network_names_to_compvis_modules(sd_model):
     network_layer_mapping = {}
 
-    if shared.sd_model.is_sdxl:
-        for i, embedder in enumerate(shared.sd_model.conditioner.embedders):
+    #if shared.sd_model.is_sdxl:
+    if shared_instance.sd_model.is_sdxl:
+        #for i, embedder in enumerate(shared.sd_model.conditioner.embedders):
+        for i, embedder in enumerate(shared_instance.sd_model.conditioner.embedders):
             if not hasattr(embedder, 'wrapped'):
                 continue
 
@@ -122,12 +125,14 @@ def assign_network_names_to_compvis_modules(sd_model):
                 network_layer_mapping[network_name] = module
                 module.network_layer_name = network_name
     else:
-        for name, module in shared.sd_model.cond_stage_model.wrapped.named_modules():
+        #for name, module in shared.sd_model.cond_stage_model.wrapped.named_modules():
+        for name, module in shared_instance.sd_model.cond_stage_model.wrapped.named_modules():
             network_name = name.replace(".", "_")
             network_layer_mapping[network_name] = module
             module.network_layer_name = network_name
 
-    for name, module in shared.sd_model.model.named_modules():
+    #for name, module in shared.sd_model.model.named_modules():
+    for name, module in shared_instance.sd_model.model.named_modules():
         network_name = name.replace(".", "_")
         network_layer_mapping[network_name] = module
         module.network_layer_name = network_name
@@ -142,11 +147,14 @@ def load_network(name, network_on_disk):
     sd = sd_models.read_state_dict(network_on_disk.filename)
 
     # this should not be needed but is here as an emergency fix for an unknown error people are experiencing in 1.2.0
-    if not hasattr(shared.sd_model, 'network_layer_mapping'):
-        assign_network_names_to_compvis_modules(shared.sd_model)
+    #if not hasattr(shared.sd_model, 'network_layer_mapping'):
+        #assign_network_names_to_compvis_modules(shared.sd_model)
+    if not hasattr(shared_instance.sd_model, 'network_layer_mapping'):
+        assign_network_names_to_compvis_modules(shared_instance.sd_model)
 
     keys_failed_to_match = {}
-    is_sd2 = 'model_transformer_resblocks' in shared.sd_model.network_layer_mapping
+    #is_sd2 = 'model_transformer_resblocks' in shared.sd_model.network_layer_mapping
+    is_sd2 = 'model_transformer_resblocks' in shared_instance.sd_model.network_layer_mapping
 
     matched_networks = {}
 
@@ -154,25 +162,31 @@ def load_network(name, network_on_disk):
         key_network_without_network_parts, network_part = key_network.split(".", 1)
 
         key = convert_diffusers_name_to_compvis(key_network_without_network_parts, is_sd2)
-        sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+        #sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+        sd_module = shared_instance.sd_model.network_layer_mapping.get(key, None)
 
         if sd_module is None:
             m = re_x_proj.match(key)
             if m:
-                sd_module = shared.sd_model.network_layer_mapping.get(m.group(1), None)
+                #sd_module = shared.sd_model.network_layer_mapping.get(m.group(1), None)
+                sd_module = shared_instance.sd_model.network_layer_mapping.get(m.group(1), None)
+
 
         # SDXL loras seem to already have correct compvis keys, so only need to replace "lora_unet" with "diffusion_model"
         if sd_module is None and "lora_unet" in key_network_without_network_parts:
             key = key_network_without_network_parts.replace("lora_unet", "diffusion_model")
-            sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+            #sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+            sd_module = shared_instance.sd_model.network_layer_mapping.get(key, None)
         elif sd_module is None and "lora_te1_text_model" in key_network_without_network_parts:
             key = key_network_without_network_parts.replace("lora_te1_text_model", "0_transformer_text_model")
-            sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+            #sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+            sd_module = shared_instance.sd_model.network_layer_mapping.get(key, None)
 
             # some SD1 Loras also have correct compvis keys
             if sd_module is None:
                 key = key_network_without_network_parts.replace("lora_te1_text_model", "transformer_text_model")
-                sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+                #sd_module = shared.sd_model.network_layer_mapping.get(key, None)
+                sd_module = shared_instance.sd_model.network_layer_mapping.get(key, None)
 
         if sd_module is None:
             keys_failed_to_match[key_network] = key
diff --git a/extensions-builtin/Lora/ui_extra_networks_lora.py b/extensions-builtin/Lora/ui_extra_networks_lora.py
index 55409a7829d..8bb11a400dd 100644
--- a/extensions-builtin/Lora/ui_extra_networks_lora.py
+++ b/extensions-builtin/Lora/ui_extra_networks_lora.py
@@ -6,7 +6,7 @@
 from modules import shared, ui_extra_networks
 from modules.ui_extra_networks import quote_js
 from ui_edit_user_metadata import LoraUserMetadataEditor
-
+from modules.shared import shared_instance
 
 class ExtraNetworksPageLora(ui_extra_networks.ExtraNetworksPage):
     def __init__(self):
@@ -52,17 +52,26 @@ def create_item(self, name, index=None, enable_filter=True):
 
         if shared.opts.lora_show_all or not enable_filter:
             pass
+#        elif sd_version == network.SdVersion.Unknown:
+#            model_version = network.SdVersion.SDXL if shared.sd_model.is_sdxl else network.SdVersion.SD2 if shared.sd_model.is_sd2 else network.SdVersion.SD1
+#            if model_version.name in shared.opts.lora_hide_unknown_for_versions:
+#                return None
+#        elif shared.sd_model.is_sdxl and sd_version != network.SdVersion.SDXL:
+#            return None
+#        elif shared.sd_model.is_sd2 and sd_version != network.SdVersion.SD2:
+#            return None
+#        elif shared.sd_model.is_sd1 and sd_version != network.SdVersion.SD1:
+#            return None
         elif sd_version == network.SdVersion.Unknown:
-            model_version = network.SdVersion.SDXL if shared.sd_model.is_sdxl else network.SdVersion.SD2 if shared.sd_model.is_sd2 else network.SdVersion.SD1
+            model_version = network.SdVersion.SDXL if shared_instance.sd_model.is_sdxl else network.SdVersion.SD2 if shared_instance.sd_model.is_sd2 else network.SdVersion.SD1
             if model_version.name in shared.opts.lora_hide_unknown_for_versions:
                 return None
-        elif shared.sd_model.is_sdxl and sd_version != network.SdVersion.SDXL:
+        elif shared_instance.sd_model.is_sdxl and sd_version != network.SdVersion.SDXL:
             return None
-        elif shared.sd_model.is_sd2 and sd_version != network.SdVersion.SD2:
+        elif shared_instance.sd_model.is_sd2 and sd_version != network.SdVersion.SD2:
             return None
-        elif shared.sd_model.is_sd1 and sd_version != network.SdVersion.SD1:
+        elif shared_instance.sd_model.is_sd1 and sd_version != network.SdVersion.SD1:
             return None
-
         return item
 
     def list_items(self):
diff --git a/launch.py b/launch.py
index f83820d2534..410dc05ccff 100644
--- a/launch.py
+++ b/launch.py
@@ -24,6 +24,7 @@
 start = launch_utils.start
 
 
+
 def main():
     if args.dump_sysinfo:
         filename = launch_utils.dump_sysinfo()
@@ -43,6 +44,5 @@ def main():
 
     start()
 
-
 if __name__ == "__main__":
     main()
diff --git a/modules/api/api.py b/modules/api/api.py
index e6edffe7144..aeee9d5968c 100644
--- a/modules/api/api.py
+++ b/modules/api/api.py
@@ -33,7 +33,7 @@
 import piexif
 import piexif.helper
 from contextlib import closing
-
+from modules.shared import shared_instance
 
 def script_name_to_index(name, scripts):
     try:
@@ -364,7 +364,8 @@ def text2imgapi(self, txt2imgreq: models.StableDiffusionTxt2ImgProcessingAPI):
         args.pop('save_images', None)
 
         with self.queue_lock:
-            with closing(StableDiffusionProcessingTxt2Img(sd_model=shared.sd_model, **args)) as p:
+            with closing(StableDiffusionProcessingTxt2Img(sd_model=shared_instance.sd_model, **args)) as p:
+            #with closing(StableDiffusionProcessingTxt2Img(sd_model=shared.sd_model, **args)) as p:
                 p.is_api = True
                 p.scripts = script_runner
                 p.outpath_grids = opts.outdir_txt2img_grids
@@ -424,7 +425,8 @@ def img2imgapi(self, img2imgreq: models.StableDiffusionImg2ImgProcessingAPI):
         args.pop('save_images', None)
 
         with self.queue_lock:
-            with closing(StableDiffusionProcessingImg2Img(sd_model=shared.sd_model, **args)) as p:
+            #with closing(StableDiffusionProcessingImg2Img(sd_model=shared.sd_model, **args)) as p:
+            with closing(StableDiffusionProcessingImg2Img(sd_model=shared_instance.sd_model, **args)) as p:
                 p.init_images = [decode_base64_to_image(x) for x in init_images]
                 p.is_api = True
                 p.scripts = script_runner
@@ -724,8 +726,10 @@ def train_hypernetwork(self, args: dict):
             except Exception as e:
                 error = e
             finally:
-                shared.sd_model.cond_stage_model.to(devices.device)
-                shared.sd_model.first_stage_model.to(devices.device)
+                #shared.sd_model.cond_stage_model.to(devices.device)
+                #shared.sd_model.first_stage_model.to(devices.device)
+                shared_instance.sd_model.cond_stage_model.to(devices.device)
+                shared_instance.sd_model.first_stage_model.to(devices.device)
                 if not apply_optimizations:
                     sd_hijack.apply_optimizations()
                 shared.state.end()
@@ -785,4 +789,3 @@ def restart_webui(self):
     def stop_webui(request):
         shared.state.server_command = "stop"
         return Response("Stopping.")
-
diff --git a/modules/api/ray.py b/modules/api/ray.py
new file mode 100644
index 00000000000..ed945b658ef
--- /dev/null
+++ b/modules/api/ray.py
@@ -0,0 +1,49 @@
+from ray import serve
+import ray
+
+from modules.api.raypi import Raypi
+
+import time
+import os
+
+
+#ray.init(os.environ.get("RAY_HEAD_ADDRESS", ""))
+#ray.init("ray://localhost:10001")
+
+
+# Connect to the cluster named by RAY_ADDRESS; call ray.init() without an
+# address when the variable is unset or empty.
+ray_head_address = os.environ.get("RAY_ADDRESS")
+print("RAY_ADDRESS:", ray_head_address)
+
+if not ray_head_address:
+    ray.init()
+else:
+    ray.init(address=ray_head_address)
+
+
+#entrypoint = Raypi.bind()
+
+def ray_only():
+    """Restart Ray Serve, deploy Raypi under /sdapi/v1 and then never return.
+
+    Reads RAY_IP (default "0.0.0.0") and RAY_PORT (default 8000) for the HTTP
+    listener; when RAY_DOCKER is set, Serve is started with detached=True.
+    """
+    serve.shutdown()
+    start_kwargs = {}
+    if "RAY_DOCKER" in os.environ:
+        print("starting ray in docker")
+        start_kwargs["detached"] = True
+    start_kwargs["http_options"] = {
+        "host": os.environ.get("RAY_IP", "0.0.0.0"),
+        "port": int(os.environ.get("RAY_PORT", 8000)),
+    }
+    serve.start(**start_kwargs)
+    print(f"Starting Raypi on port {os.environ.get('RAY_PORT', 8000)}")
+    # route_prefix is passed so the deployment is served under /sdapi/v1.
+    serve.run(Raypi.bind(), port=int(os.environ.get("RAY_PORT", 8000)), route_prefix="/sdapi/v1")
+    print("Done setting up replicas! Now accepting requests...")
+    # Sleep in an endless loop so this function does not return.
+    while True:
+        time.sleep(1000)
\ No newline at end of file
diff --git a/modules/api/raypi.py b/modules/api/raypi.py
new file mode 100644
index 00000000000..3bfa78bbc14
--- /dev/null
+++ b/modules/api/raypi.py
@@ -0,0 +1,811 @@
+import base64
+import io
+import os
+import time
+import datetime
+import uvicorn
+import ipaddress
+import requests
+import gradio as gr
+from threading import Lock
+from io import BytesIO
+from fastapi import APIRouter, Depends, FastAPI, Request, Response
+from fastapi.security import HTTPBasic, HTTPBasicCredentials
+from fastapi.exceptions import HTTPException
+from fastapi.responses import JSONResponse
+from fastapi.encoders import jsonable_encoder
+from secrets import compare_digest
+
+from modules import initialize
+initialize.imports()
+
+import modules.shared as shared
+from modules import sd_samplers, deepbooru, sd_hijack, images, scripts, ui, postprocessing, errors, restart, shared_items
+from modules.api import models
+from modules.shared import opts
+from modules.processing import StableDiffusionProcessingTxt2Img, StableDiffusionProcessingImg2Img, process_images
+from modules.textual_inversion.textual_inversion import create_embedding, train_embedding
+from modules.textual_inversion.preprocess import preprocess
+from modules.hypernetworks.hypernetwork import create_hypernetwork, train_hypernetwork
+from PIL import PngImagePlugin,Image
+from modules.sd_models import unload_model_weights, reload_model_weights, checkpoint_aliases
+from modules.sd_models_config import find_checkpoint_config_near_filename
+from modules.realesrgan_model import get_realesrgan_models
+from modules import devices
+from typing import Dict, List, Any
+import piexif
+import piexif.helper
+from contextlib import closing
+
+from modules import initialize_util
+from modules import script_callbacks
+import os
+from modules.shared import shared_instance
+import launch
+from ray import serve
+
+app = FastAPI()
+
+def script_name_to_index(name, scripts):
+    try:  # case-insensitive title lookup; any failure, including no match, is reported as HTTP 422
+        return [entry.title().lower() for entry in scripts].index(name.lower())
+    except Exception as lookup_error:
+        raise HTTPException(status_code=422, detail=f"Script '{name}' not found") from lookup_error
+
+
+def validate_sampler_name(name):
+    """Return ``name`` unchanged if ``sd_samplers.all_samplers_map`` maps it to a non-None config, else raise HTTP 404."""
+    if sd_samplers.all_samplers_map.get(name, None) is None:
+        raise HTTPException(status_code=404, detail="Sampler not found")
+
+    return name
+
+
+def setUpscalers(req: dict):
+    fields = vars(req)  # live attribute dict of req: the renames below mutate req itself
+    for slot in ("1", "2"):
+        fields[f"extras_upscaler_{slot}"] = fields.pop(f"upscaler_{slot}", None)
+    return fields
+
+
+def verify_url(https://github.com/url):
+    """Return True only if every IPv4 address the URL's host resolves to is global.
+
+    Any parsing or resolution failure yields False.
+    """
+    import socket
+    from urllib.parse import urlparse
+    try:
+        # .hostname drops userinfo and port, which .netloc would pass to the resolver.
+        hostname = urlparse(url).hostname
+        resolved_ips = socket.gethostbyname_ex(hostname)[2]
+        if not all(ipaddress.ip_address(ip).is_global for ip in resolved_ips):
+            return False
+    except Exception:
+        return False
+
+    return True
+
+
+def decode_base64_to_image(encoding):
+    """Open ``encoding`` (an http(s) URL, a ``data:image/`` URI or bare base64) as a PIL image; HTTP 500 if disallowed or unreadable."""
+    if encoding.startswith("http://") or encoding.startswith("https://"):
+        if not opts.api_enable_requests:
+            raise HTTPException(status_code=500, detail="Requests not allowed")
+
+        if opts.api_forbid_local_requests and not verify_url(https://github.com/encoding):
+            raise HTTPException(status_code=500, detail="Request to local resource not allowed")
+
+        headers = {'user-agent': opts.api_useragent} if opts.api_useragent else {}
+        response = requests.get(encoding, timeout=30, headers=headers)
+        try:
+            return Image.open(BytesIO(response.content))
+        except Exception as e:
+            raise HTTPException(status_code=500, detail="Invalid image url") from e
+
+    # For a data URI keep only the payload: the text after the first "," of the second ";"-separated part.
+    if encoding.startswith("data:image/"):
+        encoding = encoding.split(";")[1].split(",")[1]
+    try:
+        return Image.open(BytesIO(base64.b64decode(encoding)))
+    except Exception as e:
+        raise HTTPException(status_code=500, detail="Invalid encoded image") from e
+
+
+def encode_pil_to_base64(image):
+    """Encode ``image`` in the format named by ``opts.samples_format`` and return it as base64 bytes.
+
+    Supported formats are png, jpg/jpeg and webp; anything else raises HTTP 500.
+    """
+    fmt = opts.samples_format.lower()
+    if fmt not in ("png", "jpg", "jpeg", "webp"):
+        raise HTTPException(status_code=500, detail="Invalid image format")
+
+    with io.BytesIO() as buffer:
+        if fmt == "png":
+            # Only str -> str entries of image.info are written as PNG text chunks.
+            text_items = [(key, value) for key, value in image.info.items() if isinstance(key, str) and isinstance(value, str)]
+            pnginfo = PngImagePlugin.PngInfo() if text_items else None
+            for key, value in text_items:
+                pnginfo.add_text(key, value)
+            image.save(buffer, format="PNG", pnginfo=pnginfo, quality=opts.jpeg_quality)
+        else:
+            # RGBA is converted to RGB before the JPEG/WEBP save.
+            if image.mode == "RGBA":
+                image = image.convert("RGB")
+            # image.info['parameters'] (or "" when missing) goes into the EXIF UserComment field.
+            user_comment = piexif.helper.UserComment.dump(image.info.get('parameters', None) or "", encoding="unicode")
+            exif_bytes = piexif.dump({"Exif": {piexif.ExifIFD.UserComment: user_comment}})
+            target_format = "JPEG" if fmt in ("jpg", "jpeg") else "WEBP"
+            image.save(buffer, format=target_format, exif=exif_bytes, quality=opts.jpeg_quality)
+
+        encoded = base64.b64encode(buffer.getvalue())
+
+    return encoded
+
+
+def api_middleware(app: FastAPI):  # installs request timing/logging and JSON error handling on `app`
+    rich_available = False  # set to True only if WEBUI_RICH_EXCEPTIONS is set and the imports below succeed
+    try:
+        if os.environ.get('WEBUI_RICH_EXCEPTIONS', None) is not None:
+            import anyio  # importing just so it can be placed on silent list
+            import starlette  # importing just so it can be placed on silent list
+            from rich.console import Console
+            console = Console()
+            rich_available = True
+    except Exception:
+        pass  # any failure here leaves rich_available False, so errors.report is used below
+    # Middleware: stamp each response with X-Process-Time and, when api_log is on, print /sdapi requests.
+    @app.middleware("http")
+    async def log_and_time(req: Request, call_next):
+        ts = time.time()
+        res: Response = await call_next(req)
+        duration = str(round(time.time() - ts, 4))  # elapsed seconds, rounded to 4 decimal places
+        res.headers["X-Process-Time"] = duration
+        endpoint = req.scope.get('path', 'err')
+        if shared.cmd_opts.api_log and endpoint.startswith('/sdapi'):
+            print('API {t} {code} {prot}/{ver} {method} {endpoint} {cli} {duration}'.format(
+                t=datetime.datetime.now().strftime("%Y-%m-%d %H:%M:%S.%f"),
+                code=res.status_code,
+                ver=req.scope.get('http_version', '0.0'),
+                cli=req.scope.get('client', ('0:0.0.0', 0))[0],
+                prot=req.scope.get('scheme', 'err'),
+                method=req.scope.get('method', 'err'),
+                endpoint=endpoint,
+                duration=duration,
+            ))
+        return res
+    # Shared by the middleware and both exception handlers below: turn an exception into a JSON error response.
+    def handle_exception(request: Request, e: Exception):
+        err = {
+            "error": type(e).__name__,
+            "detail": vars(e).get('detail', ''),
+            "body": vars(e).get('body', ''),
+            "errors": str(e),
+        }
+        if not isinstance(e, HTTPException):  # do not print backtrace on known httpexceptions
+            message = f"API error: {request.method}: {request.url} {err}"
+            if rich_available:
+                print(message)
+                console.print_exception(show_locals=True, max_frames=2, extra_lines=1, suppress=[anyio, starlette], word_wrap=False, width=min([console.width, 200]))
+            else:
+                errors.report(message, exc_info=True)
+        return JSONResponse(status_code=vars(e).get('status_code', 500), content=jsonable_encoder(err))  # 500 unless the exception carries status_code
+    # Middleware: exceptions raised by call_next are converted by handle_exception instead of propagating.
+    @app.middleware("http")
+    async def exception_handling(request: Request, call_next):
+        try:
+            return await call_next(request)
+        except Exception as e:
+            return handle_exception(request, e)
+
+    @app.exception_handler(Exception)
+    async def fastapi_exception_handler(request: Request, e: Exception):
+        return handle_exception(request, e)
+
+    @app.exception_handler(HTTPException)
+    async def http_exception_handler(request: Request, e: HTTPException):
+        return handle_exception(request, e)
+
+
+api_middleware(app)
+
+@serve.deployment(    
+    ray_actor_options={"num_gpus": int(os.environ.get("RAY_NUM_GPUS", 0)),
+                       "num_cpus": int(os.environ.get("RAY_NUM_CPUS", 0))
+                       },
+    autoscaling_config={
+                        "min_replicas": int(os.environ.get("RAY_MIN_REPLICAS", 0)),
+                        "max_replicas": int(os.environ.get("RAY_MAX_REPLICAS", 0))
+                        },
+    #route_prefix="/sdapi/v1"
+    )
+@serve.ingress(app)
+class Raypi:
+    def __init__(self):
+        """Run webui initialization and environment preparation, then parse ``shared.cmd_opts.api_auth`` credentials."""
+        print("Initializing API")
+        initialize.initialize()
+        print("preparing env")
+        launch.prepare_environment()
+
+        # Always defined, so auth() answers 401 instead of raising AttributeError when api_auth is unset.
+        self.credentials = {}
+        if shared.cmd_opts.api_auth:
+            for auth in shared.cmd_opts.api_auth.split(","):
+                # Split on the first ':' only, so a password may itself contain ':'.
+                user, password = auth.split(":", 1)
+                self.credentials[user] = password
+
+        print("API initialized")
+        self.default_script_arg_txt2img = []
+        self.default_script_arg_img2img = []
+
+
+    def auth(self, credentials: HTTPBasicCredentials = Depends(HTTPBasic())):
+        """Return True for a known username with a matching password; otherwise raise HTTP 401."""
+        expected = self.credentials.get(credentials.username)
+        if expected is not None and compare_digest(credentials.password, expected):
+            return True
+        raise HTTPException(status_code=401, detail="Incorrect username or password", headers={"WWW-Authenticate": "Basic"})
+
+    def get_selectable_script(self, script_name, script_runner):
+        """Return ``(script, index)`` for the selectable script titled ``script_name``, or ``(None, None)`` when no name is given."""
+        if script_name is None or script_name == "":
+            return None, None
+
+        position = script_name_to_index(script_name, script_runner.selectable_scripts)
+        return script_runner.selectable_scripts[position], position
+
+    @app.get("/scripts", response_model=models.ScriptsList)
+    def get_scripts_list(self):
+        """Return the names of all txt2img and img2img scripts whose ``name`` is not None."""
+        def named(runner):
+            return [entry.name for entry in runner.scripts if entry.name is not None]
+        return models.ScriptsList(txt2img=named(scripts.scripts_txt2img), img2img=named(scripts.scripts_img2img))
+
+    @app.get("/script-info", response_model=List[models.ScriptInfo])
+    def get_script_info(self):
+        """Collect the non-None ``api_info`` of every txt2img script, followed by every img2img script."""
+        return [
+            entry.api_info
+            for runner in (scripts.scripts_txt2img, scripts.scripts_img2img)
+            for entry in runner.scripts if entry.api_info is not None
+        ]
+
+    def get_script(self, script_name, script_runner):
+        """Return the script in ``script_runner.scripts`` titled ``script_name``, or None when no name is given."""
+        if script_name is None or script_name == "":
+            # A single None rather than a (None, None) pair: init_script_args tests the result with ``is None``.
+            return None
+        return script_runner.scripts[script_name_to_index(script_name, script_runner.scripts)]
+
+    def init_default_script_args(self, script_runner):
+        """Build the default ``script_args`` list for ``script_runner`` from each script's UI values.
+
+        Slot 0 is set to 0 and every other slot starts as None; each script whose ``ui()`` result is
+        truthy then fills ``[args_from:args_to]`` with the ``value`` of each returned element.
+        """
+        # The list must reach the largest args_to of any script and hold at least one slot.
+        slot_count = max([1, *(entry.args_to for entry in script_runner.scripts)])
+        defaults = [None] * slot_count
+        defaults[0] = 0
+
+        # ui() is called inside a gr.Blocks context; per the original note it throws errors otherwise.
+        with gr.Blocks():
+            for entry in script_runner.scripts:
+                if entry.ui(entry.is_img2img):
+                    defaults[entry.args_from:entry.args_to] = [
+                        component.value for component in entry.ui(entry.is_img2img)
+                    ]
+        return defaults
+
+    def init_script_args(self, request, default_script_args, selectable_scripts, selectable_idx, script_runner):
+        """Return a copy of ``default_script_args`` overlaid with the script arguments carried by ``request``."""
+        script_args = default_script_args.copy()
+        # position 0 holds idx+1 of the selectable script to run; request.script_args fill that script's slice
+        if selectable_scripts:
+            script_args[selectable_scripts.args_from:selectable_scripts.args_to] = request.script_args
+            script_args[0] = selectable_idx + 1
+
+        # always-on scripts named in the request get their args overlaid next
+        for alwayson_script_name, payload in (request.alwayson_scripts or {}).items():
+            alwayson_script = self.get_script(alwayson_script_name, script_runner)
+            if alwayson_script is None:
+                raise HTTPException(status_code=422, detail=f"always on script {alwayson_script_name} not found")
+            # a script whose alwayson flag is False is a selectable script and is rejected here
+            if alwayson_script.alwayson is False:
+                raise HTTPException(status_code=422, detail="Cannot have a selectable script in the always on scripts params")
+            # entries without "args" are left at their defaults; otherwise copy at most the slice's length
+            if "args" in payload:
+                supplied = payload["args"]
+                for offset in range(0, min((alwayson_script.args_to - alwayson_script.args_from), len(supplied))):
+                    script_args[alwayson_script.args_from + offset] = supplied[offset]
+        return script_args
+
+    @app.post("/txt2img", response_model=models.TextToImageResponse)
+    def text2imgapi(self, txt2imgreq: models.StableDiffusionTxt2ImgProcessingAPI):
+        """Handle a txt2img request and return the generated images.
+
+        Initializes the txt2img script runner (and the UI) on first use, builds the
+        processing arguments from the request, runs either the selected script or
+        plain ``process_images``, and returns a ``TextToImageResponse``. Images are
+        base64-encoded into the response only when ``send_images`` is truthy.
+        """
+        script_runner = scripts.scripts_txt2img
+        # first call: the runner has no scripts yet, so load them and build the UI
+        if not script_runner.scripts:
+            script_runner.initialize_scripts(False)
+            ui.create_ui()
+        # default script args are computed once and cached on the instance
+        if not self.default_script_arg_txt2img:
+            self.default_script_arg_txt2img = self.init_default_script_args(script_runner)
+        selectable_scripts, selectable_script_idx = self.get_selectable_script(txt2imgreq.script_name, script_runner)
+
+        populate = txt2imgreq.copy(update={  # Override __init__ params
+            "sampler_name": validate_sampler_name(txt2imgreq.sampler_name or txt2imgreq.sampler_index),
+            "do_not_save_samples": not txt2imgreq.save_images,
+            "do_not_save_grid": not txt2imgreq.save_images,
+        })
+        if populate.sampler_name:
+            populate.sampler_index = None  # prevent a warning later on
+
+        # vars() exposes the copy's attribute dict; the pops below strip request-only fields from it
+        args = vars(populate)
+        args.pop('script_name', None)
+        args.pop('script_args', None) # will refeed them to the pipeline directly after initializing them
+        args.pop('alwayson_scripts', None)
+
+        script_args = self.init_script_args(txt2imgreq, self.default_script_arg_txt2img, selectable_scripts, selectable_script_idx, script_runner)
+
+        send_images = args.pop('send_images', True)
+        args.pop('save_images', None)
+
+        # the model comes from shared_instance rather than shared (previous form kept below for reference)
+        with closing(StableDiffusionProcessingTxt2Img(sd_model=shared_instance.sd_model, **args)) as p:          
+        #with closing(StableDiffusionProcessingTxt2Img(sd_model=shared.sd_model, **args)) as p:
+            p.is_api = True
+            p.scripts = script_runner
+            p.outpath_grids = opts.outdir_txt2img_grids
+            p.outpath_samples = opts.outdir_txt2img_samples
+            try:
+                shared.state.begin(job="scripts_txt2img")
+                if selectable_scripts is not None:
+                    p.script_args = script_args
+                    processed = scripts.scripts_txt2img.run(p, *p.script_args) # Need to pass args as list here
+                else:
+                    p.script_args = tuple(script_args) # Need to pass args as tuple here
+                    processed = process_images(p)
+            finally:
+                # always close the job and clear the progress bar, even when processing raised
+                shared.state.end()
+                shared.total_tqdm.clear()
+
+        b64images = list(map(encode_pil_to_base64, processed.images)) if send_images else []
+
+        return models.TextToImageResponse(images=b64images, parameters=vars(txt2imgreq), info=processed.js())
+
+    @app.post("/img2img", response_model=models.ImageToImageResponse)
+    def img2imgapi(self, img2imgreq: models.StableDiffusionImg2ImgProcessingAPI):
+        """Handle an img2img request and return the generated images.
+
+        Requires ``init_images`` on the request (404 otherwise), decodes the optional
+        mask, initializes the img2img script runner (and the UI) on first use, then
+        runs either the selected script or plain ``process_images``. The request's
+        ``init_images`` and ``mask`` are blanked in the echoed parameters unless
+        ``include_init_images`` is set.
+
+        Raises:
+            HTTPException: 404 when ``init_images`` is ``None``.
+        """
+        init_images = img2imgreq.init_images
+        if init_images is None:
+            raise HTTPException(status_code=404, detail="Init image not found")
+
+        mask = img2imgreq.mask
+        if mask:
+            mask = decode_base64_to_image(mask)
+
+        script_runner = scripts.scripts_img2img
+        # first call: the runner has no scripts yet, so load them and build the UI
+        if not script_runner.scripts:
+            script_runner.initialize_scripts(True)
+            ui.create_ui()
+        # default script args are computed once and cached on the instance
+        if not self.default_script_arg_img2img:
+            self.default_script_arg_img2img = self.init_default_script_args(script_runner)
+        selectable_scripts, selectable_script_idx = self.get_selectable_script(img2imgreq.script_name, script_runner)
+
+        populate = img2imgreq.copy(update={  # Override __init__ params
+            "sampler_name": validate_sampler_name(img2imgreq.sampler_name or img2imgreq.sampler_index),
+            "do_not_save_samples": not img2imgreq.save_images,
+            "do_not_save_grid": not img2imgreq.save_images,
+            "mask": mask,
+        })
+        if populate.sampler_name:
+            populate.sampler_index = None  # prevent a warning later on
+
+        # vars() exposes the copy's attribute dict; the pops below strip request-only fields from it
+        args = vars(populate)
+        args.pop('include_init_images', None)  # the model marks this field "exclude": True, yet it still appears here for an undetermined reason, so drop it explicitly
+        args.pop('script_name', None)
+        args.pop('script_args', None)  # will refeed them to the pipeline directly after initializing them
+        args.pop('alwayson_scripts', None)
+
+        script_args = self.init_script_args(img2imgreq, self.default_script_arg_img2img, selectable_scripts, selectable_script_idx, script_runner)
+
+        send_images = args.pop('send_images', True)
+        args.pop('save_images', None)
+
+        # the model comes from shared_instance rather than shared (previous form kept below for reference)
+        with closing(StableDiffusionProcessingImg2Img(sd_model=shared_instance.sd_model, **args)) as p:
+        #with closing(StableDiffusionProcessingImg2Img(sd_model=shared.sd_model, **args)) as p:
+            p.init_images = [decode_base64_to_image(x) for x in init_images]
+            p.is_api = True
+            p.scripts = script_runner
+            p.outpath_grids = opts.outdir_img2img_grids
+            p.outpath_samples = opts.outdir_img2img_samples
+            try:
+                shared.state.begin(job="scripts_img2img")
+                if selectable_scripts is not None:
+                    p.script_args = script_args
+                    processed = scripts.scripts_img2img.run(p, *p.script_args) # Need to pass args as list here
+                else:
+                    p.script_args = tuple(script_args) # Need to pass args as tuple here
+                    processed = process_images(p)
+            finally:
+                # always close the job and clear the progress bar, even when processing raised
+                shared.state.end()
+                shared.total_tqdm.clear()
+
+        b64images = list(map(encode_pil_to_base64, processed.images)) if send_images else []
+
+        # keep the (potentially large) inputs out of the echoed parameters unless asked for
+        if not img2imgreq.include_init_images:
+            img2imgreq.init_images = None
+            img2imgreq.mask = None
+
+        return models.ImageToImageResponse(images=b64images, parameters=vars(img2imgreq), info=processed.js())
+
+    @app.post("/extra-single-image",response_model=models.ExtrasSingleImageResponse)
+    def extras_single_image_api(self, req: models.ExtrasSingleImageRequest):
+        """Run the extras pipeline on one base64-encoded image.
+
+        The request is turned into keyword arguments by ``setUpscalers``, its
+        ``image`` entry is decoded, and ``postprocessing.run_extras`` is called in
+        mode 0 without saving output. The first result image is returned
+        base64-encoded together with the HTML info.
+        """
+        extras_kwargs = setUpscalers(req)
+        extras_kwargs['image'] = decode_base64_to_image(extras_kwargs['image'])
+
+        outcome = postprocessing.run_extras(
+            extras_mode=0,
+            image_folder="",
+            input_dir="",
+            output_dir="",
+            save_output=False,
+            **extras_kwargs,
+        )
+        encoded_image = encode_pil_to_base64(outcome[0][0])
+        return models.ExtrasSingleImageResponse(image=encoded_image, html_info=outcome[1])
+
+    @app.post("/extra-batch-images",response_model=models.ExtrasBatchImagesResponse)
+    def extras_batch_images_api(self, req: models.ExtrasBatchImagesRequest):
+        """Run the extras pipeline on a batch of base64-encoded images.
+
+        ``imageList`` is removed from the keyword arguments produced by
+        ``setUpscalers`` and each entry's ``data`` is decoded; the decoded images
+        are passed to ``postprocessing.run_extras`` in mode 1 without saving
+        output. All result images are returned base64-encoded with the HTML info.
+        """
+        extras_kwargs = setUpscalers(req)
+
+        decoded_images = []
+        for entry in extras_kwargs.pop('imageList', []):
+            decoded_images.append(decode_base64_to_image(entry.data))
+
+        outcome = postprocessing.run_extras(
+            extras_mode=1,
+            image_folder=decoded_images,
+            image="",
+            input_dir="",
+            output_dir="",
+            save_output=False,
+            **extras_kwargs,
+        )
+        encoded_images = [encode_pil_to_base64(picture) for picture in outcome[0]]
+        return models.ExtrasBatchImagesResponse(images=encoded_images, html_info=outcome[1])
+
+    @app.post("/png-info",response_model=models.PNGInfoResponse)
+    def pnginfoapi(self, req: models.PNGInfoRequest):
+        """Extract generation info from a base64-encoded image.
+
+        Returns an empty ``info`` when the payload is blank or cannot be decoded
+        to an image. Otherwise returns the generation info and the image's items,
+        with the generation info also stored under the ``parameters`` key.
+        """
+        payload = req.image.strip()
+        if not payload:
+            return models.PNGInfoResponse(info="")
+
+        image = decode_base64_to_image(payload)
+        if image is None:
+            return models.PNGInfoResponse(info="")
+
+        geninfo, items = images.read_info_from_image(image)
+        geninfo = "" if geninfo is None else geninfo
+
+        # 'parameters' goes first; an existing entry in items with the same key overrides it
+        merged_items = {'parameters': geninfo, **items}
+        return models.PNGInfoResponse(info=geninfo, items=merged_items)
+
+    @app.get("/progress",response_model=models.ProgressResponse)
+    def progressapi(self, req: models.ProgressRequest = Depends()):
+        """Report progress of the current job.
+
+        Returns zero progress when no jobs are queued. Otherwise combines the
+        finished-job fraction with the current job's sampling-step fraction,
+        derives a relative ETA from the elapsed time, and attaches the current
+        preview image unless the request asked to skip it.
+        """
+        # mirrors check_progress_call of ui.py
+        if shared.state.job_count == 0:
+            return models.ProgressResponse(progress=0, eta_relative=0, state=shared.state.dict(), textinfo=shared.state.textinfo)
+
+        # start just above zero so the ETA division below cannot divide by zero
+        fraction = 0.01
+        if shared.state.job_count > 0:
+            fraction += shared.state.job_no / shared.state.job_count
+        if shared.state.sampling_steps > 0:
+            fraction += 1 / shared.state.job_count * shared.state.sampling_step / shared.state.sampling_steps
+
+        elapsed = time.time() - shared.state.time_start
+        projected_total = (elapsed/fraction)
+        eta_relative = projected_total-elapsed
+
+        # clamp only after the ETA has been computed from the raw value
+        fraction = min(fraction, 1)
+
+        shared.state.set_current_image()
+
+        if shared.state.current_image and not req.skip_current_image:
+            preview = encode_pil_to_base64(shared.state.current_image)
+        else:
+            preview = None
+
+        return models.ProgressResponse(progress=fraction, eta_relative=eta_relative, state=shared.state.dict(), current_image=preview, textinfo=shared.state.textinfo)
+
+    @app.post("/interrogate")
+    def interrogateapi(self, interrogatereq: models.InterrogateRequest):
+        """Caption a base64-encoded image with the requested interrogation model.
+
+        Supports the ``clip`` and ``deepdanbooru`` models.
+
+        Raises:
+            HTTPException: 404 when the image is missing or the model name is
+                not one of the supported values.
+        """
+        encoded = interrogatereq.image
+        if encoded is None:
+            raise HTTPException(status_code=404, detail="Image not found")
+
+        rgb_image = decode_base64_to_image(encoded).convert('RGB')
+
+        # dispatch on the requested model name
+        model_name = interrogatereq.model
+        if model_name == "clip":
+            caption = shared.interrogator.interrogate(rgb_image)
+        elif model_name == "deepdanbooru":
+            caption = deepbooru.model.tag(rgb_image)
+        else:
+            raise HTTPException(status_code=404, detail="Model not found")
+
+        return models.InterrogateResponse(caption=caption)
+
+    @app.post("/interrupt")
+    def interruptapi(self):
+        """Call ``shared.state.interrupt()`` and reply with an empty JSON object."""
+        shared.state.interrupt()
+
+        return {}
+
+    @app.post("/unload-checkpoint")
+    def unloadapi(self):
+        """Call ``unload_model_weights()`` and reply with an empty JSON object."""
+        unload_model_weights()
+
+        return {}
+
+    @app.post("/reload-checkpoint")
+    def reloadapi(self):
+        """Call ``reload_model_weights()`` and reply with an empty JSON object."""
+        reload_model_weights()
+
+        return {}
+
+    @app.post("/skip")
+    def skip(self):
+        """Call ``shared.state.skip()``; nothing is returned."""
+        shared.state.skip()
+
+    @app.get("/options",response_model=models.OptionsModel)
+    def get_config(self):
+        """Return the current option values keyed by option name.
+
+        For every key in ``shared.opts.data`` the stored value is used; the
+        fallback is the label's default when the option has label metadata and
+        ``None`` otherwise.
+        """
+        current_values = {}
+        for option_name in shared.opts.data.keys():
+            label = shared.opts.data_labels.get(option_name)
+            fallback = label.default if label is not None else None
+            current_values[option_name] = shared.opts.data.get(option_name, fallback)
+
+        return current_values
+
+    @app.post("/options")
+    def set_config(self, req: Dict[str, Any]):
+        """Apply the given option values and persist them to the config file.
+
+        Raises:
+            RuntimeError: when ``sd_model_checkpoint`` is supplied but is not a
+                known checkpoint alias.
+        """
+        requested_checkpoint = req.get("sd_model_checkpoint", None)
+        checkpoint_is_unknown = requested_checkpoint is not None and requested_checkpoint not in checkpoint_aliases
+        if checkpoint_is_unknown:
+            raise RuntimeError(f"model {requested_checkpoint!r} not found")
+
+        for option_name, option_value in req.items():
+            shared.opts.set(option_name, option_value, is_api=True)
+
+        shared.opts.save(shared.config_filename)
+        return
+
+    @app.get("/cmd-flags", response_model=models.FlagsModel)
+    def get_cmd_flags(self):
+        """Return the attributes of ``shared.cmd_opts`` as a dict."""
+        return vars(shared.cmd_opts)
+
+    @app.get("/samplers", response_model=List[models.SamplerItem])
+    def get_samplers(self):
+        """List each entry of ``sd_samplers.all_samplers`` as a name/aliases/options dict."""
+        sampler_items = []
+        for entry in sd_samplers.all_samplers:
+            # positions 0, 2 and 3 of each entry hold the name, aliases and options
+            sampler_items.append({"name": entry[0], "aliases": entry[2], "options": entry[3]})
+        return sampler_items
+
+    @app.get("/upscalers",response_model=List[models.UpscalerItem])
+    def get_upscalers(self):
+        """Describe every upscaler in ``shared.sd_upscalers``; ``model_url`` is always ``None``."""
+        described = []
+        for candidate in shared.sd_upscalers:
+            described.append({
+                "name": candidate.name,
+                "model_name": candidate.scaler.model_name,
+                "model_path": candidate.data_path,
+                "model_url": None,
+                "scale": candidate.scale,
+            })
+        return described
+
+    @app.get("/latent-upscale-modes",response_model=List[models.LatentUpscalerModeItem])
+    def get_latent_upscale_modes(self):
+        """List the names in ``shared.latent_upscale_modes`` (empty list when it is falsy)."""
+        mode_names = list(shared.latent_upscale_modes or {})
+        return [{"name": mode_name} for mode_name in mode_names]
+
+    @app.get("/sd-models", response_model=List[models.SDModelItem])
+    def get_sd_models(self):
+        """Describe every checkpoint in ``sd_models.checkpoints_list``."""
+        import modules.sd_models as sd_models
+
+        described = []
+        for checkpoint in sd_models.checkpoints_list.values():
+            described.append({
+                "title": checkpoint.title,
+                "model_name": checkpoint.model_name,
+                "hash": checkpoint.shorthash,
+                "sha256": checkpoint.sha256,
+                "filename": checkpoint.filename,
+                "config": find_checkpoint_config_near_filename(checkpoint),
+            })
+        return described
+
+    @app.get("/sd-vae", response_model=List[models.SDVaeItem])
+    def get_sd_vaes(self):
+        """List each entry of ``sd_vae.vae_dict`` as a model_name/filename dict."""
+        import modules.sd_vae as sd_vae
+
+        return [
+            {"model_name": vae_name, "filename": vae_file}
+            for vae_name, vae_file in sd_vae.vae_dict.items()
+        ]
+
+    @app.get("/hypernetworks", response_model=List[models.HypernetworkItem])
+    def get_hypernetworks(self):
+        """List each entry of ``shared.hypernetworks`` as a name/path dict."""
+        return [
+            {"name": network_name, "path": network_path}
+            for network_name, network_path in shared.hypernetworks.items()
+        ]
+
+    @app.get("/face-restorers", response_model=List[models.FaceRestorerItem])
+    def get_face_restorers(self):
+        """List the face restorers in ``shared.face_restorers``.
+
+        ``cmd_dir`` is ``None`` for restorers that do not define that attribute.
+        """
+        described = []
+        for restorer in shared.face_restorers:
+            described.append({"name": restorer.name(), "cmd_dir": getattr(restorer, "cmd_dir", None)})
+        return described
+
+    @app.get("/realesrgan-models",response_model=List[models.RealesrganItem])
+    def get_realesrgan_models(self):
+        """List the models returned by the module-level ``get_realesrgan_models(None)``."""
+        # inside the method body this name resolves to the module-level function, not this method
+        described = []
+        for entry in get_realesrgan_models(None):
+            described.append({"name": entry.name, "path": entry.data_path, "scale": entry.scale})
+        return described
+
+    @app.get("/prompt-styles", response_model=List[models.PromptStyleItem])
+    def get_prompt_styles(self):
+        """List every style in ``shared.prompt_styles.styles``.
+
+        Positions 0, 1 and 2 of each style hold its name, prompt and negative prompt.
+        """
+        return [
+            {"name": entry[0], "prompt": entry[1], "negative_prompt": entry[2]}
+            for entry in shared.prompt_styles.styles.values()
+        ]
+
+    @app.get("/embeddings", response_model=models.EmbeddingsResponse)
+    def get_embeddings(self):
+        """Describe the loaded and skipped embeddings of the embedding database."""
+        database = sd_hijack.model_hijack.embedding_db
+
+        def describe(item):
+            # per-embedding summary returned to the client
+            return {
+                "step": item.step,
+                "sd_checkpoint": item.sd_checkpoint,
+                "sd_checkpoint_name": item.sd_checkpoint_name,
+                "shape": item.shape,
+                "vectors": item.vectors,
+            }
+
+        def describe_all(collection):
+            # key the result by each embedding's own name
+            summary = {}
+            for item in collection.values():
+                summary[item.name] = describe(item)
+            return summary
+
+        loaded = describe_all(database.word_embeddings)
+        skipped = describe_all(database.skipped_embeddings)
+        return {"loaded": loaded, "skipped": skipped}
+
+    @app.post("/refresh-checkpoints")
+    def refresh_checkpoints(self):
+        """Call ``shared.refresh_checkpoints()``; nothing is returned."""
+        shared.refresh_checkpoints()
+
+    @app.post("/refresh-vae")
+    def refresh_vae(self):
+        """Call ``shared_items.refresh_vae_list()``; nothing is returned."""
+        shared_items.refresh_vae_list()
+
+    @app.post("/create/embedding", response_model=models.CreateResponse)
+    def create_embedding(self, args: dict):
+        """Create an empty embedding and reload the embedding database.
+
+        ``args`` is forwarded as keyword arguments to the module-level
+        ``create_embedding``. Both the success and the error path return a
+        ``CreateResponse``, matching the route's declared ``response_model``.
+        An ``AssertionError`` from creation is reported in ``info``; any other
+        exception propagates. The job state is always ended.
+        """
+        try:
+            shared.state.begin(job="create_embedding")
+            filename = create_embedding(**args) # create empty embedding
+            sd_hijack.model_hijack.embedding_db.load_textual_inversion_embeddings() # reload embeddings so new one can be immediately used
+            return models.CreateResponse(info=f"create embedding filename: {filename}")
+        except AssertionError as e:
+            # use the declared response model (was TrainResponse) so both paths agree
+            return models.CreateResponse(info=f"create embedding error: {e}")
+        finally:
+            shared.state.end()
+
+    @app.post("/create/hypernetwork", response_model=models.CreateResponse)
+    def create_hypernetwork(self, args: dict):
+        """Create an empty hypernetwork.
+
+        ``args`` is forwarded as keyword arguments to the module-level
+        ``create_hypernetwork``. Both the success and the error path return a
+        ``CreateResponse``, matching the route's declared ``response_model``.
+        An ``AssertionError`` from creation is reported in ``info``; any other
+        exception propagates. The job state is always ended.
+        """
+        try:
+            shared.state.begin(job="create_hypernetwork")
+            filename = create_hypernetwork(**args) # create empty hypernetwork
+            return models.CreateResponse(info=f"create hypernetwork filename: {filename}")
+        except AssertionError as e:
+            # use the declared response model (was TrainResponse) so both paths agree
+            return models.CreateResponse(info=f"create hypernetwork error: {e}")
+        finally:
+            shared.state.end()
+
+    @app.post("/preprocess", response_model=models.PreprocessResponse)
+    def preprocess(self, args: dict):
+        """Run dataset preprocessing with the given keyword arguments.
+
+        ``args`` is forwarded to the module-level ``preprocess``. Failures are
+        reported in the response's ``info`` instead of being raised; a
+        ``KeyError`` is reported as an invalid token. The job state is ended
+        exactly once, in ``finally``, on every path.
+        """
+        try:
+            shared.state.begin(job="preprocess")
+            preprocess(**args) # quick operation unless blip/booru interrogation is enabled
+            # no explicit state.end() here: the finally clause below already ends the job
+            return models.PreprocessResponse(info='preprocess complete')
+        except KeyError as e:
+            return models.PreprocessResponse(info=f"preprocess error: invalid token: {e}")
+        except Exception as e:
+            return models.PreprocessResponse(info=f"preprocess error: {e}")
+        finally:
+            shared.state.end()
+
+    @app.post("/train/embedding", response_model=models.TrainResponse)
+    def train_embedding(self, args: dict):
+        """Train an embedding with the given keyword arguments.
+
+        ``args`` is forwarded to the module-level ``train_embedding``. When the
+        ``training_xattention_optimizations`` option is off, optimizations are
+        undone before training and re-applied afterwards. A training exception
+        is captured and reported in the response's ``info`` rather than raised.
+        The job state is always ended.
+        """
+        try:
+            shared.state.begin(job="train_embedding")
+            keep_optimizations = shared.opts.training_xattention_optimizations
+            failure = None
+            filename = ''
+            if not keep_optimizations:
+                sd_hijack.undo_optimizations()
+            try:
+                # only the filename of the returned pair is reported back
+                _, filename = train_embedding(**args) # can take a long time to complete
+            except Exception as caught:
+                failure = caught
+            finally:
+                # restore optimizations whether or not training succeeded
+                if not keep_optimizations:
+                    sd_hijack.apply_optimizations()
+            return models.TrainResponse(info=f"train embedding complete: filename: {filename} error: {failure}")
+        except Exception as msg:
+            return models.TrainResponse(info=f"train embedding error: {msg}")
+        finally:
+            shared.state.end()
+
+    @app.post("/train/hypernetwork", response_model=models.TrainResponse)
+    def train_hypernetwork(self, args: dict):
+        """Train a hypernetwork with the given keyword arguments.
+
+        ``args`` is forwarded to the module-level ``train_hypernetwork``. Loaded
+        hypernetworks are cleared first. When the
+        ``training_xattention_optimizations`` option is off, optimizations are
+        undone before training and re-applied afterwards. After training, the
+        model's cond-stage and first-stage sub-models are moved back to
+        ``devices.device``. A training exception is captured and reported in the
+        response's ``info`` rather than raised. The job state is ended exactly
+        once, in the outer ``finally``.
+        """
+        try:
+            shared.state.begin(job="train_hypernetwork")
+            shared.loaded_hypernetworks = []
+            apply_optimizations = shared.opts.training_xattention_optimizations
+            error = None
+            filename = ''
+            if not apply_optimizations:
+                sd_hijack.undo_optimizations()
+            try:
+                # only the filename of the returned pair is reported back
+                _, filename = train_hypernetwork(**args)
+            except Exception as e:
+                error = e
+            finally:
+                # the model is read from shared_instance (not shared) in this API
+                shared_instance.sd_model.cond_stage_model.to(devices.device)
+                shared_instance.sd_model.first_stage_model.to(devices.device)
+                if not apply_optimizations:
+                    sd_hijack.apply_optimizations()
+                # no state.end() here: the outer finally ends the job
+            return models.TrainResponse(info=f"train hypernetwork complete: filename: {filename} error: {error}")
+        except Exception as exc:
+            return models.TrainResponse(info=f"train hypernetwork error: {exc}")
+        finally:
+            shared.state.end()
+
+    @app.get("/memory", response_model=models.MemoryResponse)
+    def get_memory(self):
+        """Report process RAM usage and CUDA memory statistics.
+
+        The RAM and CUDA sections are gathered independently; if gathering one
+        raises, that section becomes ``{'error': <message>}``. The CUDA section
+        is ``{'error': 'unavailable'}`` when ``torch.cuda.is_available()`` is false.
+        """
+        try:
+            import os
+            import psutil
+            process = psutil.Process(os.getpid())
+            res = process.memory_info() # only rss is cross-platform guaranteed so we dont rely on other values
+            ram_total = 100 * res.rss / process.memory_percent() # and total memory is calculated as actual value is not cross-platform safe
+            ram = { 'free': ram_total - res.rss, 'used': res.rss, 'total': ram_total }
+        except Exception as err:
+            ram = { 'error': f'{err}' }
+        try:
+            import torch
+            if torch.cuda.is_available():
+                # s[0] is treated as free and s[1] as total device memory
+                s = torch.cuda.mem_get_info()
+                system = { 'free': s[0], 'used': s[1] - s[0], 'total': s[1] }
+                # s is rebound to the allocator statistics for shared.device
+                s = dict(torch.cuda.memory_stats(shared.device))
+                allocated = { 'current': s['allocated_bytes.all.current'], 'peak': s['allocated_bytes.all.peak'] }
+                reserved = { 'current': s['reserved_bytes.all.current'], 'peak': s['reserved_bytes.all.peak'] }
+                active = { 'current': s['active_bytes.all.current'], 'peak': s['active_bytes.all.peak'] }
+                inactive = { 'current': s['inactive_split_bytes.all.current'], 'peak': s['inactive_split_bytes.all.peak'] }
+                warnings = { 'retries': s['num_alloc_retries'], 'oom': s['num_ooms'] }
+                cuda = {
+                    'system': system,
+                    'active': active,
+                    'allocated': allocated,
+                    'reserved': reserved,
+                    'inactive': inactive,
+                    'events': warnings,
+                }
+            else:
+                cuda = {'error': 'unavailable'}
+        except Exception as err:
+            cuda = {'error': f'{err}'}
+        return models.MemoryResponse(ram=ram, cuda=cuda)
+
+    def launch(self, server_name, port, root_path):
+        """Attach ``self.router`` to ``self.app`` and serve the app with uvicorn.
+
+        ``server_name`` is used as the host; the keep-alive timeout comes from
+        ``shared.cmd_opts.timeout_keep_alive``.
+        """
+        self.app.include_router(self.router)
+        uvicorn.run(self.app, host=server_name, port=port, timeout_keep_alive=shared.cmd_opts.timeout_keep_alive, root_path=root_path)
+
+    @app.post("/server-kill")
+    def kill_webui(self):
+        """Call ``restart.stop_program()``."""
+        restart.stop_program()
+
+    @app.post("/server-restart")
+    def restart_webui(self):
+        """Restart the program when ``restart.is_restartable()`` allows it.
+
+        Responds with HTTP 501 when a restart is not possible.
+        """
+        if restart.is_restartable():
+            restart.restart_program()
+        # NOTE(review): also reached if restart_program() returns — presumably it does not; confirm
+        return Response(status_code=501)
+
+    @app.post("/server-stop")
+    def stop_webui(self):
+        """Set ``shared.state.server_command`` to ``"stop"`` and acknowledge the request.
+
+        The first parameter receives the instance (it was previously named
+        ``request``, which misleadingly suggested an HTTP request object); it is
+        not used by the body.
+        """
+        shared.state.server_command = "stop"
+        return Response("Stopping.")
+
+
+# Module-level handle created by Raypi.bind().
+# NOTE(review): presumably the Ray Serve application entrypoint referenced by the deployment config — confirm.
+entrypoint = Raypi.bind()
\ No newline at end of file
diff --git a/modules/cmd_args.py b/modules/cmd_args.py
index aab62286e24..8168fa4765b 100644
--- a/modules/cmd_args.py
+++ b/modules/cmd_args.py
@@ -117,3 +117,26 @@
 parser.add_argument('--timeout-keep-alive', type=int, default=30, help='set timeout_keep_alive for uvicorn')
 parser.add_argument("--disable-all-extensions", action='store_true', help="prevent all extensions from running regardless of any other settings", default=False)
 parser.add_argument("--disable-extra-extensions", action='store_true', help=" prevent all extensions except built-in from running regardless of any other settings", default=False)
+parser.add_argument("--ray", action='store_true', help="use api=True to launch the ray API instead of the webui")
+
+
+# Dummy flags that may be passed in by the Ray server; they are declared here so argument parsing accepts them.
+# This works around a limitation in Ray and is expected to become unnecessary in a future Ray version.
+parser.add_argument("--node-ip-address", type=str, default="")
+parser.add_argument("--node-manager-port", type=str, default="")
+parser.add_argument("--object-store-name", type=str, default="")
+parser.add_argument("--raylet-name", type=str, default="")
+parser.add_argument("--redis-address", type=str, default="")
+parser.add_argument("--temp-dir", type=str, default="")
+parser.add_argument("--metrics-agent-port", type=str, default="")
+#parser.add_argument("--runtime-env-agent-port", type=str, default="")
+parser.add_argument("--logging-rotate-bytes", type=str, default="")
+parser.add_argument("--logging-rotate-backup-count", type=str, default="")
+parser.add_argument("--runtime-env-agent-port", type=str, default="")
+parser.add_argument("--gcs-address", type=str, default="")
+parser.add_argument("--session-name", type=str, default="")
+#parser.add_argument("--temp-dir", type=str, default="")
+parser.add_argument("--webui", type=str, default="")
+parser.add_argument("--cluster-id", type=str, default="")
+parser.add_argument("--startup-token", type=str, default="")
+parser.add_argument("--worker-launch-time-ms", type=str, default="")
\ No newline at end of file
diff --git a/modules/hypernetworks/hypernetwork.py b/modules/hypernetworks/hypernetwork.py
index 70f1cbd26b6..f4876ab1e61 100644
--- a/modules/hypernetworks/hypernetwork.py
+++ b/modules/hypernetworks/hypernetwork.py
@@ -18,7 +18,7 @@
 
 from collections import deque
 from statistics import stdev, mean
-
+from modules.shared import shared_instance
 
 optimizer_dict = {optim_name : cls_obj for optim_name, cls_obj in inspect.getmembers(torch.optim, inspect.isclass) if optim_name != "Optimizer"}
 
@@ -525,7 +525,8 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
 
     pin_memory = shared.opts.pin_memory
 
-    ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=hypernetwork_name, model=shared.sd_model, cond_model=shared.sd_model.cond_stage_model, device=devices.device, template_file=template_file, include_cond=True, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
+    #ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=hypernetwork_name, model=shared.sd_model, cond_model=shared.sd_model.cond_stage_model, device=devices.device, template_file=template_file, include_cond=True, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
+    ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=hypernetwork_name, model=shared_instance.sd_model, cond_model=shared_instance.sd_model.cond_stage_model, device=devices.device, template_file=template_file, include_cond=True, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
 
     if shared.opts.save_training_settings_to_txt:
         saved_params = dict(
@@ -542,8 +543,10 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
 
     if unload:
         shared.parallel_processing_allowed = False
-        shared.sd_model.cond_stage_model.to(devices.cpu)
-        shared.sd_model.first_stage_model.to(devices.cpu)
+        #shared.sd_model.cond_stage_model.to(devices.cpu)
+        #shared.sd_model.first_stage_model.to(devices.cpu)
+        shared_instance.sd_model.cond_stage_model.to(devices.cpu)
+        shared_instance.sd_model.first_stage_model.to(devices.cpu)
 
     weights = hypernetwork.weights()
     hypernetwork.train()
@@ -614,16 +617,21 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
                     if use_weight:
                         w = batch.weight.to(devices.device, non_blocking=pin_memory)
                     if tag_drop_out != 0 or shuffle_tags:
-                        shared.sd_model.cond_stage_model.to(devices.device)
-                        c = shared.sd_model.cond_stage_model(batch.cond_text).to(devices.device, non_blocking=pin_memory)
-                        shared.sd_model.cond_stage_model.to(devices.cpu)
+                        #shared.sd_model.cond_stage_model.to(devices.device)
+                        shared_instance.sd_model.cond_stage_model.to(devices.device)
+                        c = shared_instance.sd_model.cond_stage_model(batch.cond_text).to(devices.device, non_blocking=pin_memory)
+                        shared_instance.sd_model.cond_stage_model.to(devices.cpu)
+                        #c = shared.sd_model.cond_stage_model(batch.cond_text).to(devices.device, non_blocking=pin_memory)
+                        #shared.sd_model.cond_stage_model.to(devices.cpu)
                     else:
                         c = stack_conds(batch.cond).to(devices.device, non_blocking=pin_memory)
                     if use_weight:
-                        loss = shared.sd_model.weighted_forward(x, c, w)[0] / gradient_step
+                        loss = shared_instance.sd_model.weighted_forward(x, c, w)[0] / gradient_step
+                        #loss = shared.sd_model.weighted_forward(x, c, w)[0] / gradient_step
                         del w
                     else:
-                        loss = shared.sd_model.forward(x, c)[0] / gradient_step
+                        #loss = shared.sd_model.forward(x, c)[0] / gradient_step
+                        loss = shared_instance.sd_model.forward(x, c)[0] / gradient_step
                     del x
                     del c
 
@@ -683,11 +691,14 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
                     cuda_rng_state = None
                     if torch.cuda.is_available():
                         cuda_rng_state = torch.cuda.get_rng_state_all()
-                    shared.sd_model.cond_stage_model.to(devices.device)
-                    shared.sd_model.first_stage_model.to(devices.device)
+                    #shared.sd_model.cond_stage_model.to(devices.device)
+                    #shared.sd_model.first_stage_model.to(devices.device)
+                    shared_instance.sd_model.cond_stage_model.to(devices.device)
+                    shared_instance.sd_model.first_stage_model.to(devices.device)
 
                     p = processing.StableDiffusionProcessingTxt2Img(
-                        sd_model=shared.sd_model,
+                        #sd_model=shared.sd_model,
+                        sd_model=shared_instance.sd_model,
                         do_not_save_grid=True,
                         do_not_save_samples=True,
                     )
@@ -716,8 +727,10 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
                         image = processed.images[0] if len(processed.images) > 0 else None
 
                     if unload:
-                        shared.sd_model.cond_stage_model.to(devices.cpu)
-                        shared.sd_model.first_stage_model.to(devices.cpu)
+                        #shared.sd_model.cond_stage_model.to(devices.cpu)
+                        #shared.sd_model.first_stage_model.to(devices.cpu)
+                        shared_instance.sd_model.cond_stage_model.to(devices.cpu)
+                        shared_instance.sd_model.first_stage_model.to(devices.cpu)
                     torch.set_rng_state(rng_state)
                     if torch.cuda.is_available():
                         torch.cuda.set_rng_state_all(cuda_rng_state)
@@ -760,8 +773,10 @@ def train_hypernetwork(id_task, hypernetwork_name, learn_rate, batch_size, gradi
 
     del optimizer
     hypernetwork.optimizer_state_dict = None  # dereference it after saving, to save memory.
-    shared.sd_model.cond_stage_model.to(devices.device)
-    shared.sd_model.first_stage_model.to(devices.device)
+    #shared.sd_model.cond_stage_model.to(devices.device)
+    #shared.sd_model.first_stage_model.to(devices.device)
+    shared_instance.sd_model.cond_stage_model.to(devices.device)
+    shared_instance.sd_model.first_stage_model.to(devices.device)
     shared.parallel_processing_allowed = old_parallel_processing_allowed
 
     return hypernetwork, filename
diff --git a/modules/hypernetworks/ui.py b/modules/hypernetworks/ui.py
index 8b6255e2b67..cce2ef28419 100644
--- a/modules/hypernetworks/ui.py
+++ b/modules/hypernetworks/ui.py
@@ -3,7 +3,7 @@
 import gradio as gr
 import modules.hypernetworks.hypernetwork
 from modules import devices, sd_hijack, shared
-
+from modules.shared import shared_instance
 not_available = ["hardswish", "multiheadattention"]
 keys = [x for x in modules.hypernetworks.hypernetwork.HypernetworkModule.activation_dict if x not in not_available]
 
@@ -32,7 +32,9 @@ def train_hypernetwork(*args):
     except Exception:
         raise
     finally:
-        shared.sd_model.cond_stage_model.to(devices.device)
-        shared.sd_model.first_stage_model.to(devices.device)
+        #shared.sd_model.cond_stage_model.to(devices.device)
+        #shared.sd_model.first_stage_model.to(devices.device)
+        shared_instance.sd_model.cond_stage_model.to(devices.device)
+        shared_instance.sd_model.first_stage_model.to(devices.device)
         sd_hijack.apply_optimizations()
 
diff --git a/modules/images.py b/modules/images.py
index eb644733898..cdf160b7fee 100644
--- a/modules/images.py
+++ b/modules/images.py
@@ -20,6 +20,8 @@
 from modules import sd_samplers, shared, script_callbacks, errors
 from modules.paths_internal import roboto_ttf_file
 from modules.shared import opts
+from modules.shared import shared_instance
+
 
 LANCZOS = (Image.Resampling.LANCZOS if hasattr(Image, 'Resampling') else Image.LANCZOS)
 
@@ -350,8 +352,10 @@ class FilenameGenerator:
         'height': lambda self: self.image.height,
         'styles': lambda self: self.p and sanitize_filename_part(", ".join([style for style in self.p.styles if not style == "None"]) or "None", replace_spaces=False),
         'sampler': lambda self: self.p and sanitize_filename_part(self.p.sampler_name, replace_spaces=False),
-        'model_hash': lambda self: getattr(self.p, "sd_model_hash", shared.sd_model.sd_model_hash),
-        'model_name': lambda self: sanitize_filename_part(shared.sd_model.sd_checkpoint_info.name_for_extra, replace_spaces=False),
+        'model_hash': lambda self: getattr(self.p, "sd_model_hash", shared_instance.sd_model.sd_model_hash),
+        #'model_hash': lambda self: getattr(self.p, "sd_model_hash", shared.sd_model.sd_model_hash),
+        #'model_name': lambda self: sanitize_filename_part(shared.sd_model.sd_checkpoint_info.name_for_extra, replace_spaces=False),
+        'model_name': lambda self: sanitize_filename_part(shared_instance.sd_model.sd_checkpoint_info.name_for_extra, replace_spaces=False),
         'date': lambda self: datetime.datetime.now().strftime('%Y-%m-%d'),
         'datetime': lambda self, *args: self.datetime(*args),  # accepts formats: [datetime], [datetime<Format>], [datetime<Format><Time Zone>]
         'job_timestamp': lambda self: getattr(self.p, "job_timestamp", shared.state.job_timestamp),
diff --git a/modules/img2img.py b/modules/img2img.py
index 1519e132b2b..bc363fa15bc 100644
--- a/modules/img2img.py
+++ b/modules/img2img.py
@@ -14,7 +14,7 @@
 import modules.processing as processing
 from modules.ui import plaintext_to_html
 import modules.scripts
-
+from modules.shared import shared_instance
 
 def process_batch(p, input_dir, output_dir, inpaint_mask_dir, args, to_scale=False, scale_by=1.0, use_png_info=False, png_info_props=None, png_info_dir=None):
     output_dir = output_dir.strip()
@@ -158,7 +158,8 @@ def img2img(id_task: str, mode: int, prompt: str, negative_prompt: str, prompt_s
     assert 0. <= denoising_strength <= 1., 'can only work with strength in [0.0, 1.0]'
 
     p = StableDiffusionProcessingImg2Img(
-        sd_model=shared.sd_model,
+        #sd_model=shared.sd_model,
+        sd_model=shared_instance.sd_model,
         outpath_samples=opts.outdir_samples or opts.outdir_img2img_samples,
         outpath_grids=opts.outdir_grids or opts.outdir_img2img_grids,
         prompt=prompt,
diff --git a/modules/import_hook.py b/modules/import_hook.py
index 28c67dfa897..4ef02d2e828 100644
--- a/modules/import_hook.py
+++ b/modules/import_hook.py
@@ -3,3 +3,15 @@
 # this will break any attempt to import xformers which will prevent stability diffusion repo from trying to use it
 if "--xformers" not in "".join(sys.argv):
     sys.modules["xformers"] = None
+
+
+# Hack to fix a changed import in torchvision 0.17+, which otherwise breaks
+# basicsr; see https://github.com/AUTOMATIC1111/stable-diffusion-webui/issues/13985
+try:
+    import torchvision.transforms.functional_tensor  # noqa: F401
+except ImportError:
+    try:
+        import torchvision.transforms.functional as functional
+        sys.modules["torchvision.transforms.functional_tensor"] = functional
+    except ImportError:
+        pass 
\ No newline at end of file
diff --git a/modules/initialize.py b/modules/initialize.py
index f24f76375db..58e1fced846 100644
--- a/modules/initialize.py
+++ b/modules/initialize.py
@@ -5,7 +5,7 @@
 from threading import Thread
 
 from modules.timer import startup_timer
-
+from modules.shared import shared_instance
 
 def imports():
     logging.getLogger("torch.distributed.nn").setLevel(logging.ERROR)  # sshh...
@@ -51,7 +51,7 @@ def initialize():
     initialize_util.fix_torch_version()
     initialize_util.fix_asyncio_event_loop_policy()
     initialize_util.validate_tls_options()
-    initialize_util.configure_sigint_handler()
+    #initialize_util.configure_sigint_handler()
     initialize_util.configure_opts_onchange()
 
     from modules import modelloader
@@ -144,7 +144,9 @@ def load_model():
         by that time, so we apply optimization again.
         """
 
-        shared.sd_model  # noqa: B018
+        #shared.sd_model  # noqa: B018
+        
+        shared_instance.sd_model = shared.shared_instance.sd_model
 
         if sd_hijack.current_optimizer is None:
             sd_hijack.apply_optimizations()
diff --git a/modules/initialize_util.py b/modules/initialize_util.py
index 2894eee4c1a..275bf546dbe 100644
--- a/modules/initialize_util.py
+++ b/modules/initialize_util.py
@@ -5,6 +5,7 @@
 import re
 
 from modules.timer import startup_timer
+from modules.shared import shared_instance
 
 
 def gradio_server_name():
@@ -172,7 +173,8 @@ def configure_opts_onchange():
     shared.opts.onchange("sd_vae_overrides_per_model_preferences", wrap_queued_call(lambda: sd_vae.reload_vae_weights()), call=False)
     shared.opts.onchange("temp_dir", ui_tempdir.on_tmpdir_changed)
     shared.opts.onchange("gradio_theme", shared.reload_gradio_theme)
-    shared.opts.onchange("cross_attention_optimization", wrap_queued_call(lambda: sd_hijack.model_hijack.redo_hijack(shared.sd_model)), call=False)
+    #shared.opts.onchange("cross_attention_optimization", wrap_queued_call(lambda: sd_hijack.model_hijack.redo_hijack(shared.sd_model)), call=False)
+    shared.opts.onchange("cross_attention_optimization", wrap_queued_call(lambda: sd_hijack.model_hijack.redo_hijack(shared_instance.sd_model)), call=False)
     startup_timer.record("opts onchange")
 
 
diff --git a/modules/launch_utils.py b/modules/launch_utils.py
index 6e54d06367c..1f0a5cb071f 100644
--- a/modules/launch_utils.py
+++ b/modules/launch_utils.py
@@ -30,6 +30,7 @@
     os.environ['GRADIO_ANALYTICS_ENABLED'] = 'False'
 
 
+
 def check_python_version():
     is_windows = platform.system() == "Windows"
     major = sys.version_info.major
@@ -135,7 +136,11 @@ def run_pip(command, desc=None, live=default_command_live):
         return
 
     index_url_line = f' --index-url {index_url}' if index_url != '' else ''
-    return run(f'"{python}" -m pip {command} --prefer-binary{index_url_line}', desc=f"Installing {desc}", errdesc=f"Couldn't install {desc}", live=live)
+
+    if "ENABLE_UV" not in os.environ:
+        return run(f'"{python}" -m pip {command} --prefer-binary{index_url_line}', desc=f"Installing {desc}", errdesc=f"Couldn't install {desc}", live=live)
+    else:
+        return run(f'uv pip {command}{index_url_line}', desc=f"Installing {desc}", errdesc=f"Couldn't install {desc}", live=live)  # keep honouring the configured index URL under uv
 
 
 def check_run_python(code: str) -> bool:
@@ -313,8 +318,8 @@ def prepare_environment():
     requirements_file = os.environ.get('REQS_FILE', "requirements_versions.txt")
 
     xformers_package = os.environ.get('XFORMERS_PACKAGE', 'xformers==0.0.20')
-    clip_package = os.environ.get('CLIP_PACKAGE', "https://github.com/openai/CLIP/archive/d50d76daa670286dd6cacf3bcd80b5e4823fc8e1.zip")
-    openclip_package = os.environ.get('OPENCLIP_PACKAGE', "https://github.com/mlfoundations/open_clip/archive/bb6e834e9c70d9c27d0dc3ecedeebeaeb1ffad6b.zip")
+    clip_package = os.environ.get('CLIP_PACKAGE', "'CLIP @ https://github.com/openai/CLIP/archive/d50d76daa670286dd6cacf3bcd80b5e4823fc8e1.zip'")
+    openclip_package = os.environ.get('OPENCLIP_PACKAGE', "'open_clip @ https://github.com/mlfoundations/open_clip/archive/bb6e834e9c70d9c27d0dc3ecedeebeaeb1ffad6b.zip'")
 
     stable_diffusion_repo = os.environ.get('STABLE_DIFFUSION_REPO', "https://github.com/Stability-AI/stablediffusion.git")
     stable_diffusion_xl_repo = os.environ.get('STABLE_DIFFUSION_XL_REPO', "https://github.com/Stability-AI/generative-models.git")
@@ -428,10 +433,13 @@ def configure_for_tests():
 
 
 def start():
-    print(f"Launching {'API server' if '--nowebui' in sys.argv else 'Web UI'} with arguments: {' '.join(sys.argv[1:])}")
+    print(f"Launching {'API server' if '--nowebui' in sys.argv or '--ray' in sys.argv else 'Web UI'} with arguments: {' '.join(sys.argv[1:])}")
     import webui
+    
     if '--nowebui' in sys.argv:
         webui.api_only()
+    elif '--ray' in sys.argv:
+        webui.ray_api()
     else:
         webui.webui()
 
diff --git a/modules/processing.py b/modules/processing.py
index e124e7f0dd2..78a894d79d5 100644
--- a/modules/processing.py
+++ b/modules/processing.py
@@ -19,7 +19,6 @@
 from modules import devices, prompt_parser, masking, sd_samplers, lowvram, generation_parameters_copypaste, extra_networks, sd_vae_approx, scripts, sd_samplers_common, sd_unet, errors, rng
 from modules.rng import slerp # noqa: F401
 from modules.sd_hijack import model_hijack
-from modules.sd_samplers_common import images_tensor_to_samples, decode_first_stage, approximation_indexes
 from modules.shared import opts, cmd_opts, state
 import modules.shared as shared
 import modules.paths as paths
@@ -33,7 +32,7 @@
 
 from einops import repeat, rearrange
 from blendmodes.blend import blendLayers, BlendType
-
+from modules.shared import shared_instance
 
 # some of those options should not be changed at all because they would break the model, so I removed them from options.
 opt_C = 4
@@ -89,6 +88,7 @@ def create_binary_mask(image):
     return image
 
 def txt2img_image_conditioning(sd_model, x, width, height):
+    from modules.sd_samplers_common import images_tensor_to_samples, approximation_indexes
     if sd_model.model.conditioning_key in {'hybrid', 'concat'}: # Inpainting models
 
         # The "masked-image" in this case will just be all 0.5 since the entire image is masked.
@@ -235,7 +235,8 @@ def __post_init__(self):
 
     @property
     def sd_model(self):
-        return shared.sd_model
+        #return shared.sd_model
+        return shared_instance.sd_model
 
     @sd_model.setter
     def sd_model(self, value):
@@ -277,6 +278,7 @@ def txt2img_image_conditioning(self, x, width=None, height=None):
         return txt2img_image_conditioning(self.sd_model, x, width or self.width, height or self.height)
 
     def depth2img_image_conditioning(self, source_image):
+        from modules.sd_samplers_common import images_tensor_to_samples, approximation_indexes
         # Use the AddMiDaS helper to Format our source image to suit the MiDaS model
         transformer = AddMiDaS(model_type="dpt_hybrid")
         transformed = transformer({"jpg": rearrange(source_image[0], "c h w -> h w c")})
@@ -296,6 +298,7 @@ def depth2img_image_conditioning(self, source_image):
         return conditioning
 
     def edit_image_conditioning(self, source_image):
+        from modules.sd_samplers_common import images_tensor_to_samples, approximation_indexes
         conditioning_image = images_tensor_to_samples(source_image*0.5+0.5, approximation_indexes.get(opts.sd_vae_encode_method))
 
         return conditioning_image
@@ -416,7 +419,8 @@ def cached_params(self, required_prompts, steps, extra_network_data, hires_steps
             hires_steps,
             use_old_scheduling,
             opts.CLIP_stop_at_last_layers,
-            shared.sd_model.sd_checkpoint_info,
+            #shared.sd_model.sd_checkpoint_info,
+            shared_instance.sd_model.sd_checkpoint_info,
             extra_network_data,
             opts.sdxl_crop_left,
             opts.sdxl_crop_top,
@@ -452,8 +456,8 @@ def get_conds_with_caching(self, function, required_prompts, steps, caches, extr
         cache = caches[0]
 
         with devices.autocast():
-            cache[1] = function(shared.sd_model, required_prompts, steps, hires_steps, shared.opts.use_old_scheduling)
-
+            #cache[1] = function(shared.sd_model, required_prompts, steps, hires_steps, shared.opts.use_old_scheduling)
+            cache[1] = function(shared_instance.sd_model, required_prompts, steps, hires_steps, shared.opts.use_old_scheduling)
         cache[0] = cached_params
         return cache[1]
 
@@ -588,6 +592,7 @@ class DecodedSamples(list):
 
 
 def decode_latent_batch(model, batch, target_device=None, check_for_nans=False):
+    from modules.sd_samplers_common import decode_first_stage
     samples = DecodedSamples()
 
     for i in range(batch.shape[0]):
@@ -769,8 +774,10 @@ def process_images_inner(p: StableDiffusionProcessing) -> Processed:
         if p.refiner_checkpoint_info is None:
             raise Exception(f'Could not find checkpoint with name {p.refiner_checkpoint}')
 
-    p.sd_model_name = shared.sd_model.sd_checkpoint_info.name_for_extra
-    p.sd_model_hash = shared.sd_model.sd_model_hash
+    #p.sd_model_name = shared.sd_model.sd_checkpoint_info.name_for_extra
+    #p.sd_model_hash = shared.sd_model.sd_model_hash
+    p.sd_model_name = shared_instance.sd_model.sd_checkpoint_info.name_for_extra
+    p.sd_model_hash = shared_instance.sd_model.sd_model_hash
     p.sd_vae_name = sd_vae.get_loaded_vae_name()
     p.sd_vae_hash = sd_vae.get_loaded_vae_hash()
 
@@ -879,7 +886,8 @@ def process_images_inner(p: StableDiffusionProcessing) -> Processed:
 
             del samples_ddim
 
-            if lowvram.is_enabled(shared.sd_model):
+            #if lowvram.is_enabled(shared.sd_model):
+            if lowvram.is_enabled(shared_instance.sd_model):
                 lowvram.send_everything_to_cpu()
 
             devices.torch_gc()
@@ -1156,6 +1164,7 @@ def sample(self, conditioning, unconditional_conditioning, seeds, subseeds, subs
         return self.sample_hr_pass(samples, decoded_samples, seeds, subseeds, subseed_strength, prompts)
 
     def sample_hr_pass(self, samples, decoded_samples, seeds, subseeds, subseed_strength, prompts):
+        
         if shared.state.interrupted:
             return samples
 
@@ -1189,6 +1198,7 @@ def save_intermediate(image, index):
             # Avoid making the inpainting conditioning unless necessary as
             # this does need some extra compute to decode / encode the image again.
             if getattr(self, "inpainting_mask_weight", shared.opts.inpainting_mask_weight) < 1.0:
+                from modules.sd_samplers_common import decode_first_stage , approximation_indexes
                 image_conditioning = self.img2img_image_conditioning(decode_first_stage(self.sd_model, samples), samples)
             else:
                 image_conditioning = self.txt2img_image_conditioning(samples)
@@ -1212,6 +1222,7 @@ def save_intermediate(image, index):
             decoded_samples = decoded_samples.to(shared.device, dtype=devices.dtype_vae)
 
             if opts.sd_vae_encode_method != 'Full':
+                from modules.sd_samplers_common import images_tensor_to_samples
                 self.extra_generation_params['VAE Encoder'] = opts.sd_vae_encode_method
             samples = images_tensor_to_samples(decoded_samples, approximation_indexes.get(opts.sd_vae_encode_method))
 
@@ -1315,7 +1326,8 @@ def setup_conds(self):
             if shared.opts.hires_fix_use_firstpass_conds:
                 self.calculate_hr_conds()
 
-            elif lowvram.is_enabled(shared.sd_model) and shared.sd_model.sd_checkpoint_info == sd_models.select_checkpoint():  # if in lowvram mode, we need to calculate conds right away, before the cond NN is unloaded
+            elif lowvram.is_enabled(shared_instance.sd_model) and shared_instance.sd_model.sd_checkpoint_info == sd_models.select_checkpoint():  # if in lowvram mode, we need to calculate conds right away, before the cond NN is unloaded
+            #elif lowvram.is_enabled(shared.sd_model) and shared.sd_model.sd_checkpoint_info == sd_models.select_checkpoint():  # if in lowvram mode, we need to calculate conds right away, before the cond NN is unloaded
                 with devices.autocast():
                     extra_networks.activate(self, self.hr_extra_network_data)
 
@@ -1387,7 +1399,10 @@ def mask_blur(self, value):
             self.mask_blur_y = value
 
     def init(self, all_prompts, all_seeds, all_subseeds):
-        self.image_cfg_scale: float = self.image_cfg_scale if shared.sd_model.cond_stage_key == "edit" else None
+        from modules.sd_samplers_common import images_tensor_to_samples, approximation_indexes
+        #self.image_cfg_scale: float = self.image_cfg_scale if shared.sd_model.cond_stage_key == "edit" else None
+        self.image_cfg_scale: float = self.image_cfg_scale if shared_instance.sd_model.cond_stage_key == "edit" else None
+
 
         self.sampler = sd_samplers.create_sampler(self.sampler_name, self.sd_model)
         crop_region = None
diff --git a/modules/sd_samplers.py b/modules/sd_samplers.py
index 45faae62821..745b2911a7f 100644
--- a/modules/sd_samplers.py
+++ b/modules/sd_samplers.py
@@ -56,4 +56,4 @@ def visible_sampler_names():
     return [x.name for x in samplers if x.name not in samplers_hidden]
 
 
-set_samplers()
+#set_samplers()
diff --git a/modules/sd_samplers_cfg_denoiser.py b/modules/sd_samplers_cfg_denoiser.py
index b8101d38dc3..0af6add03dd 100644
--- a/modules/sd_samplers_cfg_denoiser.py
+++ b/modules/sd_samplers_cfg_denoiser.py
@@ -6,7 +6,7 @@
 from modules.script_callbacks import CFGDenoiserParams, cfg_denoiser_callback
 from modules.script_callbacks import CFGDenoisedParams, cfg_denoised_callback
 from modules.script_callbacks import AfterCFGCallbackParams, cfg_after_cfg_callback
-
+from modules.shared import shared_instance
 
 def catenate_conds(conds):
     if not isinstance(conds[0], dict):
@@ -98,7 +98,8 @@ def forward(self, x, sigma, uncond, cond, cond_scale, s_min_uncond, image_cond):
 
         # at self.image_cfg_scale == 1.0 produced results for edit model are the same as with normal sampling,
         # so is_edit_model is set to False to support AND composition.
-        is_edit_model = shared.sd_model.cond_stage_key == "edit" and self.image_cfg_scale is not None and self.image_cfg_scale != 1.0
+        #is_edit_model = shared.sd_model.cond_stage_key == "edit" and self.image_cfg_scale is not None and self.image_cfg_scale != 1.0
+        is_edit_model = shared_instance.sd_model.cond_stage_key == "edit" and self.image_cfg_scale is not None and self.image_cfg_scale != 1.0
 
         conds_list, tensor = prompt_parser.reconstruct_multicond_batch(cond, self.step)
         uncond = prompt_parser.reconstruct_cond_batch(uncond, self.step)
@@ -111,7 +112,8 @@ def forward(self, x, sigma, uncond, cond, cond_scale, s_min_uncond, image_cond):
         batch_size = len(conds_list)
         repeats = [len(conds_list[i]) for i in range(batch_size)]
 
-        if shared.sd_model.model.conditioning_key == "crossattn-adm":
+        #if shared.sd_model.model.conditioning_key == "crossattn-adm":
+        if shared_instance.sd_model.model.conditioning_key == "crossattn-adm":
             image_uncond = torch.zeros_like(image_cond)
             make_condition_dict = lambda c_crossattn, c_adm: {"c_crossattn": [c_crossattn], "c_adm": c_adm}
         else:
@@ -147,7 +149,8 @@ def forward(self, x, sigma, uncond, cond, cond_scale, s_min_uncond, image_cond):
 
         self.padded_cond_uncond = False
         if shared.opts.pad_cond_uncond and tensor.shape[1] != uncond.shape[1]:
-            empty = shared.sd_model.cond_stage_model_empty_prompt
+            #empty = shared.sd_model.cond_stage_model_empty_prompt
+            empty = shared_instance.sd_model.cond_stage_model_empty_prompt
             num_repeats = (tensor.shape[1] - uncond.shape[1]) // empty.shape[1]
 
             if num_repeats < 0:
diff --git a/modules/sd_samplers_common.py b/modules/sd_samplers_common.py
index 58efcad2374..d4e66cb948a 100644
--- a/modules/sd_samplers_common.py
+++ b/modules/sd_samplers_common.py
@@ -3,10 +3,10 @@
 import numpy as np
 import torch
 from PIL import Image
-from modules import devices, images, sd_vae_approx, sd_samplers, sd_vae_taesd, shared, sd_models
+from modules import devices, images, sd_vae_approx, sd_vae_taesd, shared, sd_models
 from modules.shared import opts, state
 import k_diffusion.sampling
-
+from modules.shared import shared_instance
 
 SamplerDataTuple = namedtuple('SamplerData', ['name', 'constructor', 'aliases', 'options'])
 
@@ -41,7 +41,8 @@ def samples_to_images_tensor(sample, approximation=None, model=None):
         approximation = approximation_indexes.get(opts.show_progress_type, 0)
 
         from modules import lowvram
-        if approximation == 0 and lowvram.is_enabled(shared.sd_model) and not shared.opts.live_preview_allow_lowvram_full:
+        if approximation == 0 and lowvram.is_enabled(shared_instance.sd_model) and not shared.opts.live_preview_allow_lowvram_full:
+        #if approximation == 0 and lowvram.is_enabled(shared.sd_model) and not shared.opts.live_preview_allow_lowvram_full:
             approximation = 1
 
     if approximation == 2:
@@ -53,7 +54,8 @@ def samples_to_images_tensor(sample, approximation=None, model=None):
         x_sample = x_sample * 2 - 1
     else:
         if model is None:
-            model = shared.sd_model
+            #model = shared.sd_model
+            model = shared_instance.sd_model
         with devices.without_autocast(): # fixes an issue with unstable VAEs that are flaky even in fp32
             x_sample = model.decode_first_stage(sample.to(model.first_stage_model.dtype))
 
@@ -94,7 +96,8 @@ def images_tensor_to_samples(image, approximation=None, model=None):
         x_latent = sd_vae_taesd.encoder_model()(image)
     else:
         if model is None:
-            model = shared.sd_model
+            #model = shared.sd_model
+            model = shared_instance.sd_model
         model.first_stage_model.to(devices.dtype_vae)
 
         image = image.to(shared.device, dtype=devices.dtype_vae)
@@ -122,8 +125,8 @@ def store_latent(decoded):
 
 def is_sampler_using_eta_noise_seed_delta(p):
     """returns whether sampler from config will use eta noise seed delta for image creation"""
-
-    sampler_config = sd_samplers.find_sampler_config(p.sampler_name)
+    from modules.sd_samplers import find_sampler_config
+    sampler_config = find_sampler_config(p.sampler_name)
 
     eta = p.eta
 
@@ -163,7 +166,8 @@ def apply_refiner(cfg_denoiser):
     if refiner_switch_at is not None and completed_ratio < refiner_switch_at:
         return False
 
-    if refiner_checkpoint_info is None or shared.sd_model.sd_checkpoint_info == refiner_checkpoint_info:
+    if refiner_checkpoint_info is None or shared_instance.sd_model.sd_checkpoint_info == refiner_checkpoint_info:
+    #if refiner_checkpoint_info is None or shared.sd_model.sd_checkpoint_info == refiner_checkpoint_info:
         return False
 
     if getattr(cfg_denoiser.p, "enable_hr", False):
@@ -235,7 +239,8 @@ def __init__(self, funcname):
         self.eta_infotext_field = 'Eta'
         self.eta_default = 1.0
 
-        self.conditioning_key = shared.sd_model.model.conditioning_key
+        #self.conditioning_key = shared.sd_model.model.conditioning_key
+        self.conditioning_key = shared_instance.sd_model.model.conditioning_key
 
         self.p = None
         self.model_wrap_cfg = None
diff --git a/modules/sd_samplers_kdiffusion.py b/modules/sd_samplers_kdiffusion.py
index 8a8c87e0d01..9989dec5747 100644
--- a/modules/sd_samplers_kdiffusion.py
+++ b/modules/sd_samplers_kdiffusion.py
@@ -1,10 +1,11 @@
 import torch
 import inspect
 import k_diffusion.sampling
-from modules import sd_samplers_common, sd_samplers_extra, sd_samplers_cfg_denoiser
+from modules.sd_samplers_common import SamplerData, Sampler, setup_img2img_steps
+from modules import sd_samplers_extra, sd_samplers_cfg_denoiser
 from modules.sd_samplers_cfg_denoiser import CFGDenoiser  # noqa: F401
 from modules.script_callbacks import ExtraNoiseParams, extra_noise_callback
-
+from modules.shared import shared_instance
 from modules.shared import opts
 import modules.shared as shared
 
@@ -40,7 +41,7 @@
 
 
 samplers_data_k_diffusion = [
-    sd_samplers_common.SamplerData(label, lambda model, funcname=funcname: KDiffusionSampler(funcname, model), aliases, options)
+    SamplerData(label, lambda model, funcname=funcname: KDiffusionSampler(funcname, model), aliases, options)
     for label, funcname, aliases, options in samplers_k_diffusion
     if callable(funcname) or hasattr(k_diffusion.sampling, funcname)
 ]
@@ -70,13 +71,14 @@ class CFGDenoiserKDiffusion(sd_samplers_cfg_denoiser.CFGDenoiser):
     @property
     def inner_model(self):
         if self.model_wrap is None:
-            denoiser = k_diffusion.external.CompVisVDenoiser if shared.sd_model.parameterization == "v" else k_diffusion.external.CompVisDenoiser
-            self.model_wrap = denoiser(shared.sd_model, quantize=shared.opts.enable_quantization)
-
+            #denoiser = k_diffusion.external.CompVisVDenoiser if shared.sd_model.parameterization == "v" else k_diffusion.external.CompVisDenoiser
+            denoiser = k_diffusion.external.CompVisVDenoiser if shared_instance.sd_model.parameterization == "v" else k_diffusion.external.CompVisDenoiser
+            #self.model_wrap = denoiser(shared.sd_model, quantize=shared.opts.enable_quantization)
+            self.model_wrap = denoiser(shared_instance.sd_model, quantize=shared.opts.enable_quantization)
         return self.model_wrap
 
 
-class KDiffusionSampler(sd_samplers_common.Sampler):
+class KDiffusionSampler(Sampler):
     def __init__(self, funcname, sd_model, options=None):
         super().__init__(funcname)
 
@@ -139,7 +141,7 @@ def get_sigmas(self, p, steps):
         return sigmas
 
     def sample_img2img(self, p, x, noise, conditioning, unconditional_conditioning, steps=None, image_conditioning=None):
-        steps, t_enc = sd_samplers_common.setup_img2img_steps(p, steps)
+        steps, t_enc = setup_img2img_steps(p, steps)
 
         sigmas = self.get_sigmas(p, steps)
         sigma_sched = sigmas[steps - t_enc - 1:]
diff --git a/modules/sd_samplers_timesteps.py b/modules/sd_samplers_timesteps.py
index b17a8f93c2b..fd1ee63f911 100644
--- a/modules/sd_samplers_timesteps.py
+++ b/modules/sd_samplers_timesteps.py
@@ -4,7 +4,7 @@
 from modules import devices, sd_samplers_common, sd_samplers_timesteps_impl
 from modules.sd_samplers_cfg_denoiser import CFGDenoiser
 from modules.script_callbacks import ExtraNoiseParams, extra_noise_callback
-
+from modules.shared import shared_instance
 from modules.shared import opts
 import modules.shared as shared
 
@@ -49,7 +49,8 @@ class CFGDenoiserTimesteps(CFGDenoiser):
     def __init__(self, sampler):
         super().__init__(sampler)
 
-        self.alphas = shared.sd_model.alphas_cumprod
+        #self.alphas = shared.sd_model.alphas_cumprod
+        self.alphas = shared_instance.sd_model.alphas_cumprod
         self.mask_before_denoising = True
 
     def get_pred_x0(self, x_in, x_out, sigma):
@@ -65,8 +66,10 @@ def get_pred_x0(self, x_in, x_out, sigma):
     @property
     def inner_model(self):
         if self.model_wrap is None:
-            denoiser = CompVisTimestepsVDenoiser if shared.sd_model.parameterization == "v" else CompVisTimestepsDenoiser
-            self.model_wrap = denoiser(shared.sd_model)
+            #denoiser = CompVisTimestepsVDenoiser if shared.sd_model.parameterization == "v" else CompVisTimestepsDenoiser
+            denoiser = CompVisTimestepsVDenoiser if shared_instance.sd_model.parameterization == "v" else CompVisTimestepsDenoiser
+            #self.model_wrap = denoiser(shared.sd_model)
+            self.model_wrap = denoiser(shared_instance.sd_model)
 
         return self.model_wrap
 
@@ -99,7 +102,8 @@ def sample_img2img(self, p, x, noise, conditioning, unconditional_conditioning,
         timesteps = self.get_timesteps(p, steps)
         timesteps_sched = timesteps[:t_enc]
 
-        alphas_cumprod = shared.sd_model.alphas_cumprod
+        #alphas_cumprod = shared.sd_model.alphas_cumprod
+        alphas_cumprod = shared_instance.sd_model.alphas_cumprod
         sqrt_alpha_cumprod = torch.sqrt(alphas_cumprod[timesteps[t_enc]])
         sqrt_one_minus_alpha_cumprod = torch.sqrt(1 - alphas_cumprod[timesteps[t_enc]])
 
diff --git a/modules/sd_unet.py b/modules/sd_unet.py
index 5525cfbc3a0..37a5162767f 100644
--- a/modules/sd_unet.py
+++ b/modules/sd_unet.py
@@ -2,6 +2,7 @@
 import ldm.modules.diffusionmodules.openaimodel
 
 from modules import script_callbacks, shared, devices
+from modules.shared import shared_instance
 
 unet_options = []
 current_unet_option = None
@@ -22,7 +23,8 @@ def get_unet_option(option=None):
         return None
 
     if option == "Automatic":
-        name = shared.sd_model.sd_checkpoint_info.model_name
+        #name = shared.sd_model.sd_checkpoint_info.model_name
+        name = shared_instance.sd_model.sd_checkpoint_info.model_name
 
         options = [x for x in unet_options if x.model_name == name]
 
@@ -47,12 +49,15 @@ def apply_unet(option=None):
     if current_unet_option is None:
         current_unet = None
 
-        if not shared.sd_model.lowvram:
-            shared.sd_model.model.diffusion_model.to(devices.device)
+        #if not shared.sd_model.lowvram:
+        #    shared.sd_model.model.diffusion_model.to(devices.device)
+        if not shared_instance.sd_model.lowvram:
+            shared_instance.sd_model.model.diffusion_model.to(devices.device)
 
         return
 
-    shared.sd_model.model.diffusion_model.to(devices.cpu)
+    #shared.sd_model.model.diffusion_model.to(devices.cpu)
+    shared_instance.sd_model.model.diffusion_model.to(devices.cpu)
     devices.torch_gc()
 
     current_unet = current_unet_option.create_unet()
diff --git a/modules/sd_vae.py b/modules/sd_vae.py
index 31306d8ba4b..05baccf59f0 100644
--- a/modules/sd_vae.py
+++ b/modules/sd_vae.py
@@ -3,6 +3,7 @@
 from dataclasses import dataclass
 
 from modules import paths, shared, devices, script_callbacks, sd_models, extra_networks, lowvram, sd_hijack, hashes
+from modules.shared import shared_instance
 
 import glob
 from copy import deepcopy
@@ -250,7 +251,8 @@ def clear_loaded_vae():
 
 def reload_vae_weights(sd_model=None, vae_file=unspecified):
     if not sd_model:
-        sd_model = shared.sd_model
+        #sd_model = shared.sd_model
+        sd_model = shared_instance.sd_model
 
     checkpoint_info = sd_model.sd_checkpoint_info
     checkpoint_file = checkpoint_info.filename
diff --git a/modules/sd_vae_approx.py b/modules/sd_vae_approx.py
index 3965e223e6f..65da156a044 100644
--- a/modules/sd_vae_approx.py
+++ b/modules/sd_vae_approx.py
@@ -3,7 +3,7 @@
 import torch
 from torch import nn
 from modules import devices, paths, shared
-
+from modules.shared import shared_instance
 sd_vae_approx_models = {}
 
 
@@ -40,7 +40,8 @@ def download_model(model_path, model_url):
 
 
 def model():
-    model_name = "vaeapprox-sdxl.pt" if getattr(shared.sd_model, 'is_sdxl', False) else "model.pt"
+    model_name = "vaeapprox-sdxl.pt" if getattr(shared_instance.sd_model, 'is_sdxl', False) else "model.pt"
+    #model_name = "vaeapprox-sdxl.pt" if getattr(shared.sd_model, 'is_sdxl', False) else "model.pt"
     loaded_model = sd_vae_approx_models.get(model_name)
 
     if loaded_model is None:
@@ -64,7 +65,8 @@ def model():
 def cheap_approximation(sample):
     # https://discuss.huggingface.co/t/decoding-latents-to-rgb-without-upscaling/23204/2
 
-    if shared.sd_model.is_sdxl:
+    #if shared.sd_model.is_sdxl:
+    if shared_instance.sd_model.is_sdxl:
         coeffs = [
             [ 0.3448,  0.4168,  0.4395],
             [-0.1953, -0.0290,  0.0250],
diff --git a/modules/sd_vae_taesd.py b/modules/sd_vae_taesd.py
index 808eb3624fd..9a7a1acc92e 100644
--- a/modules/sd_vae_taesd.py
+++ b/modules/sd_vae_taesd.py
@@ -9,6 +9,7 @@
 import torch.nn as nn
 
 from modules import devices, paths_internal, shared
+from modules.shared import shared_instance
 
 sd_vae_taesd_models = {}
 
@@ -87,7 +88,8 @@ def download_model(model_path, model_url):
 
 
 def decoder_model():
-    model_name = "taesdxl_decoder.pth" if getattr(shared.sd_model, 'is_sdxl', False) else "taesd_decoder.pth"
+    model_name = "taesdxl_decoder.pth" if getattr(shared_instance.sd_model, 'is_sdxl', False) else "taesd_decoder.pth"
+    #model_name = "taesdxl_decoder.pth" if getattr(shared.sd_model, 'is_sdxl', False) else "taesd_decoder.pth"
     loaded_model = sd_vae_taesd_models.get(model_name)
 
     if loaded_model is None:
@@ -106,7 +108,8 @@ def decoder_model():
 
 
 def encoder_model():
-    model_name = "taesdxl_encoder.pth" if getattr(shared.sd_model, 'is_sdxl', False) else "taesd_encoder.pth"
+    model_name = "taesdxl_encoder.pth" if getattr(shared_instance.sd_model, 'is_sdxl', False) else "taesd_encoder.pth"
+    #model_name = "taesdxl_encoder.pth" if getattr(shared.sd_model, 'is_sdxl', False) else "taesd_encoder.pth"
     loaded_model = sd_vae_taesd_models.get(model_name)
 
     if loaded_model is None:
diff --git a/modules/shared.py b/modules/shared.py
index 636619391fc..08cff270897 100644
--- a/modules/shared.py
+++ b/modules/shared.py
@@ -1,7 +1,7 @@
 import sys
 
 import gradio as gr
-
+from modules.shared_items import Shared
 from modules import shared_cmd_options, shared_gradio_themes, options, shared_items, sd_models_types
 from modules.paths_internal import models_path, script_path, data_path, sd_configs_path, sd_default_config, sd_model_file, default_sd_model_file, extensions_dir, extensions_builtin_dir  # noqa: F401
 from modules import util
@@ -85,3 +85,6 @@
 refresh_checkpoints = shared_items.refresh_checkpoints
 list_samplers = shared_items.list_samplers
 reload_hypernetworks = shared_items.reload_hypernetworks
+
+# Module-level Shared instance; importers reach the model through shared_instance.sd_model.
+shared_instance = Shared()
diff --git a/modules/shared_items.py b/modules/shared_items.py
index 84d69c8df43..960518fe02e 100644
--- a/modules/shared_items.py
+++ b/modules/shared_items.py
@@ -95,7 +95,8 @@ def ui_reorder_categories():
     yield "scripts"
 
 
-class Shared(sys.modules[__name__].__class__):
+#class Shared(sys.modules[__name__].__class__):
+class Shared:
     """
     this class is here to provide sd_model field as a property, so that it can be created and loaded on demand rather than
     at program startup.
@@ -115,5 +116,10 @@ def sd_model(self, value):
 
         modules.sd_models.model_data.set_sd_model(value)
 
+    def __reduce__(self):
+        """Pickle support: an instance is rebuilt by calling the class with no arguments."""
+        # sd_model is left out of the reduce arguments, so the model object
+        # itself is not serialized together with this instance.
+        return (self.__class__, ())
 
-sys.modules['modules.shared'].__class__ = Shared
+#sys.modules['modules.shared'].__class__ = Shared
diff --git a/modules/textual_inversion/dataset.py b/modules/textual_inversion/dataset.py
index 7ee05061545..4fb0d44894a 100644
--- a/modules/textual_inversion/dataset.py
+++ b/modules/textual_inversion/dataset.py
@@ -12,7 +12,7 @@
 import tqdm
 from modules import devices, shared
 import re
-
+from modules.shared import shared_instance
 from ldm.modules.distributions.distributions import DiagonalGaussianDistribution
 
 re_numbers_at_start = re.compile(r"^[-\d]+\s*")
@@ -169,7 +169,8 @@ def __getitem__(self, i):
         if self.tag_drop_out != 0 or self.shuffle_tags:
             entry.cond_text = self.create_text(entry.filename_text)
         if self.latent_sampling_method == "random":
-            entry.latent_sample = shared.sd_model.get_first_stage_encoding(entry.latent_dist).to(devices.cpu)
+            #entry.latent_sample = shared.sd_model.get_first_stage_encoding(entry.latent_dist).to(devices.cpu)
+            entry.latent_sample = shared_instance.sd_model.get_first_stage_encoding(entry.latent_dist).to(devices.cpu)
         return entry
 
 
diff --git a/modules/textual_inversion/textual_inversion.py b/modules/textual_inversion/textual_inversion.py
index aa79dc09843..98c16dfcf75 100644
--- a/modules/textual_inversion/textual_inversion.py
+++ b/modules/textual_inversion/textual_inversion.py
@@ -19,6 +19,7 @@
 
 from modules.textual_inversion.image_embedding import embedding_to_b64, embedding_from_b64, insert_image_data_embed, extract_image_data_embed, caption_image_overlay
 from modules.textual_inversion.logging import save_settings_to_file
+from modules.shared import shared_instance
 
 
 TextualInversionTemplate = namedtuple("TextualInversionTemplate", ["name", "path"])
@@ -151,7 +152,8 @@ def register_embedding_by_name(self, embedding, model, name):
         return embedding
 
     def get_expected_shape(self):
-        vec = shared.sd_model.cond_stage_model.encode_embedding_init_text(",", 1)
+        # Probe the conditioning model with ","; dimension 1 of the result is the expected shape.
+        vec = shared_instance.sd_model.cond_stage_model.encode_embedding_init_text(",", 1)
         return vec.shape[1]
 
     def load_from_file(self, path, filename):
@@ -217,7 +219,8 @@ def load_from_file(self, path, filename):
         embedding.set_hash(hashes.sha256(embedding.filename, "textual_inversion/" + name) or '')
 
         if self.expected_shape == -1 or self.expected_shape == embedding.shape:
-            self.register_embedding(embedding, shared.sd_model)
+            #self.register_embedding(embedding, shared.sd_model)
+            self.register_embedding(embedding, shared_instance.sd_model)
         else:
             self.skipped_embeddings[name] = embedding
 
@@ -286,7 +289,8 @@ def find_embedding_at_position(self, tokens, offset):
 
 
 def create_embedding(name, num_vectors_per_token, overwrite_old, init_text='*'):
-    cond_model = shared.sd_model.cond_stage_model
+    #cond_model = shared.sd_model.cond_stage_model
+    cond_model = shared_instance.sd_model.cond_stage_model
 
     with devices.autocast():
         cond_model([""])  # will send cond model to GPU if lowvram/medvram is active
@@ -447,7 +451,9 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
 
     pin_memory = shared.opts.pin_memory
 
-    ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=embedding_name, model=shared.sd_model, cond_model=shared.sd_model.cond_stage_model, device=devices.device, template_file=template_file, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
+    ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=embedding_name, model=shared_instance.sd_model, cond_model=shared_instance.sd_model.cond_stage_model, device=devices.device, template_file=template_file, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
+
+    #ds = modules.textual_inversion.dataset.PersonalizedBase(data_root=data_root, width=training_width, height=training_height, repeats=shared.opts.training_image_repeats_per_epoch, placeholder_token=embedding_name, model=shared.sd_model, cond_model=shared.sd_model.cond_stage_model, device=devices.device, template_file=template_file, batch_size=batch_size, gradient_step=gradient_step, shuffle_tags=shuffle_tags, tag_drop_out=tag_drop_out, latent_sampling_method=latent_sampling_method, varsize=varsize, use_weight=use_weight)
 
     if shared.opts.save_training_settings_to_txt:
         save_settings_to_file(log_directory, {**dict(model_name=checkpoint.model_name, model_hash=checkpoint.shorthash, num_of_dataset_images=len(ds), num_vectors_per_token=len(embedding.vec)), **locals()})
@@ -458,7 +464,8 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
 
     if unload:
         shared.parallel_processing_allowed = False
-        shared.sd_model.first_stage_model.to(devices.cpu)
+        #shared.sd_model.first_stage_model.to(devices.cpu)
+        shared_instance.sd_model.first_stage_model.to(devices.cpu)
 
     embedding.vec.requires_grad = True
     optimizer = torch.optim.AdamW([embedding.vec], lr=scheduler.learn_rate, weight_decay=0.0)
@@ -490,7 +497,8 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
     forced_filename = "<none>"
     embedding_yet_to_be_embedded = False
 
-    is_training_inpainting_model = shared.sd_model.model.conditioning_key in {'hybrid', 'concat'}
+    #is_training_inpainting_model = shared.sd_model.model.conditioning_key in {'hybrid', 'concat'}
+    is_training_inpainting_model = shared_instance.sd_model.model.conditioning_key in {'hybrid', 'concat'}
     img_c = None
 
     pbar = tqdm.tqdm(total=steps - initial_step)
@@ -519,21 +527,24 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
                     x = batch.latent_sample.to(devices.device, non_blocking=pin_memory)
                     if use_weight:
                         w = batch.weight.to(devices.device, non_blocking=pin_memory)
-                    c = shared.sd_model.cond_stage_model(batch.cond_text)
+                    #c = shared.sd_model.cond_stage_model(batch.cond_text)
+                    c = shared_instance.sd_model.cond_stage_model(batch.cond_text)
 
                     if is_training_inpainting_model:
                         if img_c is None:
-                            img_c = processing.txt2img_image_conditioning(shared.sd_model, c, training_width, training_height)
-
+                            #img_c = processing.txt2img_image_conditioning(shared.sd_model, c, training_width, training_height)
+                            img_c = processing.txt2img_image_conditioning(shared_instance.sd_model, c, training_width, training_height)
                         cond = {"c_concat": [img_c], "c_crossattn": [c]}
                     else:
                         cond = c
 
                     if use_weight:
-                        loss = shared.sd_model.weighted_forward(x, cond, w)[0] / gradient_step
+                        #loss = shared.sd_model.weighted_forward(x, cond, w)[0] / gradient_step
+                        loss = shared_instance.sd_model.weighted_forward(x, cond, w)[0] / gradient_step
                         del w
                     else:
-                        loss = shared.sd_model.forward(x, cond)[0] / gradient_step
+                        #loss = shared.sd_model.forward(x, cond)[0] / gradient_step
+                        loss = shared_instance.sd_model.forward(x, cond)[0] / gradient_step
                     del x
 
                     _loss_step += loss.item()
@@ -577,14 +588,21 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
                     forced_filename = f'{embedding_name}-{steps_done}'
                     last_saved_image = os.path.join(images_dir, forced_filename)
 
-                    shared.sd_model.first_stage_model.to(devices.device)
+                    #shared.sd_model.first_stage_model.to(devices.device)
+                    shared_instance.sd_model.first_stage_model.to(devices.device)
 
+                    #p = processing.StableDiffusionProcessingTxt2Img(
+                    #    sd_model=shared.sd_model,
+                    #    do_not_save_grid=True,
+                    #    do_not_save_samples=True,
+                    #    do_not_reload_embeddings=True,
+                    #)
                     p = processing.StableDiffusionProcessingTxt2Img(
-                        sd_model=shared.sd_model,
-                        do_not_save_grid=True,
-                        do_not_save_samples=True,
-                        do_not_reload_embeddings=True,
-                    )
+                                            sd_model=shared_instance.sd_model,
+                                            do_not_save_grid=True,
+                                            do_not_save_samples=True,
+                                            do_not_reload_embeddings=True,
+                                        )
 
                     if preview_from_txt2img:
                         p.prompt = preview_prompt
@@ -608,7 +626,8 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
                         image = processed.images[0] if len(processed.images) > 0 else None
 
                     if unload:
-                        shared.sd_model.first_stage_model.to(devices.cpu)
+                        #shared.sd_model.first_stage_model.to(devices.cpu)
+                        shared_instance.sd_model.first_stage_model.to(devices.cpu)
 
                     if image is not None:
                         shared.state.assign_current_image(image)
@@ -666,7 +685,8 @@ def train_embedding(id_task, embedding_name, learn_rate, batch_size, gradient_st
     finally:
         pbar.leave = False
         pbar.close()
-        shared.sd_model.first_stage_model.to(devices.device)
+        #shared.sd_model.first_stage_model.to(devices.device)
+        shared_instance.sd_model.first_stage_model.to(devices.device)
         shared.parallel_processing_allowed = old_parallel_processing_allowed
         sd_hijack_checkpoint.remove()
 
diff --git a/modules/txt2img.py b/modules/txt2img.py
index 1ee592ad944..61db75256d1 100644
--- a/modules/txt2img.py
+++ b/modules/txt2img.py
@@ -7,13 +7,14 @@
 import modules.shared as shared
 from modules.ui import plaintext_to_html
 import gradio as gr
-
+from modules.shared import shared_instance
 
 def txt2img(id_task: str, prompt: str, negative_prompt: str, prompt_styles, steps: int, sampler_name: str, n_iter: int, batch_size: int, cfg_scale: float, height: int, width: int, enable_hr: bool, denoising_strength: float, hr_scale: float, hr_upscaler: str, hr_second_pass_steps: int, hr_resize_x: int, hr_resize_y: int, hr_checkpoint_name: str, hr_sampler_name: str, hr_prompt: str, hr_negative_prompt, override_settings_texts, request: gr.Request, *args):
     override_settings = create_override_settings_dict(override_settings_texts)
 
     p = processing.StableDiffusionProcessingTxt2Img(
-        sd_model=shared.sd_model,
+        #sd_model=shared.sd_model,
+        sd_model=shared_instance.sd_model,
         outpath_samples=opts.outdir_samples or opts.outdir_txt2img_samples,
         outpath_grids=opts.outdir_grids or opts.outdir_txt2img_grids,
         prompt=prompt,
diff --git a/modules/ui.py b/modules/ui.py
index 579bab9800c..b5eae9e8a1e 100644
--- a/modules/ui.py
+++ b/modules/ui.py
@@ -29,7 +29,7 @@
 from modules import prompt_parser
 from modules.sd_hijack import model_hijack
 from modules.generation_parameters_copypaste import image_from_url_text
-
+from modules.shared import shared_instance
 create_setting_component = ui_settings.create_setting_component
 
 warnings.filterwarnings("default" if opts.show_warnings else "ignore", category=UserWarning)
@@ -1294,8 +1294,8 @@ def get_textual_inversion_template_names():
         gr.HTML(footer, elem_id="footer")
 
         settings.add_functionality(demo)
-
-        update_image_cfg_scale_visibility = lambda: gr.update(visible=shared.sd_model and shared.sd_model.cond_stage_key == "edit")
+        #update_image_cfg_scale_visibility = lambda: gr.update(visible=shared.sd_model and shared.sd_model.cond_stage_key == "edit")
+        update_image_cfg_scale_visibility = lambda: gr.update(visible=shared_instance.sd_model and shared_instance.sd_model.cond_stage_key == "edit")
         settings.text_settings.change(fn=update_image_cfg_scale_visibility, inputs=[], outputs=[image_cfg_scale])
         demo.load(fn=update_image_cfg_scale_visibility, inputs=[], outputs=[image_cfg_scale])
 
diff --git a/modules/ui_extra_networks_checkpoints_user_metadata.py b/modules/ui_extra_networks_checkpoints_user_metadata.py
index 25df0a8079b..9cee11f9b11 100644
--- a/modules/ui_extra_networks_checkpoints_user_metadata.py
+++ b/modules/ui_extra_networks_checkpoints_user_metadata.py
@@ -2,7 +2,7 @@
 
 from modules import ui_extra_networks_user_metadata, sd_vae, shared
 from modules.ui_common import create_refresh_button
-
+from modules.shared import shared_instance
 
 class CheckpointUserMetadataEditor(ui_extra_networks_user_metadata.UserMetadataEditor):
     def __init__(self, ui, tabname, page):
@@ -19,7 +19,8 @@ def save_user_metadata(self, name, desc, notes, vae):
         self.write_user_metadata(name, user_metadata)
 
     def update_vae(self, name):
-        if name == shared.sd_model.sd_checkpoint_info.name_for_extra:
+        if name == shared_instance.sd_model.sd_checkpoint_info.name_for_extra:
+            # Reload VAE weights only when `name` matches the shared model's checkpoint.
             sd_vae.reload_vae_weights()
 
     def put_values_into_components(self, name):
diff --git a/requirements.txt b/requirements.txt
index 80b438455ce..cf0e68fbd77 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -32,3 +32,6 @@ torch
 torchdiffeq
 torchsde
 transformers==4.30.2
+ray[default]
+ray[serve]
+ray[client]
diff --git a/requirements_versions.txt b/requirements_versions.txt
index f8ae1f385ae..9d7e56ba94c 100644
--- a/requirements_versions.txt
+++ b/requirements_versions.txt
@@ -29,3 +29,6 @@ torch
 torchdiffeq==0.2.3
 torchsde==0.2.5
 transformers==4.30.2
+ray[default]
+ray[serve]
+ray[client]
diff --git a/scripts/img2imgalt.py b/scripts/img2imgalt.py
index 1e833fa898f..6ee58ab5f03 100644
--- a/scripts/img2imgalt.py
+++ b/scripts/img2imgalt.py
@@ -7,7 +7,7 @@
 import gradio as gr
 
 from modules import processing, shared, sd_samplers, sd_samplers_common
-
+from modules.shared import shared_instance
 import torch
 import k_diffusion as K
 
@@ -15,11 +15,17 @@ def find_noise_for_image(p, cond, uncond, cfg_scale, steps):
     x = p.init_latent
 
     s_in = x.new_ones([x.shape[0]])
-    if shared.sd_model.parameterization == "v":
-        dnw = K.external.CompVisVDenoiser(shared.sd_model)
+    #if shared.sd_model.parameterization == "v":
+    #    dnw = K.external.CompVisVDenoiser(shared.sd_model)
+    #    skip = 1
+    #else:
+    #    dnw = K.external.CompVisDenoiser(shared.sd_model)
+    #    skip = 0
+    if shared_instance.sd_model.parameterization == "v":
+        dnw = K.external.CompVisVDenoiser(shared_instance.sd_model)
         skip = 1
     else:
-        dnw = K.external.CompVisDenoiser(shared.sd_model)
+        dnw = K.external.CompVisDenoiser(shared_instance.sd_model)
         skip = 0
     sigmas = dnw.get_sigmas(steps).flip(0)
 
@@ -38,7 +44,8 @@ def find_noise_for_image(p, cond, uncond, cfg_scale, steps):
         c_out, c_in = [K.utils.append_dims(k, x_in.ndim) for k in dnw.get_scalings(sigma_in)[skip:]]
         t = dnw.sigma_to_t(sigma_in)
 
-        eps = shared.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
+        #eps = shared.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
+        eps = shared_instance.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
         denoised_uncond, denoised_cond = (x_in + eps * c_out).chunk(2)
 
         denoised = denoised_uncond + (denoised_cond - denoised_uncond) * cfg_scale
@@ -67,11 +74,14 @@ def find_noise_for_image_sigma_adjustment(p, cond, uncond, cfg_scale, steps):
     x = p.init_latent
 
     s_in = x.new_ones([x.shape[0]])
-    if shared.sd_model.parameterization == "v":
-        dnw = K.external.CompVisVDenoiser(shared.sd_model)
+    #if shared.sd_model.parameterization == "v":
+    if shared_instance.sd_model.parameterization == "v":
+        #dnw = K.external.CompVisVDenoiser(shared.sd_model)
+        dnw = K.external.CompVisVDenoiser(shared_instance.sd_model)
         skip = 1
     else:
-        dnw = K.external.CompVisDenoiser(shared.sd_model)
+        #dnw = K.external.CompVisDenoiser(shared.sd_model)
+        dnw = K.external.CompVisDenoiser(shared_instance.sd_model)
         skip = 0
     sigmas = dnw.get_sigmas(steps).flip(0)
 
@@ -94,7 +104,8 @@ def find_noise_for_image_sigma_adjustment(p, cond, uncond, cfg_scale, steps):
         else:
             t = dnw.sigma_to_t(sigma_in)
 
-        eps = shared.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
+        #eps = shared.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
+        eps = shared_instance.sd_model.apply_model(x_in * c_in, t, cond=cond_in)
         denoised_uncond, denoised_cond = (x_in + eps * c_out).chunk(2)
 
         denoised = denoised_uncond + (denoised_cond - denoised_uncond) * cfg_scale
diff --git a/scripts/xyz_grid.py b/scripts/xyz_grid.py
index 939d86053bd..10993ad653e 100644
--- a/scripts/xyz_grid.py
+++ b/scripts/xyz_grid.py
@@ -19,7 +19,7 @@
 import modules.sd_models
 import modules.sd_vae
 import re
-
+from modules.shared import shared_instance
 from modules.ui_components import ToolButton
 
 fill_values_symbol = "\U0001f4d2"  # 📒
@@ -121,7 +121,8 @@ def find_vae(name: str):
 
 
 def apply_vae(p, x, xs):
-    modules.sd_vae.reload_vae_weights(shared.sd_model, vae_file=find_vae(x))
+    # Reload VAE weights on the shared model from the file find_vae() resolves for x; p and xs are unused.
+    modules.sd_vae.reload_vae_weights(shared_instance.sd_model, vae_file=find_vae(x))
 
 
 def apply_styles(p: StableDiffusionProcessingTxt2Img, x: str, _):
diff --git a/webui-user.sh b/webui-user.sh
index 70306c60d5b..5f201067cc3 100644
--- a/webui-user.sh
+++ b/webui-user.sh
@@ -11,6 +11,8 @@
 
 # Commandline arguments for webui.py, for example: export COMMANDLINE_ARGS="--medvram --opt-split-attention"
 #export COMMANDLINE_ARGS=""
+#export COMMANDLINE_ARGS="--skip-torch-cuda-test --data-dir sd-data --allow-code --administrator --precision full --no-half --xformers --api --enable-insecure-extension-access --cors-allow-origins * --listen --ray"
+#export COMMANDLINE_ARGS="--skip-torch-cuda-test --data-dir sd-data --allow-code --administrator --no-half --api --enable-insecure-extension-access --cors-allow-origins * --listen --use-cpu SD GFPGAN BSRGAN ESRGAN SCUNet CodeFormer --all --ray"
 
 # python3 executable
 #python_cmd="python3"
@@ -45,4 +47,15 @@
 # Uncomment to disable TCMalloc
 #export NO_TCMALLOC="True"
 
-###########################################
+###############ray############################
+#export RAY_NUM_GPUS=1
+#export RAY_NUM_CPUS=1
+#export RAY_MIN_REPLICAS=1
+#export RAY_MAX_REPLICAS=2
+#export RAY_PORT=7575
+#export RAY_IP="0.0.0.0"
+#export RAY_ADDRESS='ray://ray-head:10001'
+#export RAY_DOCKER="True"
+#export RAY_DASHBOARD_PORT=8265
+#export RAY_DASHBOARD_HOST="0.0.0.0"
+export ENABLE_UV="True"
diff --git a/webui.py b/webui.py
index 12328423d0d..ae439bab4cd 100644
--- a/webui.py
+++ b/webui.py
@@ -19,10 +19,30 @@ def create_api(app):
     from modules.api.api import Api
     from modules.call_queue import queue_lock
 
+    
     api = Api(app, queue_lock)
     return api
 
 
+def ray_api():
+    """Initialize the app, build the Gradio UI, then hand control to ``ray_only()``."""
+    from modules.api.ray import ray_only
+    from modules.shared_cmd_options import cmd_opts
+
+    initialize.initialize()
+
+    # These modules are imported only after initialize() has run; several are unused here.
+    from modules import shared, ui_tempdir, script_callbacks, ui, progress, ui_extra_networks  # noqa: F401
+
+    script_callbacks.before_ui_callback()
+    startup_timer.record("scripts before_ui_callback")
+    shared.demo = ui.create_ui()
+    startup_timer.record("create ui")
+    if not cmd_opts.no_gradio_queue:
+        shared.demo.queue(64)
+    ray_only()
+
+
 def api_only():
     from fastapi import FastAPI
     from modules.shared_cmd_options import cmd_opts
@@ -155,8 +175,11 @@ def webui():
 
 if __name__ == "__main__":
     from modules.shared_cmd_options import cmd_opts
+    # Choose the launch mode from the parsed command-line options.
 
     if cmd_opts.nowebui:
         api_only()
+    elif cmd_opts.ray:
+        ray_api()
     else:
         webui()