Merge 91c58b172c into 2c78cec01d

Merge pull request #3436 from lllyasviel/develop
fix: change wrong label for in describe apply styles checkbox
2024-08-05 11:31:55 +03:00 · 2024-08-03 15:18:24 +02:00 · 2024-08-03 15:16:18 +02:00 · 2024-08-03 15:11:35 +02:00 · 2024-08-03 15:10:27 +02:00 · 2024-08-03 15:08:34 +02:00
24 changed files with 195 additions and 48 deletions
--- a/amd/README.md
+++ b/amd/README.md
@ -0,0 +1,44 @@
+# 💬 [lllyasviel Fooocus](https://github.com/lllyasviel/Fooocus) on AMD ROCm 📷
+- Make sure that your system was fresh (ubuntu 22.04)
+- Computer will restart during the AMD driver install.
+- Prepare AMD ROCm Driver install
+```
+sudo usermod -a -G render,video $LOGNAME
+wget https://raw.githubusercontent.com/lllyasviel/Fooocus/main/AMD/amd_drivers.sh
+sudo chmod 777 amd_drivers.sh
+sudo ./amd_drivers.sh
+```
+- For RDNA and RDNA 2 cards RX5000 RX6000:
+```
+export HSA_OVERRIDE_GFX_VERSION=10.3.0
+```
+- For RDNA 3 cards RX7000:
+```
+export HSA_OVERRIDE_GFX_VERSION=11.0.0
+```
+- install Python
+```
+wget https://raw.githubusercontent.com/lllyasviel/Fooocus/main/AMD/install_python_conda.sh
+sudo chmod 777 install_python_conda.sh
+sudo ./install_python_conda.sh
+```
+- Install and Start lllyasviel/Fooocus
+```
+git clone --branch 2.3.1 https://github.com/lllyasviel/Fooocus.git
+cd Fooocus
+source fooocus_env/bin/activate
+pip3 install -r requirements_versions.txt
+pip3 install torch==2.1.2+rocm5.6 torchvision==0.16.2+rocm5.6 --extra-index-url https://download.pytorch.org/whl/rocm5.6
+python entry_with_update.py --listen --attention-split
+```
+- Restart Fooocus
+```
+cd Fooocus
+export HSA_OVERRIDE_GFX_VERSION=11.0.0
+source fooocus_env/bin/activate
+python entry_with_update.py --listen --attention-split
+```
+To see a prompt from your GPU usage.
+```
+watch /opt/rocm-6.0.2/bin/rocm-smi
+```
--- a/amd/amd_drivers.sh
+++ b/amd/amd_drivers.sh
@ -0,0 +1,11 @@
+#!/bin/bash
+sudo apt update -y && sudo apt full-upgrade -y
+sudo apt install "linux-headers-$(uname -r)" "linux-modules-extra-$(uname -r)"
+sudo usermod -a -G render,video $LOGNAME
+wget https://repo.radeon.com/amdgpu-install/6.0.2/ubuntu/jammy/amdgpu-install_6.0.60002-1_all.deb
+# to Ubuntu 20.04: wget https://repo.radeon.com/amdgpu-install/6.0.2/ubuntu/focal/amdgpu-install_6.0.60002-1_all.deb
+sudo apt install ./amdgpu-install_6.0.60002-1_all.deb
+sudo apt update
+sudo apt install amdgpu-dkms -y
+sudo apt install rocm -y
+sudo reboot now
--- a/amd/install_python_conda.sh
+++ b/amd/install_python_conda.sh
@ -0,0 +1,11 @@
+#!/bin/bash
+mkdir -p ~/miniconda3
+wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh -O ~/miniconda3/miniconda.sh
+bash ~/miniconda3/miniconda.sh -b -u -p ~/miniconda3
+rm -rf ~/miniconda3/miniconda.sh
+~/miniconda3/bin/conda init bash
+sudo apt install python3 -y
+sudo apt-get install python-is-python3 -y
+sudo apt install python3.11-venv -y
+sudo apt-get install git -y
+sudo apt-get install wget -y
--- a/extras/BLIP/models/blip.py
+++ b/extras/BLIP/models/blip.py
@ -216,9 +216,9 @@ def is_url(url_or_filename):
 def load_checkpoint(model,url_or_filename):
    if is_url(url_or_filename):
        cached_file = download_cached_file(url_or_filename, check_hash=False, progress=True)
-        checkpoint = torch.load(cached_file, map_location='cpu') 
+        checkpoint = torch.load(cached_file, map_location='cpu', weights_only=True) 
    elif os.path.isfile(url_or_filename):        
-        checkpoint = torch.load(url_or_filename, map_location='cpu') 
+        checkpoint = torch.load(url_or_filename, map_location='cpu', weights_only=True) 
    else:
        raise RuntimeError('checkpoint url or path is invalid')
        
--- a/extras/BLIP/models/blip_nlvr.py
+++ b/extras/BLIP/models/blip_nlvr.py
@ -78,9 +78,9 @@ def blip_nlvr(pretrained='',**kwargs):
 def load_checkpoint(model,url_or_filename):
    if is_url(url_or_filename):
        cached_file = download_cached_file(url_or_filename, check_hash=False, progress=True)
-        checkpoint = torch.load(cached_file, map_location='cpu') 
+        checkpoint = torch.load(cached_file, map_location='cpu', weights_only=True) 
    elif os.path.isfile(url_or_filename):        
-        checkpoint = torch.load(url_or_filename, map_location='cpu') 
+        checkpoint = torch.load(url_or_filename, map_location='cpu', weights_only=True) 
    else:
        raise RuntimeError('checkpoint url or path is invalid')
    state_dict = checkpoint['model']
--- a/extras/facexlib/detection/init.py
+++ b/extras/facexlib/detection/init.py
@ -19,7 +19,7 @@ def init_detection_model(model_name, half=False, device='cuda', model_rootpath=N
        url=model_url, model_dir='facexlib/weights', progress=True, file_name=None, save_dir=model_rootpath)

    # TODO: clean pretrained model
-    load_net = torch.load(model_path, map_location=lambda storage, loc: storage)
+    load_net = torch.load(model_path, map_location=lambda storage, loc: storage, weights_only=True)
    # remove unnecessary 'module.'
    for k, v in deepcopy(load_net).items():
        if k.startswith('module.'):
--- a/extras/facexlib/parsing/init.py
+++ b/extras/facexlib/parsing/init.py
@ -17,7 +17,7 @@ def init_parsing_model(model_name='bisenet', half=False, device='cuda', model_ro

    model_path = load_file_from_url(
        url=model_url, model_dir='facexlib/weights', progress=True, file_name=None, save_dir=model_rootpath)
-    load_net = torch.load(model_path, map_location=lambda storage, loc: storage)
+    load_net = torch.load(model_path, map_location=lambda storage, loc: storage, weights_only=True)
    model.load_state_dict(load_net, strict=True)
    model.eval()
    model = model.to(device)
--- a/extras/ip_adapter.py
+++ b/extras/ip_adapter.py
@ -104,7 +104,7 @@ def load_ip_adapter(clip_vision_path, ip_negative_path, ip_adapter_path):
    offload_device = torch.device('cpu')

    use_fp16 = model_management.should_use_fp16(device=load_device)
-    ip_state_dict = torch.load(ip_adapter_path, map_location="cpu")
+    ip_state_dict = torch.load(ip_adapter_path, map_location="cpu", weights_only=True)
    plus = "latents" in ip_state_dict["image_proj"]
    cross_attention_dim = ip_state_dict["ip_adapter"]["1.to_k_ip.weight"].shape[1]
    sdxl = cross_attention_dim == 2048
--- a/fooocus_version.py
+++ b/fooocus_version.py
@ -1 +1 @@
-version = '2.5.2'
+version = '2.5.3'
--- a/language/en.json
+++ b/language/en.json
@ -17,6 +17,7 @@
    "Content Type": "Content Type",
    "Photograph": "Photograph",
    "Art/Anime": "Art/Anime",
+    "Apply Styles": "Apply Styles",
    "Describe this Image into Prompt": "Describe this Image into Prompt",
    "Image Size and Recommended Size": "Image Size and Recommended Size",
    "Upscale or Variation:": "Upscale or Variation:",
--- a/ldm_patched/ldm/modules/encoders/noise_aug_modules.py
+++ b/ldm_patched/ldm/modules/encoders/noise_aug_modules.py
@ -8,7 +8,7 @@ class CLIPEmbeddingNoiseAugmentation(ImageConcatWithNoiseAugmentation):
        if clip_stats_path is None:
            clip_mean, clip_std = torch.zeros(timestep_dim), torch.ones(timestep_dim)
        else:
-            clip_mean, clip_std = torch.load(clip_stats_path, map_location="cpu")
+            clip_mean, clip_std = torch.load(clip_stats_path, map_location="cpu", weights_only=True)
        self.register_buffer("data_mean", clip_mean[None, :], persistent=False)
        self.register_buffer("data_std", clip_std[None, :], persistent=False)
        self.time_embed = Timestep(timestep_dim)
--- a/ldm_patched/modules/sd1_clip.py
+++ b/ldm_patched/modules/sd1_clip.py
@ -326,7 +326,7 @@ def load_embed(embedding_name, embedding_directory, embedding_size, embed_key=No
                except:
                    embed_out = safe_load_embed_zip(embed_path)
            else:
-                embed = torch.load(embed_path, map_location="cpu")
+                embed = torch.load(embed_path, map_location="cpu", weights_only=True)
    except Exception as e:
        print(traceback.format_exc())
        print()
--- a/ldm_patched/pfn/architecture/face/codeformer.py
+++ b/ldm_patched/pfn/architecture/face/codeformer.py
@ -377,15 +377,15 @@ class VQAutoEncoder(nn.Module):
        )

        if model_path is not None:
-            chkpt = torch.load(model_path, map_location="cpu")
+            chkpt = torch.load(model_path, map_location="cpu", weights_only=True)
            if "params_ema" in chkpt:
                self.load_state_dict(
-                    torch.load(model_path, map_location="cpu")["params_ema"]
+                    torch.load(model_path, map_location="cpu", weights_only=True)["params_ema"]
                )
                logger.info(f"vqgan is loaded from: {model_path} [params_ema]")
            elif "params" in chkpt:
                self.load_state_dict(
-                    torch.load(model_path, map_location="cpu")["params"]
+                    torch.load(model_path, map_location="cpu", weights_only=True)["params"]
                )
                logger.info(f"vqgan is loaded from: {model_path} [params]")
            else:
--- a/ldm_patched/pfn/architecture/face/gfpgan_bilinear_arch.py
+++ b/ldm_patched/pfn/architecture/face/gfpgan_bilinear_arch.py
@ -273,8 +273,8 @@ class GFPGANBilinear(nn.Module):
        if decoder_load_path:
            self.stylegan_decoder.load_state_dict(
                torch.load(
-                    decoder_load_path, map_location=lambda storage, loc: storage
-                )["params_ema"]
+                    decoder_load_path, map_location=lambda storage, loc: storage, 
+                weights_only=True)["params_ema"]
            )
        # fix decoder without updating params
        if fix_decoder:
--- a/ldm_patched/pfn/architecture/face/gfpganv1_arch.py
+++ b/ldm_patched/pfn/architecture/face/gfpganv1_arch.py
@ -373,8 +373,8 @@ class GFPGANv1(nn.Module):
        if decoder_load_path:
            self.stylegan_decoder.load_state_dict(
                torch.load(
-                    decoder_load_path, map_location=lambda storage, loc: storage
-                )["params_ema"]
+                    decoder_load_path, map_location=lambda storage, loc: storage, 
+                weights_only=True)["params_ema"]
            )
        # fix decoder without updating params
        if fix_decoder:
--- a/ldm_patched/pfn/architecture/face/gfpganv1_clean_arch.py
+++ b/ldm_patched/pfn/architecture/face/gfpganv1_clean_arch.py
@ -284,8 +284,8 @@ class GFPGANv1Clean(nn.Module):
        if decoder_load_path:
            self.stylegan_decoder.load_state_dict(
                torch.load(
-                    decoder_load_path, map_location=lambda storage, loc: storage
-                )["params_ema"]
+                    decoder_load_path, map_location=lambda storage, loc: storage, 
+                weights_only=True)["params_ema"]
            )
        # fix decoder without updating params
        if fix_decoder:
--- a/modules/config.py
+++ b/modules/config.py
@ -702,6 +702,19 @@ default_inpaint_mask_sam_model = get_config_item_or_set_default(
    expected_type=str
 )

+default_describe_apply_prompts_checkbox = get_config_item_or_set_default(
+    key='default_describe_apply_prompts_checkbox',
+    default_value=True,
+    validator=lambda x: isinstance(x, bool),
+    expected_type=bool
+)
+default_describe_content_type = get_config_item_or_set_default(
+    key='default_describe_content_type',
+    default_value=[modules.flags.describe_type_photo],
+    validator=lambda x: all(k in modules.flags.describe_types for k in x),
+    expected_type=list
+)
+
 config_dict["default_loras"] = default_loras = default_loras[:default_max_lora_number] + [[True, 'None', 1.0] for _ in range(default_max_lora_number - len(default_loras))]

 # mapping config to meta parameter
--- a/modules/core.py
+++ b/modules/core.py
@ -231,7 +231,7 @@ def get_previewer(model):
    if vae_approx_filename in VAE_approx_models:
        VAE_approx_model = VAE_approx_models[vae_approx_filename]
    else:
-        sd = torch.load(vae_approx_filename, map_location='cpu')
+        sd = torch.load(vae_approx_filename, map_location='cpu', weights_only=True)
        VAE_approx_model = VAEApprox()
        VAE_approx_model.load_state_dict(sd)
        del sd
--- a/modules/flags.py
+++ b/modules/flags.py
@ -96,6 +96,7 @@ inpaint_options = [inpaint_option_default, inpaint_option_detail, inpaint_option

 describe_type_photo = 'Photograph'
 describe_type_anime = 'Art/Anime'
+describe_types = [describe_type_photo, describe_type_anime]

 sdxl_aspect_ratios = [
    '704*1408', '704*1344', '768*1344', '768*1280', '832*1216', '832*1152',
--- a/modules/inpaint_worker.py
+++ b/modules/inpaint_worker.py
@ -196,7 +196,7 @@ class InpaintWorker:

        if inpaint_head_model is None:
            inpaint_head_model = InpaintHead()
-            sd = torch.load(inpaint_head_model_path, map_location='cpu')
+            sd = torch.load(inpaint_head_model_path, map_location='cpu', weights_only=True)
            inpaint_head_model.load_state_dict(sd)

        feed = torch.cat([
--- a/modules/upscaler.py
+++ b/modules/upscaler.py
@ -17,7 +17,7 @@ def perform_upscale(img):

    if model is None:
        model_filename = downloading_upscale_model()
-        sd = torch.load(model_filename)
+        sd = torch.load(model_filename, weights_only=True)
        sdo = OrderedDict()
        for k, v in sd.items():
            sdo[k.replace('residual_block_', 'RDB')] = v
--- a/readme.md
+++ b/readme.md
@ -201,14 +201,50 @@ Use `python entry_with_update.py --preset anime` or `python entry_with_update.py

 Note that the [minimal requirement](#minimal-requirement) for different platforms is different.

-Same with the above instructions. You need to change torch to the AMD version
-
-    pip uninstall torch torchvision torchaudio torchtext functorch xformers 
-    pip install torch torchvision torchaudio --index-url https://download.pytorch.org/whl/rocm5.6
-
-AMD is not intensively tested, however. The AMD support is in beta.
-
-Use `python entry_with_update.py --preset anime` or `python entry_with_update.py --preset realistic` for Fooocus Anime/Realistic Edition.
+[AMD GPU's Tutorial](https://github.com/lllyasviel/Fooocus/tree/main/amd) Debian and Ubuntu
+- Make sure that your system was fresh (ubuntu 22.04)
+- Computer will restart during the AMD driver install.
+- Prepare AMD ROCm Driver install
+```
+sudo usermod -a -G render,video $LOGNAME
+wget https://raw.githubusercontent.com/lllyasviel/Fooocus/main/AMD/amd_drivers.sh
+sudo chmod 777 amd_drivers.sh
+sudo ./amd_drivers.sh
+```
+- For RDNA and RDNA 2 cards RX5000 RX6000:
+```
+export HSA_OVERRIDE_GFX_VERSION=10.3.0
+```
+- For RDNA 3 cards RX7000:
+```
+export HSA_OVERRIDE_GFX_VERSION=11.0.0
+```
+- install Python
+```
+wget https://raw.githubusercontent.com/lllyasviel/Fooocus/main/AMD/install_python_conda.sh
+sudo chmod 777 install_python_conda.sh
+sudo ./install_python_conda.sh
+```
+- Install and Start lllyasviel/Fooocus
+```
+git clone --branch 2.3.1 https://github.com/lllyasviel/Fooocus.git
+cd Fooocus
+source fooocus_env/bin/activate
+pip3 install -r requirements_versions.txt
+pip3 install torch==2.1.2+rocm5.6 torchvision==0.16.2+rocm5.6 --extra-index-url https://download.pytorch.org/whl/rocm5.6
+python entry_with_update.py --listen --attention-split
+```
+- Restart Fooocus
+```
+cd Fooocus
+export HSA_OVERRIDE_GFX_VERSION=11.0.0
+source fooocus_env/bin/activate
+python entry_with_update.py --listen --attention-split
+```
+To see a prompt from your GPU usage.
+```
+watch /opt/rocm-6.0.2/bin/rocm-smi
+```

 ### Windows (AMD GPUs)

--- a/update_log.md
+++ b/update_log.md
@ -1,3 +1,8 @@
+# [2.5.3](https://github.com/lllyasviel/Fooocus/releases/tag/v2.5.3)
+
+* Only load weights from non-safetensors files, preventing harmful code injection
+* Add checkbox for applying/resetting styles when describing images, also allowing multiple describe content types
+
 # [2.5.2](https://github.com/lllyasviel/Fooocus/releases/tag/v2.5.2)

 * Fix not adding positive prompt when styles didn't have a {prompt} placeholder in the positive prompt
--- a/webui.py
+++ b/webui.py
@ -337,10 +337,11 @@ with shared.gradio_root:
                            with gr.Column():
                                describe_input_image = grh.Image(label='Image', source='upload', type='numpy', show_label=False)
                            with gr.Column():
-                                describe_method = gr.Radio(
+                                describe_methods = gr.CheckboxGroup(
                                    label='Content Type',
-                                    choices=[flags.describe_type_photo, flags.describe_type_anime],
-                                    value=flags.describe_type_photo)
+                                    choices=flags.describe_types,
+                                    value=modules.config.default_describe_content_type)
+                                describe_apply_styles = gr.Checkbox(label='Apply Styles', value=modules.config.default_describe_apply_prompts_checkbox)
                                describe_btn = gr.Button(value='Describe this Image into Prompt')
                                describe_image_size = gr.Textbox(label='Image Size and Recommended Size', elem_id='describe_image_size', visible=False)
                                gr.HTML('<a href="https://github.com/lllyasviel/Fooocus/discussions/1363" target="_blank">\U0001F4D4 Documentation</a>')
@ -1060,30 +1061,54 @@ with shared.gradio_root:
                gr.Audio(interactive=False, value=notification_file, elem_id='audio_notification', visible=False)
                break

-        def trigger_describe(mode, img):
-            if mode == flags.describe_type_photo:
-                from extras.interrogate import default_interrogator as default_interrogator_photo
-                return default_interrogator_photo(img), ["Fooocus V2", "Fooocus Enhance", "Fooocus Sharp"]
-            if mode == flags.describe_type_anime:
-                from extras.wd14tagger import default_interrogator as default_interrogator_anime
-                return default_interrogator_anime(img), ["Fooocus V2", "Fooocus Masterpiece"]
-            return mode, ["Fooocus V2"]
+        def trigger_describe(modes, img, apply_styles):
+            describe_prompts = []
+            styles = set()

-        describe_btn.click(trigger_describe, inputs=[describe_method, describe_input_image],
-                           outputs=[prompt, style_selections], show_progress=True, queue=True)
+            if flags.describe_type_photo in modes:
+                from extras.interrogate import default_interrogator as default_interrogator_photo
+                describe_prompts.append(default_interrogator_photo(img))
+                styles.update(["Fooocus V2", "Fooocus Enhance", "Fooocus Sharp"])
+
+            if flags.describe_type_anime in modes:
+                from extras.wd14tagger import default_interrogator as default_interrogator_anime
+                describe_prompts.append(default_interrogator_anime(img))
+                styles.update(["Fooocus V2", "Fooocus Masterpiece"])
+
+            if len(styles) == 0 or not apply_styles:
+                styles = gr.update()
+            else:
+                styles = list(styles)
+
+            if len(describe_prompts) == 0:
+                describe_prompt = gr.update()
+            else:
+                describe_prompt = ', '.join(describe_prompts)
+
+            return describe_prompt, styles
+
+        describe_btn.click(trigger_describe, inputs=[describe_methods, describe_input_image, describe_apply_styles],
+                           outputs=[prompt, style_selections], show_progress=True, queue=True) \
+            .then(fn=style_sorter.sort_styles, inputs=style_selections, outputs=style_selections, queue=False, show_progress=False) \
+            .then(lambda: None, _js='()=>{refresh_style_localization();}')

        if args_manager.args.enable_auto_describe_image:
-            def trigger_auto_describe(mode, img, prompt):
+            def trigger_auto_describe(mode, img, prompt, apply_styles):
                # keep prompt if not empty
                if prompt == '':
-                    return trigger_describe(mode, img)
+                    return trigger_describe(mode, img, apply_styles)
                return gr.update(), gr.update()

-            uov_input_image.upload(trigger_auto_describe, inputs=[describe_method, uov_input_image, prompt],
-                                   outputs=[prompt, style_selections], show_progress=True, queue=True)
+            uov_input_image.upload(trigger_auto_describe, inputs=[describe_methods, uov_input_image, prompt, describe_apply_styles],
+                                   outputs=[prompt, style_selections], show_progress=True, queue=True) \
+                .then(fn=style_sorter.sort_styles, inputs=style_selections, outputs=style_selections, queue=False, show_progress=False) \
+                .then(lambda: None, _js='()=>{refresh_style_localization();}')

            enhance_input_image.upload(lambda: gr.update(value=True), outputs=enhance_checkbox, queue=False, show_progress=False) \
-                .then(trigger_auto_describe, inputs=[describe_method, enhance_input_image, prompt], outputs=[prompt, style_selections], show_progress=True, queue=True)
+                .then(trigger_auto_describe, inputs=[describe_methods, enhance_input_image, prompt, describe_apply_styles],
+                      outputs=[prompt, style_selections], show_progress=True, queue=True) \
+                .then(fn=style_sorter.sort_styles, inputs=style_selections, outputs=style_selections, queue=False, show_progress=False) \
+                .then(lambda: None, _js='()=>{refresh_style_localization();}')

 def dump_default_english_config():
    from modules.localization import dump_english_config
Author	SHA1	Message	Date
Nicolas Pereira	c0aa4f5f31	Merge `91c58b172c` into `2c78cec01d`	2024-08-05 11:31:55 +03:00
Manuel Schmid	2c78cec01d	Merge pull request #3436 from lllyasviel/develop fix: change wrong label for in describe apply styles checkbox	2024-08-03 15:18:24 +02:00
Manuel Schmid	ef0acca9f9	fix: change wrong label for in describe apply styles checkbox	2024-08-03 15:16:18 +02:00
Manuel Schmid	60af8d2d84	Merge pull request #3434 from lllyasviel/develop Release 2.5.3 - fix changelog	2024-08-03 15:11:35 +02:00
Manuel Schmid	39d07bf0f3	release: fix changelog	2024-08-03 15:10:27 +02:00
Manuel Schmid	f0dcf5a911	Merge pull request #3433 from lllyasviel/develop Release 2.5.3	2024-08-03 15:08:34 +02:00
Manuel Schmid	c4d5b160be	release: bump version to 2.5.3, update changelog	2024-08-03 15:07:14 +02:00
Manuel Schmid	2f08cb4360	feat: add checkbox and config to disable updating selected styles when describing an image (#3430 ) * feat: add checkbox and config to disable updating selected styles when describing an image * i18n: add translation for checkbox label * feat: change describe content type from Radio to CheckboxGroup, add config * fix: cast set to list when styles contains elements * feat: sort styles after describe	2024-08-03 14:46:31 +02:00
Sergii Dymchenko	da3d4d006f	Use weights_only for loading (#3427 ) Co-authored-by: Manuel Schmid <9307310+mashb1t@users.noreply.github.com>	2024-08-03 12:33:01 +02:00
Nicolas Pereira	91c58b172c	Add files via upload	2024-05-17 17:58:05 -03:00