
v21.7.16 #1080

Merged 19 commits on Jun 27, 2023
1 change: 1 addition & 0 deletions .release
@@ -0,0 +1 @@
v21.7.16
141 changes: 29 additions & 112 deletions README.md
@@ -141,8 +141,6 @@
5. Run the setup script by executing the following command:
```
./setup.sh


```

Note: If you need additional options or information about the runpod environment, you can use `setup.sh -h` or `setup.sh --help` to display the help message.
@@ -156,10 +154,11 @@
If you choose to use the interactive mode, the default values for the accelerate configuration screen will be "This machine," "None," and "No" for the remaining questions. These default answers are the same as the Windows installation.

### Runpod
#### Manual installation

To install the necessary components for Runpod and run it, follow these steps:
To install the necessary components for Runpod and run kohya_ss, follow these steps:

1. Select the pytorch 2.0.1 template. This is important. Other templates may not work.
1. Select the Runpod pytorch 2.0.1 template. This is important. Other templates may not work.

2. SSH into the Runpod.

@@ -188,6 +187,17 @@

6. Connect to the public URL displayed after the installation process is completed.

#### Pre-built Runpod template

To run from a pre-built Runpod template you can:

1. Open the Runpod template by clicking on https://runpod.io/gsc?template=ya6013lj5a&ref=w18gds2n

2. Deploy the template on the desired host

3. Once deployed, connect to the Runpod on HTTP 3010 to access the kohya_ss GUI. You can also connect to auto1111 on HTTP 3000.


### Docker
#### Local docker build

@@ -330,8 +340,6 @@
masterpiece, best quality, (1girl), in white shirts, upper body, looking at viewer, simple background --n low quality, worst quality, bad anatomy, bad composition, poor, low effort --w 768 --h 768 --d 1 --l 7.5 --s 28

# prompt 2


masterpiece, best quality, 1boy, in business suit, standing at street, looking back --n (low quality, worst quality), bad anatomy, bad composition, poor, low effort --w 576 --h 832 --d 2 --l 5.5 --s 40
```
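The option flags in the sample prompts above can be sketched as a small parser. This is a hypothetical helper for illustration only — the flag meanings (`--n` negative prompt, `--w`/`--h` size, `--d` seed, `--l` CFG scale, `--s` steps) follow this README, but the repository's real prompt parsing is more elaborate:

```python
import re

# Hypothetical helper for illustration: split one sample-prompt line into the
# positive prompt and its trailing option flags. Flag meanings follow the
# README (--n negative prompt, --w/--h size, --d seed, --l CFG scale, --s steps).
OPTION_RE = re.compile(r"--(n|w|h|d|l|s)\s+(.+?)(?=\s--\w|$)")

def parse_sample_prompt(line: str) -> dict:
    first = re.search(r"\s--\w", line)
    prompt = line[: first.start()].strip() if first else line.strip()
    opts = {key: value.strip() for key, value in OPTION_RE.findall(line)}
    return {"prompt": prompt, **opts}

parsed = parse_sample_prompt(
    "1girl, upper body --n low quality --w 768 --h 768 --d 1 --l 7.5 --s 28"
)
# parsed["prompt"] is "1girl, upper body"; parsed["s"] is "28"
```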

@@ -374,8 +382,22 @@

## Change History

* 2023/06/25 (v21.7.13)
* 2023/06/26 (v21.7.16)
- Improve runpod installation
- Add release info to GUI
- Sync with sd-scripts repo
- Roll back bitsandbytes on Linux from 0.39.1 to 0.35.0 because it was giving bad results
* 2023/06/25 (v21.7.15)
- Improve runpod installation
* 2023/06/24 (v21.7.14)
- To address training errors caused by the global revert of bitsandbytes-windows for Windows users, I recommend the following steps:
  - Delete the venv folder.
  - Execute the setup.bat file by running `.\setup.bat`
- By following these instructions, Windows users can effectively undo the problematic bitsandbytes module and resolve the training errors.
* 2023/06/24 (v21.7.13)
- Emergency fix for accelerate version that was bumped for other platforms than windows torch 2
* 2023/06/24 (v21.7.12)
- Significantly improved the setup process on all platforms
- Better support for runpod
@@ -384,109 +406,4 @@

The setup solution is now much more modular and will simplify requirements support across different environments... hopefully making it easier to run on different OSes.
* 2023/06/19 (v21.7.10)
- Quick fix for Linux GUI startup where it would try to install darwin requirements on top of Linux. Ugly fix, but it works. Hopefully some Linux user will improve it via a PR.

* 2023/06/18 (v21.7.9)
- Implement temporary fix for validation of image datasets. It will no longer stop execution but will let training continue... this change avoids halting training on false positives while still raising awareness that something might be wrong with the image dataset structure.
* 2023/06/14 (v21.7.8)
- Add tkinter to dockerised version (thanks to @burdokow)
- Add option to create caption files from folder names to the `group_images.py` tool.
- Prodigy optimizer is supported in each training script. It is a member of D-Adaptation and is effective for DyLoRA training. [PR #585](https://github.com/kohya-ss/sd-scripts/pull/585) Please see the PR for details. Thanks to sdbds!
- Install the package with `pip install prodigyopt`. Then specify the option like `--optimizer_type="prodigy"`.
- Arbitrary Dataset is supported in each training script (except XTI). You can use it by defining a Dataset class that returns images and captions.
- Prepare a Python script and define a class that inherits `train_util.MinimalDataset`. Then specify the option like `--dataset_class package.module.DatasetClass` in each training script.
- Please refer to `MinimalDataset` for implementation. I will prepare a sample later.
- The following features have been added to the generation script.
- Added an option `--highres_fix_disable_control_net` to disable ControlNet in the 2nd stage of Highres. Fix. Please try it if the image is disturbed by some ControlNet such as Canny.
- Added variants similar to sd-dynamic-prompts to the prompt.
- If you specify `{spring|summer|autumn|winter}`, one of them will be randomly selected.
- If you specify `{2$$chocolate|vanilla|strawberry}`, two of them will be randomly selected.
- If you specify `{1-2$$ and $$chocolate|vanilla|strawberry}`, one or two of them will be randomly selected and connected by ` and `.
- You can specify the number of candidates in the range `0-2`. You cannot omit one side like `-2` or `1-`.
- It can also be specified for the prompt option.
- If you specify `e` or `E`, all candidates will be selected and the prompt will be repeated multiple times (`--images_per_prompt` is ignored). It may be useful for creating X/Y plots.
- You can also specify `--am {e$$0.2|0.4|0.6|0.8|1.0},{e$$0.4|0.7|1.0} --d 1234`. In this case, 15 prompts will be generated with 5*3.
- There is no weighting function.
- Add prefix and postfix support to wd14
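The variant syntax described above can be sketched roughly as follows. This is a minimal illustration assuming a `", "` default separator; the `e$$` enumeration mode and other details of the real implementation in `gen_img_diffusers.py` are omitted:

```python
import random
import re

# Rough sketch of the {a|b|c} / {2$$a|b|c} / {1-2$$ and $$a|b|c} variant syntax.
# The ", " default separator is an assumption for this sketch.
VARIANT_RE = re.compile(r"\{([^{}]+)\}")

def expand_variant(body: str, rng: random.Random) -> str:
    sep, count_spec = ", ", None
    if "$$" in body:
        parts = body.split("$$")
        if len(parts) == 3:              # {1-2$$ and $$a|b|c}: custom separator
            count_spec, sep, choices = parts
        else:                            # {2$$a|b|c}: fixed count
            count_spec, choices = parts
    else:                                # {a|b|c}: pick exactly one
        choices = body
    options = choices.split("|")
    if count_spec is None:
        return rng.choice(options)
    lo, _, hi = count_spec.partition("-")
    n = rng.randint(int(lo), int(hi or lo))  # "2" -> 2..2, "1-2" -> 1..2
    return sep.join(rng.sample(options, n))

def expand_prompt(prompt: str, seed: int = 0) -> str:
    rng = random.Random(seed)
    return VARIANT_RE.sub(lambda m: expand_variant(m.group(1), rng), prompt)
```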
* 2023/06/12 (v21.7.7)
- Add `Print only` button to all training tabs
- Sort json file vars for easier visual search
- Fixed a bug where clip skip did not work when training with weighted captions (`--weighted_captions` specified) and when generating sample images during training.
- Add verification and reporting of bad dataset folder name structure for DB, LoRA and TI training.
- Some docker build fix.
* 2023/06/06 (v21.7.6)
- Small UI improvements
- Fix `train_network.py` to probably work with older versions of LyCORIS.
- `gen_img_diffusers.py` now supports `BREAK` syntax.
- Add Lycoris iA3, LoKr and DyLoRA support to the UI
- Upgrade LyCORIS python module to 0.1.6
* 2023/06/05 (v21.7.5)
- Fix reported issue with LoHA: https://github.com/bmaltais/kohya_ss/issues/922
* 2023/06/05 (v21.7.4)
- Add manual accelerate config option
- Remove the ability to switch between torch 1 and 2 as it was causing errors with the venv
* 2023/06/04 (v21.7.3)
- Add accelerate configuration from file
- Fix issue with torch uninstallation resulting in Error sometimes
- Fix broken link to cudann files
* 2023/06/04 (v21.7.2)
- Improve handling of legacy installations
* 2023/06/04 (v21.7.1)
- This is mostly an update to the whole setup method for kohya_ss. I got fed up with all the issues from the batch file method and leveraged the great work of vladimandic to improve the whole setup experience.

There is now a new menu in setup.bat that will appear:

```
Kohya_ss GUI setup menu:

0. Cleanup the venv
1. Install kohya_ss gui [torch 1]
2. Install kohya_ss gui [torch 2]
3. Start GUI in browser
4. Quit

Enter your choice:
```

The only obscure option might be option 0. This will help clean up a corrupted venv without having to delete the folder. This can be really useful for cases where nothing is working anymore and you need to re-install from scratch. Just run the venv cleanup, then select the version of the kohya_ss GUI you want to install (torch 1 or 2).

You can also start the GUI right from the setup menu using option 3.

After pulling a new version you can either re-run `setup.bat` and install the version you want... or just run `gui.bat` and it will update the python modules as required.

Hope this is useful.

* 2023/06/04 (v21.7.0)
- Max Norm Regularization is now available in `train_network.py`. [PR #545](https://github.com/kohya-ss/sd-scripts/pull/545) Thanks to AI-Casanova!
- Max Norm Regularization is a technique to stabilize network training by limiting the norm of network weights. It may be effective in suppressing overfitting of LoRA and improving stability when used with other LoRAs. See PR for details.
- Specify as `--scale_weight_norms=1.0`. It seems good to try from `1.0`.
- The networks other than LoRA in this repository (such as LyCORIS) do not support this option.
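The idea behind Max Norm Regularization can be sketched in plain Python: if the Frobenius norm of the effective LoRA delta (`up @ down`) exceeds the limit, scale both matrices down equally. This is a conceptual sketch only; the actual implementation in `train_network.py` operates on torch tensors and differs in details:

```python
import math

# Conceptual sketch: clamp the Frobenius norm of the effective LoRA delta
# (up @ down) to max_norm by scaling both factor matrices equally.
def matmul(a, b):
    return [[sum(x * y for x, y in zip(row, col)) for col in zip(*b)] for row in a]

def fro_norm(m):
    return math.sqrt(sum(v * v for row in m for v in row))

def apply_max_norm(down, up, max_norm=1.0):
    norm = fro_norm(matmul(up, down))
    if norm > max_norm:
        s = math.sqrt(max_norm / norm)  # split the correction across both factors
        down = [[v * s for v in row] for row in down]
        up = [[v * s for v in row] for row in up]
    return down, up
```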

- Three types of dropout have been added to `train_network.py` and LoRA network.
- Dropout is a technique to suppress overfitting and improve network performance by randomly setting some of the network outputs to 0.
- `--network_dropout` is a normal dropout at the neuron level. In the case of LoRA, it is applied to the output of down. Proposed in [PR #545](https://github.com/kohya-ss/sd-scripts/pull/545) Thanks to AI-Casanova!
- `--network_dropout=0.1` specifies the dropout probability to `0.1`.
- Note that the specification method is different from LyCORIS.
- For LoRA network, `--network_args` can specify `rank_dropout` to dropout each rank with specified probability. Also `module_dropout` can be specified to dropout each module with specified probability.
- Specify as `--network_args "rank_dropout=0.2" "module_dropout=0.1"`.
- `--network_dropout`, `rank_dropout`, and `module_dropout` can be specified at the same time.
- Values of 0.1 to 0.3 may be good to try. Values greater than 0.5 should not be specified.
- `rank_dropout` and `module_dropout` are original techniques of this repository. Their effectiveness has not been verified yet.
- The networks other than LoRA in this repository (such as LyCORIS) do not support these options.
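A rough sketch of how the three dropout types could apply in a LoRA forward pass, in plain Python for a single input vector (with batches, `--network_dropout` is element-wise while `rank_dropout` zeroes a rank for the whole batch, so they only coincide in this simplified single-sample case). Parameter names mirror the options above, but this is not the repository's implementation:

```python
import random

# Plain-Python sketch for a single input vector x; down is rank x in,
# up is out x rank. Illustrative only.
def lora_forward(x, down, up, scale=1.0, network_dropout=0.0,
                 rank_dropout=0.0, module_dropout=0.0,
                 training=True, rng=random):
    if training and module_dropout > 0 and rng.random() < module_dropout:
        return [0.0] * len(up)            # drop the whole module this step
    h = [sum(w * v for w, v in zip(row, x)) for row in down]  # down output
    if training and network_dropout > 0:  # neuron-level dropout on down output
        h = [0.0 if rng.random() < network_dropout else v / (1 - network_dropout)
             for v in h]
    if training and rank_dropout > 0:     # zero out whole ranks
        h = [0.0 if rng.random() < rank_dropout else v / (1 - rank_dropout)
             for v in h]
    return [scale * sum(w * v for w, v in zip(row, h)) for row in up]
```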

- Added an option `--scale_v_pred_loss_like_noise_pred` to scale v-prediction loss like noise prediction in each training script.
- By scaling the loss according to the time step, the weights of global noise prediction and local noise prediction become the same, and the improvement of details may be expected.
- See [this article](https://xrg.hatenablog.com/entry/2023/06/02/202418) by xrg for details (written in Japanese). Thanks to xrg for the great suggestion!

* 2023/06/03 (v21.6.5)
- Fix dreambooth issue with new logging
- Update setup and upgrade scripts
- Adding test folder

* 2023/05/28 (v21.5.15)
- Show warning when image caption file does not exist during training. [PR #533](https://github.com/kohya-ss/sd-scripts/pull/533) Thanks to TingTingin!
- Warning is also displayed when using class+identifier dataset. Please ignore if it is intended.
- `train_network.py` now supports merging network weights before training. [PR #542](https://github.com/kohya-ss/sd-scripts/pull/542) Thanks to u-haru!
- `--base_weights` option specifies LoRA or other model files (multiple files are allowed) to merge.
- `--base_weights_multiplier` option specifies multiplier of the weights to merge (multiple values are allowed). If omitted or less than `base_weights`, 1.0 is used.
- This is useful for incremental learning. See PR for details.
- Show warning and continue training when uploading to HuggingFace fails.
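Conceptually, the `--base_weights` merging described above amounts to adding each LoRA delta (`up @ down`), scaled by its multiplier, into the base weights before training. The helper below is hypothetical and for illustration only; the PR's real merging code differs:

```python
# Hypothetical helper: add each LoRA delta (up @ down), scaled by its
# multiplier, into the base weights; missing multipliers default to 1.0,
# matching the described behavior.
def merge_base_weights(weights, loras, multipliers=None):
    multipliers = multipliers or []
    for i, lora in enumerate(loras):
        m = multipliers[i] if i < len(multipliers) else 1.0
        for name, (down, up) in lora.items():
            delta = [[m * sum(a * b for a, b in zip(u_row, d_col))
                      for d_col in zip(*down)] for u_row in up]
            weights[name] = [[w + d for w, d in zip(w_row, d_row)]
                             for w_row, d_row in zip(weights[name], delta)]
    return weights
```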
5 changes: 2 additions & 3 deletions docker-compose.yaml
@@ -6,7 +6,7 @@ services:
build:
context: .
ports:
- 127.0.0.1:7860:7860
- 127.0.0.1:3000:3000
tty: true
ipc: host
environment:
@@ -28,5 +28,4 @@ services:
reservations:
devices:
- driver: nvidia
device_ids: ['0']
capabilities: [gpu]
device_ids: ['all']
2 changes: 1 addition & 1 deletion fine_tune.py
@@ -397,7 +397,7 @@ def fn_recursive_set_mem_eff(module: torch.nn.Module):
current_loss = loss.detach().item()  # this is the mean, so batch size should not matter
if args.logging_dir is not None:
logs = {"loss": current_loss, "lr": float(lr_scheduler.get_last_lr()[0])}
if args.optimizer_type.lower().startswith("DAdapt".lower()) or args.optimizer_type.lower() == "Prodigy": # tracking d*lr value
if args.optimizer_type.lower().startswith("DAdapt".lower()) or args.optimizer_type.lower() == "Prodigy".lower(): # tracking d*lr value
logs["lr/d*lr"] = (
lr_scheduler.optimizers[0].param_groups[0]["d"] * lr_scheduler.optimizers[0].param_groups[0]["lr"]
)
9 changes: 8 additions & 1 deletion kohya_gui.py
@@ -30,12 +30,19 @@ def UI(**kwargs):
with open(os.path.join('./style.css'), 'r', encoding='utf8') as file:
log.info('Load CSS...')
css += file.read() + '\n'

if os.path.exists('./.release'):
with open(os.path.join('./.release'), 'r', encoding='utf8') as file:
release = file.read()

interface = gr.Blocks(
css=css, title='Kohya_ss GUI', theme=gr.themes.Default()
css=css, title=f'Kohya_ss GUI {release}', theme=gr.themes.Default()
)

with interface:
gr.Markdown(
f'kohya_ss GUI release {release}'
)
with gr.Tab('Dreambooth'):
(
train_data_dir_input,
2 changes: 1 addition & 1 deletion requirements_linux.txt
@@ -1,4 +1,4 @@
torch==2.0.1+cu118 torchvision==0.15.2+cu118 --extra-index-url https://download.pytorch.org/whl/cu118 # no_verify leave this to specify not checking this at the verification stage
xformers==0.0.20 bitsandbytes==0.39.1
xformers==0.0.20 bitsandbytes==0.35.0
accelerate==0.15.0 tensorboard==2.12.1 tensorflow==2.12.0
-r requirements.txt
2 changes: 1 addition & 1 deletion requirements_linux_docker.txt
@@ -1,5 +1,5 @@
xformers==0.0.20
bitsandbytes==0.39.1
bitsandbytes==0.35.0
accelerate==0.15.0
tensorboard==2.12.1
tensorflow==2.12.0
2 changes: 1 addition & 1 deletion requirements_runpod.txt
@@ -1,5 +1,5 @@
torch==2.0.1+cu118 torchvision==0.15.2+cu118 --extra-index-url https://download.pytorch.org/whl/cu118 # no_verify leave this to specify not checking this at the verification stage
xformers==0.0.20 bitsandbytes==0.39.1
xformers==0.0.20 bitsandbytes==0.35.0
accelerate==0.15.0 tensorboard==2.12.1 tensorflow==2.12.0
tensorrt
-r requirements.txt
5 changes: 5 additions & 0 deletions setup-runpod.sh
@@ -24,10 +24,15 @@ source "$SCRIPT_DIR/venv/bin/activate" || exit 1
# Run setup_linux.py script with platform requirements
echo "Running setup_linux.py..."
python "$SCRIPT_DIR/setup/setup_linux.py" --platform-requirements-file=requirements_runpod.txt --show_stdout --no_run_accelerate
pip3 cache purge

# Configure accelerate
echo "Configuring accelerate..."
mkdir -p "/root/.cache/huggingface/accelerate"
cp "$SCRIPT_DIR/config_files/accelerate/runpod.yaml" "/root/.cache/huggingface/accelerate/default_config.yaml"

echo "Installation completed... You can start the gui with ./gui.sh --share --headless"

# Deactivate the virtual environment
echo "Deactivating venv..."
deactivate
22 changes: 8 additions & 14 deletions setup/setup_common.py
@@ -233,19 +233,13 @@

# report current version of code
def check_repo_version(): # pylint: disable=unused-argument
#
# This function was adapted from code written by vladimandic: https://github.com/vladmandic/automatic/commits/master
#

if not os.path.exists('.git'):
log.error('Not a git repository')
return
# status = git('status')
# if 'branch' not in status:
# log.error('Cannot get git repository status')
# sys.exit(1)
ver = git('log -1 --pretty=format:"%h %ad"')
log.info(f'Version: {ver}')
if os.path.exists('.release'):
with open(os.path.join('./.release'), 'r', encoding='utf8') as file:
release = file.read()

log.info(f'Version: {release}')
else:
log.debug('Could not read release...')

# execute git command
def git(arg: str, folder: str = None, ignore: bool = False):
@@ -379,7 +373,7 @@

def install_requirements(requirements_file, check_no_verify_flag=False, show_stdout: bool = False):
if check_no_verify_flag:
log.info(f'Verifying modules installation status from {requirements_file}...')
else:
log.info(f'Installing modules from {requirements_file}...')
with open(requirements_file, 'r', encoding='utf8') as f:
@@ -418,7 +412,7 @@
try:
import rich # pylint: disable=unused-import
except ImportError:
install('rich', 'rich')
install('--upgrade rich', 'rich')


def run_cmd(run_cmd):