
@asomoza
asomoza / flux2_8GB_inference.py
Last active November 26, 2025 07:57
8GB VRAM Flux.2
import io
import os
import requests
import torch
from diffusers import Flux2Pipeline, Flux2Transformer2DModel
# you will need to have ~6.5GB of free VRAM and ~40GB of free RAM to run this script (~10 if you enable
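The rest of the script is cut off here. Since the gist also imports Flux2Transformer2DModel, it likely handles the transformer separately; as a simpler hedged sketch of running FLUX.2 in limited VRAM (the model id, step count, and prompt are assumptions, not taken from the gist):

import torch
from diffusers import Flux2Pipeline

pipe = Flux2Pipeline.from_pretrained(
    "black-forest-labs/FLUX.2-dev",  # assumed model id
    torch_dtype=torch.bfloat16,
)
# Keep weights in RAM and move each submodule to the GPU only while it
# runs; this trades speed for a much smaller VRAM footprint.
pipe.enable_model_cpu_offload()

image = pipe(
    "a photo of a forest at dawn",  # placeholder prompt
    num_inference_steps=28,
).images[0]
image.save("flux2.png")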
@sayakpaul
sayakpaul / inference.md
Last active February 5, 2025 14:13
(Not so rigorously tested) example showing how to use `bitsandbytes`, `peft`, etc. to LoRA fine-tune Flux.1 Dev.

When loading LoRA params (obtained on a quantized base model) and merging them into the base model, it is recommended to first dequantize the base model, merge the LoRA params into it, and then quantize the model again. This is because merging into 4-bit quantized models can introduce rounding errors. Below, we provide an end-to-end example:

  1. First, load the original model and merge the LoRA params into it:
from diffusers import FluxPipeline 
import torch 

ckpt_id = "black-forest-labs/FLUX.1-dev"
pipeline = FluxPipeline.from_pretrained(
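The preview cuts off mid-call. A minimal end-to-end sketch of the dequantize → merge → requantize flow described above (the LoRA path and output directory are placeholders):

import torch
from diffusers import FluxPipeline, FluxTransformer2DModel, BitsAndBytesConfig

ckpt_id = "black-forest-labs/FLUX.1-dev"

# 1. Load the base model unquantized and merge the LoRA into it.
pipeline = FluxPipeline.from_pretrained(ckpt_id, torch_dtype=torch.bfloat16)
pipeline.load_lora_weights("path/to/lora")  # placeholder path
pipeline.fuse_lora()
pipeline.unload_lora_weights()
pipeline.transformer.save_pretrained("fused-transformer")  # placeholder dir

# 2. Re-quantize the merged transformer to 4-bit and rebuild the pipeline.
quant_config = BitsAndBytesConfig(
    load_in_4bit=True, bnb_4bit_compute_dtype=torch.bfloat16
)
transformer = FluxTransformer2DModel.from_pretrained(
    "fused-transformer", quantization_config=quant_config, torch_dtype=torch.bfloat16
)
pipeline = FluxPipeline.from_pretrained(
    ckpt_id, transformer=transformer, torch_dtype=torch.bfloat16
)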
@ariG23498
ariG23498 / flux-dev-under-8gbs.py
Created October 20, 2024 09:01
Run FLUX Dev under 8 GB of VRAM.
# Taken from: https://gist.github.com/sayakpaul/23862a2e7f5ab73dfdcc513751289bea
from diffusers import FluxPipeline, FluxTransformer2DModel
from transformers import T5EncoderModel
import torch
import gc
def flush():
    gc.collect()
    torch.cuda.empty_cache()
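The preview stops after flush(). The linked sayakpaul gist works in stages, loading only what each stage needs and flushing VRAM in between; a minimal sketch of the first stage, continuing from the imports above (the prompt is a placeholder):

ckpt_id = "black-forest-labs/FLUX.1-dev"

# Stage 1: load only the text encoders, compute prompt embeddings, free them.
pipeline = FluxPipeline.from_pretrained(
    ckpt_id, transformer=None, vae=None, torch_dtype=torch.bfloat16
).to("cuda")
with torch.no_grad():
    prompt_embeds, pooled_prompt_embeds, text_ids = pipeline.encode_prompt(
        prompt="a photo of a cat", prompt_2=None
    )
del pipeline
flush()
# Stage 2 (not shown): load the transformer alone, denoise with the
# precomputed embeddings, flush again, then decode with the VAE.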
@sayakpaul
sayakpaul / run_flux_under_24gbs.py
Last active June 28, 2025 22:53
This gist shows how to run Flux on a 24GB 4090 card with Diffusers.
from diffusers import FluxPipeline, AutoencoderKL
from diffusers.image_processor import VaeImageProcessor
from transformers import T5EncoderModel, T5TokenizerFast, CLIPTokenizer, CLIPTextModel
import torch
import gc
def flush():
    gc.collect()
    torch.cuda.empty_cache()
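Judging from the imports (AutoencoderKL, VaeImageProcessor), the gist drops the VAE during denoising and decodes the latents manually at the end. A hedged sketch of that final step, continuing from the imports above and assuming `latents` already holds the denoised output unpacked to image-latent shape (batch, 16, height // 8, width // 8):

vae = AutoencoderKL.from_pretrained(
    "black-forest-labs/FLUX.1-dev", subfolder="vae", torch_dtype=torch.bfloat16
).to("cuda")
image_processor = VaeImageProcessor(vae_scale_factor=8)

with torch.no_grad():
    # Undo the Flux latent normalization before decoding.
    latents = latents / vae.config.scaling_factor + vae.config.shift_factor
    image = vae.decode(latents, return_dict=False)[0]
image = image_processor.postprocess(image, output_type="pil")[0]
image.save("flux.png")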
@kohya-ss
kohya-ss / forward_of_sdxl_original_unet.py
Created November 14, 2023 03:39
Mitigate composition breakdown at high resolutions in SDXL
def forward(self, x, timesteps=None, context=None, y=None, **kwargs):
    # broadcast timesteps to batch dimension
    timesteps = timesteps.expand(x.shape[0])
    hs = []
    t_emb = get_timestep_embedding(timesteps, self.model_channels)  # , repeat_only=False)
    t_emb = t_emb.to(x.dtype)
    emb = self.time_embed(t_emb)
    assert x.shape[0] == y.shape[0], f"batch size mismatch: {x.shape[0]} != {y.shape[0]}"
@Stella2211
Stella2211 / DeepFloyd_IF_VRAM12GB.py
Last active January 17, 2024 03:59
DeepFloyd IF for around 12GB of VRAM
# huggingface login
from huggingface_hub import login
login()
# load the text encoder in 8-bit quantized form
from transformers import T5EncoderModel
from diffusers import DiffusionPipeline
import datetime
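The preview ends here; the documented DeepFloyd IF pattern the comments point at loads the T5 encoder in 8-bit and builds a text-encoder-only pipeline to precompute embeddings (the prompt is a placeholder):

text_encoder = T5EncoderModel.from_pretrained(
    "DeepFloyd/IF-I-XL-v1.0",
    subfolder="text_encoder",
    load_in_8bit=True,
    variant="8bit",
    device_map="auto",
)
# unet=None keeps the UNet off the GPU while embeddings are computed.
pipe = DiffusionPipeline.from_pretrained(
    "DeepFloyd/IF-I-XL-v1.0",
    text_encoder=text_encoder,
    unet=None,
    device_map="auto",
)
prompt_embeds, negative_embeds = pipe.encode_prompt("a photo of a cat")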
@Norod
Norod / text-to-video-modelscope.py
Created April 16, 2023 08:08
Running ModelScope text2video locally with torch 2 GPU memory optimizations and control over parameters
# Ran it with the following packages installed:
# accelerate 0.18.0
# diffusers 0.16.0.dev0
# torch 2.0.0+cu118
# torchvision 0.15.0+cu118
# transformers 4.28.1
# xformers 0.0.18
import torch
from diffusers import DiffusionPipeline, DPMSolverMultistepScheduler
from PIL import Image
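The rest of the script is cut off. Matching those imports and the memory optimizations named in the description, the usual diffusers setup for ModelScope text2video looks roughly like this (model id per the diffusers docs; prompt and step counts are placeholders):

pipe = DiffusionPipeline.from_pretrained(
    "damo-vilab/text-to-video-ms-1.7b", torch_dtype=torch.float16, variant="fp16"
)
pipe.scheduler = DPMSolverMultistepScheduler.from_config(pipe.scheduler.config)
# Memory optimizations: offload idle submodules and decode frames in slices.
pipe.enable_model_cpu_offload()
pipe.enable_vae_slicing()

video_frames = pipe(
    "an astronaut riding a horse", num_inference_steps=25, num_frames=24
).frames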
import stable_inference
import numpy as np
from einops import repeat
# Interpolate video between two conditionings
FOLDER = 'test/painting'
MAX_STRENGTH = 0.5 # Strength at maximum in the middle of the interpolation
SEED = 9001
SECONDS = 10
bl_info = {
    "name": "Kuchi Paku Light",
    "author": "ds54e",
    "version": (1, 1, 1),
    "blender": (2, 80, 0),
    "location": "View3D > Sidebar > KPL",
    "description": "Generate Kuchi-Paku animations from the sound sequences in the VSE",
    "warning": "",
    "doc_url": "",
    "category": "Animation",
}
@ZoomTen
ZoomTen / Node Tricks (Olive 0.2.x).md
Last active July 25, 2021 14:56
Sick Node Tricks - or, how to reproduce common effects using the node editor.

General Tips and Tricks

  • Think of clip nodes as containers!
    • You can plug an arbitrary composite node into them, making each clip an "instance" of that node

Common Node Configurations

Drop shadow (TinglesMagicWords)

A simple drop shadow effect, assuming you have a solid-color, transparent clip such as text.