Upload app.py
app.py CHANGED
@@ -59,7 +59,7 @@ parser.add_argument('--pretrained_vae_model_path',
                     default="./ckpt/sd-vae-ft-mse/",
                     type=str)
 parser.add_argument('--model_ckpt',
-                    default="
+                    default="./ckpt/IMAGDressing-v1_512.pt",
                     type=str)
 parser.add_argument('--output_path', type=str, default="./output_ipa_control_resampler")
 # parser.add_argument('--device', type=str, default="cuda:0")
@@ -78,12 +78,12 @@ base_path = 'feishen29/IMAGDressing-v1'
 
 generator = torch.Generator(device=args.device).manual_seed(42)
 vae = AutoencoderKL.from_pretrained(args.pretrained_vae_model_path).to(dtype=torch.float16, device=args.device)
-tokenizer = CLIPTokenizer.from_pretrained(
-text_encoder = CLIPTextModel.from_pretrained(
+tokenizer = CLIPTokenizer.from_pretrained("./ckpt/tokenizer")
+text_encoder = CLIPTextModel.from_pretrained("./ckpt/text_encoder").to(
     dtype=torch.float16, device=args.device)
 image_encoder = CLIPVisionModelWithProjection.from_pretrained(args.pretrained_image_encoder_path).to(
     dtype=torch.float16, device=args.device)
-unet = UNet2DConditionModel.from_pretrained(
+unet = UNet2DConditionModel.from_pretrained("./ckpt/unet").to(
     dtype=torch.float16,device=args.device)
 
 image_face_fusion = pipeline('face_fusion_torch', model='damo/cv_unet_face_fusion_torch', model_revision='v1.0.3')
@@ -129,7 +129,7 @@ adapter_modules = torch.nn.ModuleList(unet.attn_processors.values())
 adapter_modules = adapter_modules.to(dtype=torch.float16, device=args.device)
 del st
 
-ref_unet = UNet2DConditionModel.from_pretrained(
+ref_unet = UNet2DConditionModel.from_pretrained("./ckpt/unet").to(
     dtype=torch.float16,
     device=args.device)
 ref_unet.set_attn_processor(
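For reference, the new defaults assume a local ./ckpt/ tree next to app.py (the tokenizer, text encoder, UNet, VAE, and the IMAGDressing-v1_512.pt weights). How ./ckpt/ gets populated is not shown in this commit. A minimal sketch, not part of the change, that simply verifies those paths before the models are loaded:

# Sketch only: check the local checkpoint layout implied by the new defaults.
# The listed paths are taken from this diff; anything else (e.g. the image
# encoder path, which still comes from args.pretrained_image_encoder_path)
# is outside the scope of this commit.
from pathlib import Path

EXPECTED = [
    Path("./ckpt/sd-vae-ft-mse"),           # --pretrained_vae_model_path default
    Path("./ckpt/tokenizer"),               # CLIPTokenizer.from_pretrained(...)
    Path("./ckpt/text_encoder"),            # CLIPTextModel.from_pretrained(...)
    Path("./ckpt/unet"),                    # UNet2DConditionModel, also reused for ref_unet
    Path("./ckpt/IMAGDressing-v1_512.pt"),  # --model_ckpt default
]

missing = [str(p) for p in EXPECTED if not p.exists()]
if missing:
    raise FileNotFoundError("Missing checkpoint paths: " + ", ".join(missing))

Running a check like this at startup fails fast with a clear message instead of a mid-load error from from_pretrained when a folder is absent.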