Spaces: Runtime error
mayuema committed
Commit • 3a8c535
1 Parent(s): 0754e7d
first release

Files changed:
- app_followyourpose.py → app.py (+1 -38)
- inference_followyourpose.py (+6 -31)
app_followyourpose.py → app.py (RENAMED)
@@ -9,15 +9,10 @@ import gradio as gr
 from inference_followyourpose import merge_config_then_run


-# TITLE = '# [FateZero](http://fate-zero-edit.github.io/)'
 HF_TOKEN = os.getenv('HF_TOKEN')
-# pipe = InferencePipeline(HF_TOKEN)
 pipe = merge_config_then_run()
-# app = InferenceUtil(HF_TOKEN)

 with gr.Blocks(css='style.css') as demo:
-    # gr.Markdown(TITLE)
-
     gr.HTML(
         """
         <div style="text-align: center; max-width: 1200px; margin: 20px auto;">
@@ -134,11 +129,6 @@ with gr.Blocks(css='style.css') as demo:

         with gr.Accordion('Text Prompt', open=True):

-            # source_prompt = gr.Textbox(label='Source Prompt',
-            #         info='A good prompt describes each frame and most objects in video. Especially, it has the object or attribute that we want to edit or preserve.',
-            #         max_lines=1,
-            #         placeholder='Example: "a silver jeep driving down a curvy road in the countryside"',
-            #         value='a silver jeep driving down a curvy road in the countryside')
             target_prompt = gr.Textbox(label='Target Prompt',
                     info='A reasonable composition of video may achieve better results(e.g., "sunflower" video with "Van Gogh" prompt is better than "sunflower" with "Monet")',
                     max_lines=1,
@@ -154,33 +144,6 @@ with gr.Blocks(css='style.css') as demo:
             with gr.Column():
                 result = gr.Video(label='Result')
                 # result.style(height=512, width=512)
-        # with gr.Accordion('FateZero Parameters for attention fusing', open=True):
-            # cross_replace_steps = gr.Slider(label='Cross-att replace steps',
-            #         info='More steps, replace more cross attention to preserve semantic layout.',
-            #         minimum=0.0,
-            #         maximum=1.0,
-            #         step=0.1,
-            #         value=0.7)
-
-            # self_replace_steps = gr.Slider(label='Self-att replace steps',
-            #         info='More steps, replace more spatial-temporal self-attention to preserve geometry and motion.',
-            #         minimum=0.0,
-            #         maximum=1.0,
-            #         step=0.1,
-            #         value=0.7)
-
-            # enhance_words = gr.Textbox(label='Enhanced words',
-            #         info='Amplify the target-words cross attention',
-            #         max_lines=1,
-            #         placeholder='Example: "watercolor "',
-            #         value='watercolor')
-
-            # enhance_words_value = gr.Slider(label='Target cross-att amplification',
-            #         info='larger value, more elements of target words',
-            #         minimum=0.0,
-            #         maximum=20.0,
-            #         step=1,
-            #         value=10)
         with gr.Accordion('DDIM Parameters', open=True):
             num_steps = gr.Slider(label='Number of Steps',
                     info='larger value has better editing capacity, but takes more time and memory.',
@@ -208,4 +171,4 @@ with gr.Blocks(css='style.css') as demo:
     target_prompt.submit(fn=pipe.run, inputs=inputs, outputs=result)
     run_button.click(fn=pipe.run, inputs=inputs, outputs=result)

-demo.queue().launch(
+demo.queue().launch()
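Note: the surviving UI in app.py is a standard Gradio Blocks layout: a target-prompt textbox, DDIM sliders, a video output, and a run button, with both target_prompt.submit and run_button.click dispatching to pipe.run before demo.queue().launch(). A minimal, self-contained sketch of that wiring pattern follows; the run stub and the slider bounds are illustrative stand-ins, not values taken from the file.

import gradio as gr

def run(target_prompt, num_steps):
    # Stand-in for pipe.run: would return a path to the rendered video.
    return 'result.mp4'

with gr.Blocks() as demo:
    with gr.Accordion('Text Prompt', open=True):
        target_prompt = gr.Textbox(label='Target Prompt', max_lines=1)
    with gr.Accordion('DDIM Parameters', open=True):
        num_steps = gr.Slider(label='Number of Steps',
                              minimum=1, maximum=100, step=1, value=50)
    with gr.Column():
        result = gr.Video(label='Result')
    run_button = gr.Button('Run')

    inputs = [target_prompt, num_steps]
    # Pressing Enter in the textbox and clicking the button call the same function.
    target_prompt.submit(fn=run, inputs=inputs, outputs=result)
    run_button.click(fn=run, inputs=inputs, outputs=result)

# queue() serializes requests so long-running generations do not overlap.
demo.queue().launch()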
inference_followyourpose.py (CHANGED)
@@ -14,41 +14,16 @@ def get_time_string() -> str:
 class merge_config_then_run():
     def __init__(self) -> None:
         # Load the tokenizer
-        # pretrained_model_path = 'FateZero/ckpt/stable-diffusion-v1-4'
         self.tokenizer = None
         self.text_encoder = None
         self.vae = None
         self.unet = None

-
-
-
-
-
-        #     subfolder="tokenizer",
-        #     use_fast=False,
-        # )
-
-        # # Load models and create wrapper for stable diffusion
-        # self.text_encoder = CLIPTextModel.from_pretrained(
-        #     pretrained_model_path,
-        #     subfolder="text_encoder",
-        # )
-
-        # self.vae = AutoencoderKL.from_pretrained(
-        #     pretrained_model_path,
-        #     subfolder="vae",
-        # )
-        # model_config = {
-        #     "lora": 160,
-        #     # temporal_downsample_time: 4
-        #     "SparseCausalAttention_index": ['mid'],
-        #     "least_sc_channel": 640
-        # }
-        # self.unet = UNetPseudo3DConditionModel.from_2d_model(
-        #     os.path.join(pretrained_model_path, "unet"), model_config=model_config
-        # )
-
+    def download_model(self):
+        REPO_ID = 'YueMafighting/FollowYourPose_v1'
+        hf_hub_download(repo_id=REPO_ID, local_dir='./FollowYourPose/checkpoints', local_dir_use_symlinks=False)
+
+
     def run(
         self,
         data_path,
@@ -64,12 +39,12 @@ class merge_config_then_run():
         top_crop=0,
         bottom_crop=0,
     ):
+        self.download_model()
         default_edit_config='FollowYourPose/configs/pose_sample.yaml'
         Omegadict_default_edit_config = OmegaConf.load(default_edit_config)

         dataset_time_string = get_time_string()
         config_now = copy.deepcopy(Omegadict_default_edit_config)
-        # print(f"config_now['pretrained_model_path'] = model_id {model_id}")

         offset_dict = {
             "left": left_crop,
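Note: the new download_model helper fetches the checkpoint repo YueMafighting/FollowYourPose_v1 from the Hugging Face Hub each time run() is called. huggingface_hub.hf_hub_download retrieves a single file and requires a filename argument, while mirroring a whole repository into a local directory is what snapshot_download does; a sketch of both calls is below, with 'checkpoints/pose_sample.yaml' used only as an illustrative filename, not a path taken from the commit.

from huggingface_hub import hf_hub_download, snapshot_download

REPO_ID = 'YueMafighting/FollowYourPose_v1'

# Fetch one known file from the repo (filename is required by hf_hub_download).
single_file = hf_hub_download(
    repo_id=REPO_ID,
    filename='checkpoints/pose_sample.yaml',  # illustrative path, not from the commit
    local_dir='./FollowYourPose/checkpoints',
    local_dir_use_symlinks=False,
)

# Mirror the entire repository into the same local directory instead.
repo_dir = snapshot_download(
    repo_id=REPO_ID,
    local_dir='./FollowYourPose/checkpoints',
    local_dir_use_symlinks=False,
)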
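Note: run() loads the default editing config with OmegaConf and deep-copies it before applying per-request settings such as the crop offsets. A minimal sketch of that pattern, assuming an illustrative 'offset' key that is not necessarily the actual structure of pose_sample.yaml:

import copy
from omegaconf import OmegaConf

# Load the base config once (path as used in the commit).
base_config = OmegaConf.load('FollowYourPose/configs/pose_sample.yaml')

# Deep-copy so per-request edits never mutate the shared default.
config_now = copy.deepcopy(base_config)

# Apply request-specific overrides; the key and values here are illustrative.
offset_dict = {'left': 0, 'right': 0, 'top': 0, 'bottom': 0}
config_now.merge_with(OmegaConf.create({'offset': offset_dict}))

print(OmegaConf.to_yaml(config_now))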