Ë
    Õ†ilA  ã                   óØ  — d dl mZ ddlmZmZ ddlmZ ddlmZm	Z	m
Z
mZmZmZ ddlmZ ddlmZmZmZmZmZ dd	lmZmZmZmZmZmZmZ  ej<                  e«      Z  G d
„ de«      Z! G d„ de«      Z" G d„ de«      Z# G d„ de«      Z$ G d„ de«      Z% G d„ de«      Z& G d„ de«      Z' G d„ de«      Z( G d„ de«      Z) G d„ de«      Z* G d„ de«      Z+ G d „ d!e«      Z, G d"„ d#e«      Z- G d$„ d%e«      Z. G d&„ d'e«      Z/ ed(efd)efd*efd+efd,efd-efg«      Z0 ed.efd/e"fd0e#fd)efd1 ed2g¬3«      fd*efd+efd4e	fd,efd-efg
«      Z1 ed.efd5efd/e%fd0e&fd)efd1 ed6g¬3«      fd*efd+efd7e
fd,efd-efg«      Z2 ed(efd/e(fd0e)fd,e*fd-efg«      Z3 ed(efd)efd*efd+efd,efd-efg«      Z4 ed.efd0e#fd)efd*efd+efd,efd-efg«      Z5 ed(efd0e)fd,e.fd-efg«      Z6e0e1e2e3d8œe4e5e6d9œd:œZ7y;)<é   )Úloggingé   )ÚAutoPipelineBlocksÚSequentialPipelineBlocks)ÚInsertableDicté   )ÚWanAdditionalInputsStepÚWanPrepareFirstFrameLatentsStepÚ#WanPrepareFirstLastFrameLatentsStepÚWanPrepareLatentsStepÚWanSetTimestepsStepÚWanTextInputStep)ÚWanImageVaeDecoderStep)ÚWan22DenoiseStepÚWan22Image2VideoDenoiseStepÚWanDenoiseStepÚWanFLF2VDenoiseStepÚWanImage2VideoDenoiseStep)Ú!WanFirstLastFrameImageEncoderStepÚ$WanFirstLastFrameVaeImageEncoderStepÚWanImageCropResizeStepÚWanImageEncoderStepÚWanImageResizeStepÚWanTextEncoderStepÚWanVaeImageEncoderStepc                   ó0   — e Zd ZeeeegZg d¢Ze	d„ «       Z
y)ÚWanCoreDenoiseStep©ÚinputÚset_timestepsÚprepare_latentsÚdenoisec                  ó   — 	 y)Na`  denoise block that takes encoded conditions and runs the denoising process.
This is a sequential pipeline blocks:
 - `WanTextInputStep` is used to adjust the batch size of the model inputs
 - `WanSetTimestepsStep` is used to set the timesteps
 - `WanPrepareLatentsStep` is used to prepare the latents
 - `WanDenoiseStep` is used to denoise the latents
© ©Úselfs    úx/home/obispo/Crisostomo_bridge/mision_env/lib/python3.12/site-packages/diffusers/modular_pipelines/wan/modular_blocks.pyÚdescriptionzWanCoreDenoiseStep.description;   s   € ðEð	
ó    N)Ú__name__Ú
__module__Ú__qualname__r   r   r   r   Úblock_classesÚblock_namesÚpropertyr(   r$   r)   r'   r   r   2   s/   „ àØØØð	€Mò K€Kàñ
ó ñ
r)   r   c                   ó0   — e Zd ZdZeegZddgZed„ «       Z	y)ÚWanImage2VideoImageEncoderStepÚwanÚimage_resizeÚimage_encoderc                  ó   — y)NzjImage2Video Image Encoder step that resize the image and encode the image to generate the image embeddingsr$   r%   s    r'   r(   z*WanImage2VideoImageEncoderStep.descriptionN   s   € à{r)   N)
r*   r+   r,   Ú
model_namer   r   r-   r.   r/   r(   r$   r)   r'   r1   r1   I   s0   „ Ø€JØ'Ð)<Ð=€MØ! ?Ð3€Kàñ|ó ñ|r)   r1   c                   ó0   — e Zd ZdZeegZddgZed„ «       Z	y)Ú!WanImage2VideoVaeImageEncoderStepr2   r3   Úvae_image_encoderc                  ó   — y)NzvImage2Video Vae Image Encoder step that resize the image and encode the first frame image to its latent representationr$   r%   s    r'   r(   z-WanImage2VideoVaeImageEncoderStep.descriptionY   s   € ð Hr)   N)
r*   r+   r,   r6   r   r   r-   r.   r/   r(   r$   r)   r'   r8   r8   T   s1   „ Ø€JØ'Ð)?Ð@€MØ!Ð#6Ð7€KàñHó ñHr)   r8   c                   óD   — e Zd Ze edg¬«      eeeegZ	g d¢Z
ed„ «       Zy)ÚWanImage2VideoCoreDenoiseStepÚfirst_frame_latents©Úimage_latent_inputs©r   Úadditional_inputsr    r!   Úprepare_first_frame_latentsr"   c                  ó   — 	 y)Na2  denoise block that takes encoded text and image latent conditions and runs the denoising process.
This is a sequential pipeline blocks:
 - `WanTextInputStep` is used to adjust the batch size of the model inputs
 - `WanAdditionalInputsStep` is used to adjust the batch size of the latent conditions
 - `WanSetTimestepsStep` is used to set the timesteps
 - `WanPrepareLatentsStep` is used to prepare the latents
 - `WanPrepareFirstFrameLatentsStep` is used to prepare the first frame latent conditions
 - `WanImage2VideoDenoiseStep` is used to denoise the latents
r$   r%   s    r'   r(   z)WanImage2VideoCoreDenoiseStep.descriptionq   ó   € ðPð		
r)   N)r*   r+   r,   r   r	   r   r   r
   r   r-   r.   r/   r(   r$   r)   r'   r<   r<   _   s?   „ àÙÐ5JÐ4KÔLØØØ'Ø!ð€Mò€Kð ñ

ó ñ

r)   r<   c                   ó2   — e Zd ZdZeeegZg d¢Ze	d„ «       Z
y)ÚWanFLF2VImageEncoderStepr2   )r3   Úlast_image_resizer4   c                  ó   — y)Nz{FLF2V Image Encoder step that resize and encode and encode the first and last frame images to generate the image embeddingsr$   r%   s    r'   r(   z$WanFLF2VImageEncoderStep.descriptionˆ   s   € ð Mr)   N)r*   r+   r,   r6   r   r   r   r-   r.   r/   r(   r$   r)   r'   rF   rF   ƒ   s.   „ Ø€JØ'Ð)?ÐAbÐc€MÚH€KàñMó ñMr)   rF   c                   ó2   — e Zd ZdZeeegZg d¢Ze	d„ «       Z
y)ÚWanFLF2VVaeImageEncoderStepr2   )r3   rG   r9   c                  ó   — y)Nz€FLF2V Vae Image Encoder step that resize and encode and encode the first and last frame images to generate the latent conditionsr$   r%   s    r'   r(   z'WanFLF2VVaeImageEncoderStep.description“   s   € ð Rr)   N)r*   r+   r,   r6   r   r   r   r-   r.   r/   r(   r$   r)   r'   rJ   rJ   Ž   s.   „ Ø€JØ'Ð)?ÐAeÐf€MÚL€KàñRó ñRr)   rJ   c                   óD   — e Zd Ze edg¬«      eeeegZ	g d¢Z
ed„ «       Zy)ÚWanFLF2VCoreDenoiseStepÚfirst_last_frame_latentsr>   )r   rA   r    r!   Ú prepare_first_last_frame_latentsr"   c                  ó   — 	 y)Na*  denoise block that takes encoded text and image latent conditions and runs the denoising process.
This is a sequential pipeline blocks:
 - `WanTextInputStep` is used to adjust the batch size of the model inputs
 - `WanAdditionalInputsStep` is used to adjust the batch size of the latent conditions
 - `WanSetTimestepsStep` is used to set the timesteps
 - `WanPrepareLatentsStep` is used to prepare the latents
 - `WanPrepareFirstLastFrameLatentsStep` is used to prepare the latent conditions
 - `WanImage2VideoDenoiseStep` is used to denoise the latents
r$   r%   s    r'   r(   z#WanFLF2VCoreDenoiseStep.description«   rD   r)   N)r*   r+   r,   r   r	   r   r   r   r   r-   r.   r/   r(   r$   r)   r'   rM   rM   ™   s?   „ àÙÐ5OÐ4PÔQØØØ+Øð€Mò€Kð ñ

ó ñ

r)   rM   c                   ó4   — e Zd ZeegZddgZddgZed„ «       Z	y)ÚWanAutoImageEncoderStepÚflf2v_image_encoderÚimage2video_image_encoderÚ
last_imageÚimagec                  ó   — 	 y)Nal  Image Encoder step that encode the image to generate the image embeddingsThis is an auto pipeline block that works for image2video tasks. - `WanFLF2VImageEncoderStep` (flf2v) is used when `last_image` is provided. - `WanImage2VideoImageEncoderStep` (image2video) is used when `image` is provided. - if `last_image` or `image` is not provided, step will be skipped.r$   r%   s    r'   r(   z#WanAutoImageEncoderStep.descriptionÀ   ó   € ðUð	
r)   N)
r*   r+   r,   rF   r1   r-   r.   Úblock_trigger_inputsr/   r(   r$   r)   r'   rR   rR   »   s5   „ Ø-Ð/MÐN€MØ(Ð*EÐF€KØ(¨'Ð2Ðàñ
ó ñ
r)   rR   c                   ó4   — e Zd ZeegZddgZddgZed„ «       Z	y)ÚWanAutoVaeImageEncoderStepÚflf2v_vae_image_encoderÚimage2video_vae_image_encoderrU   rV   c                  ó   — 	 y)Nas  Vae Image Encoder step that encode the image to generate the image latentsThis is an auto pipeline block that works for image2video tasks. - `WanFLF2VVaeImageEncoderStep` (flf2v) is used when `last_image` is provided. - `WanImage2VideoVaeImageEncoderStep` (image2video) is used when `image` is provided. - if `last_image` or `image` is not provided, step will be skipped.r$   r%   s    r'   r(   z&WanAutoVaeImageEncoderStep.descriptionÑ   rX   r)   N)
r*   r+   r,   rJ   r8   r-   r.   rY   r/   r(   r$   r)   r'   r[   r[   Ì   s5   „ Ø0Ð2SÐT€MØ,Ð.MÐN€KØ(¨'Ð2Ðàñ
ó ñ
r)   r[   c                   ó<   — e Zd ZeeegZg d¢Zg d¢Ze	de
fd„«       Zy)ÚWanAutoDenoiseStep)Úflf2vÚimage2videoÚ
text2video)rN   r=   NÚreturnc                  ó   — 	 y)Na«  Denoise step that iteratively denoise the latents. This is a auto pipeline block that works for text2video and image2video tasks. - `WanCoreDenoiseStep` (text2video) for text2vid tasks. - `WanCoreImage2VideoCoreDenoiseStep` (image2video) for image2video tasks. - if `first_frame_latents` is provided, `WanCoreImage2VideoDenoiseStep` will be used.
 - if `first_frame_latents` is not provided, `WanCoreDenoiseStep` will be used.
r$   r%   s    r'   r(   zWanAutoDenoiseStep.descriptionæ   s   € ðbð	
r)   N)r*   r+   r,   rM   r<   r   r-   r.   rY   r/   Ústrr(   r$   r)   r'   r`   r`   Ý   s8   „ àØ%Øð€Mò
 9€KÚTÐàð
˜Sò 
ó ñ
r)   r`   c                   ó2   — e Zd ZeeeeegZg d¢Z	e
d„ «       Zy)ÚWanAutoBlocks)Útext_encoderr4   r9   r"   Údecodec                  ó   — 	 y)NzvAuto Modular pipeline for text-to-video using Wan.
- for text-to-video generation, all you need to provide is `prompt`r$   r%   s    r'   r(   zWanAutoBlocks.description  ó   € ðTð	
r)   N)r*   r+   r,   r   rR   r[   r`   r   r-   r.   r/   r(   r$   r)   r'   rh   rh   ó   s3   „ àØØ"ØØð€Mò€Kð ñ
ó ñ
r)   rh   c                   ó0   — e Zd ZeeeegZg d¢Ze	d„ «       Z
y)ÚWan22CoreDenoiseStepr   c                  ó   — 	 y)Nal  denoise block that takes encoded conditions and runs the denoising process.
This is a sequential pipeline blocks:
 - `WanTextInputStep` is used to adjust the batch size of the model inputs
 - `WanSetTimestepsStep` is used to set the timesteps
 - `WanPrepareLatentsStep` is used to prepare the latents
 - `Wan22DenoiseStep` is used to denoise the latents in wan2.2
r$   r%   s    r'   r(   z Wan22CoreDenoiseStep.description  s   € ðQð	
r)   N)r*   r+   r,   r   r   r   r   r-   r.   r/   r(   r$   r)   r'   rn   rn     s/   „ àØØØð	€Mò K€Kàñ
ó ñ
r)   rn   c                   óD   — e Zd Ze edg¬«      eeeegZ	g d¢Z
ed„ «       Zy)ÚWan22Image2VideoCoreDenoiseStepr=   r>   r@   c                  ó   — 	 y)Na>  denoise block that takes encoded text and image latent conditions and runs the denoising process.
This is a sequential pipeline blocks:
 - `WanTextInputStep` is used to adjust the batch size of the model inputs
 - `WanAdditionalInputsStep` is used to adjust the batch size of the latent conditions
 - `WanSetTimestepsStep` is used to set the timesteps
 - `WanPrepareLatentsStep` is used to prepare the latents
 - `WanPrepareFirstFrameLatentsStep` is used to prepare the first frame latent conditions
 - `Wan22Image2VideoDenoiseStep` is used to denoise the latents in wan2.2
r$   r%   s    r'   r(   z+Wan22Image2VideoCoreDenoiseStep.description9  s   € ð\ð		
r)   N)r*   r+   r,   r   r	   r   r   r
   r   r-   r.   r/   r(   r$   r)   r'   rq   rq   '  s?   „ àÙÐ5JÐ4KÔLØØØ'Ø#ð€Mò€Kð ñ

ó ñ

r)   rq   c                   ó:   — e Zd ZeegZddgZddgZede	fd„«       Z
y)ÚWan22AutoDenoiseSteprb   rc   r=   Nrd   c                  ó   — 	 y)Na¯  Denoise step that iteratively denoise the latents. This is a auto pipeline block that works for text2video and image2video tasks. - `Wan22Image2VideoCoreDenoiseStep` (image2video) for image2video tasks. - `Wan22CoreDenoiseStep` (text2video) for text2vid tasks. - if `first_frame_latents` is provided, `Wan22Image2VideoCoreDenoiseStep` will be used.
 - if `first_frame_latents` is not provided, `Wan22CoreDenoiseStep` will be used.
r$   r%   s    r'   r(   z Wan22AutoDenoiseStep.descriptionO  s   € ðdð	
r)   )r*   r+   r,   rq   rn   r-   r.   rY   r/   rf   r(   r$   r)   r'   rt   rt   G  s?   „ à'Øð€Mð ! ,Ð/€KØ1°4Ð8Ðàð
˜Sò 
ó ñ
r)   rt   c                   ó0   — e Zd ZeeeegZg d¢Ze	d„ «       Z
y)ÚWan22AutoBlocks)ri   r9   r"   rj   c                  ó   — 	 y)NzyAuto Modular pipeline for text-to-video using Wan2.2.
- for text-to-video generation, all you need to provide is `prompt`r$   r%   s    r'   r(   zWan22AutoBlocks.descriptioni  rl   r)   N)r*   r+   r,   r   r[   rt   r   r-   r.   r/   r(   r$   r)   r'   rw   rw   [  s0   „ àØ"ØØð	€Mò€Kð ñ
ó ñ
r)   rw   ri   r   r    r!   r"   rj   r3   r4   r9   rA   r=   r>   rB   rG   rN   rO   )rc   rb   ra   Úauto)rc   rb   ry   )zwan2.1zwan2.2N)8Úutilsr   Úmodular_pipeliner   r   Úmodular_pipeline_utilsr   Úbefore_denoiser	   r
   r   r   r   r   Údecodersr   r"   r   r   r   r   r   Úencodersr   r   r   r   r   r   r   Ú
get_loggerr*   Úloggerr   r1   r8   r<   rF   rJ   rM   rR   r[   r`   rh   rn   rq   rt   rw   ÚTEXT2VIDEO_BLOCKSÚIMAGE2VIDEO_BLOCKSÚFLF2V_BLOCKSÚAUTO_BLOCKSÚTEXT2VIDEO_BLOCKS_WAN22ÚIMAGE2VIDEO_BLOCKS_WAN22ÚAUTO_BLOCKS_WAN22Ú
ALL_BLOCKSr$   r)   r'   ú<module>rŠ      sŠ  ðõ ß KÝ 3÷÷ õ -÷õ ÷÷ ñ ð 
ˆ×	Ñ	˜HÓ	%€ô

Ð1ô 
ô.|Ð%=ô |ôHÐ(@ô Hô
Ð$<ô 
ôHMÐ7ô MôRÐ":ô Rô
Ð6ô 
ôD
Ð0ô 
ô"
Ð!3ô 
ô"
Ð+ô 
ô,
Ð,ô 
ô:
Ð3ô 
ô.
Ð&>ô 
ô@
Ð-ô 
ô(
Ð.ô 
ñ2 #à	Ð+Ð,Ø	Ð"Ð#Ø	Ð-Ð.Ø	Ð1Ð2Ø	NÐ#Ø	Ð)Ð*ðó	Ð ñ $à	Ð+Ð,Ø	Ð8Ð9Ø	Ð?Ð@Ø	Ð"Ð#Ø	Ñ5ÐK`ÐJaÔbÐcØ	Ð-Ð.Ø	Ð1Ð2Ø	&Ð(GÐHØ	Ð-Ð.Ø	Ð)Ð*ðóÐ ñ  à	Ð+Ð,Ø	Ð4Ð5Ø	Ð2Ð3Ø	Ð9Ð:Ø	Ð"Ð#Ø	Ñ5ÐKeÐJfÔgÐhØ	Ð-Ð.Ø	Ð1Ð2Ø	+Ð-PÐQØ	Ð'Ð(Ø	Ð)Ð*ðó€ñ  à	Ð+Ð,Ø	Ð1Ð2Ø	Ð8Ð9Ø	Ð&Ð'Ø	Ð)Ð*ðó€ñ )à	Ð+Ð,Ø	Ð"Ð#Ø	Ð-Ð.Ø	Ð1Ð2Ø	Ð$Ð%Ø	Ð)Ð*ðó	Ð ñ *à	Ð+Ð,Ø	Ð?Ð@Ø	Ð"Ð#Ø	Ð-Ð.Ø	Ð1Ð2Ø	Ð$Ð%Ø	Ð)Ð*ðó
Ð ñ #à	Ð+Ð,Ø	Ð8Ð9Ø	Ð(Ð)Ø	Ð)Ð*ð	óÐ ð (Ø)ØØñ	ð .Ø/Ø!ññ
r)   