ó
    +ýòhùE  ã                   ó  • S SK JrJrJrJr  S SKrS SKJr  SSKJ	r	J
r
  SSKJrJr  SSKJrJrJr  SSKJr  S	S
KJrJr  SSKJr  \" 5       (       a  S SKJs  Jr  SrOSr\R<                  " \5      r Sr!SS jr" " S S\5      r#g)é    )ÚCallableÚListÚOptionalÚUnionN)ÚXLMRobertaTokenizeré   )ÚUNet2DConditionModelÚVQModel)ÚDDIMSchedulerÚDDPMScheduler)Úis_torch_xla_availableÚloggingÚreplace_example_docstring)Úrandn_tensoré   )ÚDiffusionPipelineÚImagePipelineOutputé   )ÚMultilingualCLIPTFav  
    Examples:
        ```py
        >>> from diffusers import KandinskyPipeline, KandinskyPriorPipeline
        >>> import torch

        >>> pipe_prior = KandinskyPriorPipeline.from_pretrained("kandinsky-community/Kandinsky-2-1-prior")
        >>> pipe_prior.to("cuda")

        >>> prompt = "red cat, 4k photo"
        >>> out = pipe_prior(prompt)
        >>> image_emb = out.image_embeds
        >>> negative_image_emb = out.negative_image_embeds

        >>> pipe = KandinskyPipeline.from_pretrained("kandinsky-community/kandinsky-2-1")
        >>> pipe.to("cuda")

        >>> image = pipe(
        ...     prompt,
        ...     image_embeds=image_emb,
        ...     negative_image_embeds=negative_image_emb,
        ...     height=768,
        ...     width=768,
        ...     num_inference_steps=100,
        ... ).images

        >>> image[0].save("cat.png")
        ```
c                 ón   • XS-  -  nXS-  -  S:w  a  US-  nXS-  -  nXS-  -  S:w  a  US-  nX2-  XB-  4$ )Nr   r   r   © )ÚhÚwÚscale_factorÚnew_hÚnew_ws        Új/home/james-whalen/.local/lib/python3.13/site-packages/diffusers/pipelines/kandinsky/pipeline_kandinsky.pyÚget_new_h_wr   K   s[   € Ø˜q‘Ñ €EØ˜‰?Ñ˜aÓØ‰
ˆØ˜q‘Ñ €EØ˜‰?Ñ˜aÓØ‰
ˆØÑ Ñ!5Ð5Ð5ó    c            !       ó"  ^ • \ rS rSrSrSrS\S\S\S\	\
\4   S\4
U 4S	 jjrS
 r SS jr\R"                  " 5       \" \5                  SS\	\\\   4   S\	\R,                  \\R,                     4   S\	\R,                  \\R,                     4   S\\	\\\   4      S\S\S\S\S\S\\	\R4                  \\R4                     4      S\\R,                     S\\   S\\\\\R,                  /S4      S\S\4S jj5       5       rSrU =r$ ) ÚKandinskyPipelineéU   aõ  
Pipeline for text-to-image generation using Kandinsky

This model inherits from [`DiffusionPipeline`]. Check the superclass documentation for the generic methods the
library implements for all the pipelines (such as downloading or saving, running on a particular device, etc.)

Args:
    text_encoder ([`MultilingualCLIP`]):
        Frozen text-encoder.
    tokenizer ([`XLMRobertaTokenizer`]):
        Tokenizer of class
    scheduler (Union[`DDIMScheduler`,`DDPMScheduler`]):
        A scheduler to be used in combination with `unet` to generate image latents.
    unet ([`UNet2DConditionModel`]):
        Conditional U-Net architecture to denoise the image embedding.
    movq ([`VQModel`]):
        MoVQ Decoder to generate the image from the latents.
ztext_encoder->unet->movqÚtext_encoderÚ	tokenizerÚunetÚ	schedulerÚmovqc                 ó°   >• [         TU ]  5         U R                  UUUUUS9  S[        U R                  R
                  R                  5      S-
  -  U l        g )N)r#   r$   r%   r&   r'   r   r   )ÚsuperÚ__init__Úregister_modulesÚlenr'   ÚconfigÚblock_out_channelsÚmovq_scale_factor)Úselfr#   r$   r%   r&   r'   Ú	__class__s         €r   r*   ÚKandinskyPipeline.__init__k   s\   ø€ ô 	‰ÑÔà×ÑØ%ØØØØð 	ñ 	
ð "#¤s¨4¯9©9×+;Ñ+;×+NÑ+NÓ'OÐRSÑ'SÑ!TˆÕr   c                 ó¶   • Uc  [        XX2S9nO<UR                  U:w  a  [        SUR                   SU 35      eUR                  U5      nXVR                  -  nU$ )N)Ú	generatorÚdeviceÚdtypezUnexpected latents shape, got z, expected )r   ÚshapeÚ
ValueErrorÚtoÚinit_noise_sigma)r0   r7   r6   r5   r4   Úlatentsr&   s          r   Úprepare_latentsÚ!KandinskyPipeline.prepare_latents   s`   € Ø‰?Ü" 5ÀfÑZ‰Gà}‰} Ó%Ü Ð#AÀ'Ç-Á-ÀÐP[Ð\aÐ[bÐ!cÓdÐdØ—j‘j Ó(ˆGà×6Ñ6Ñ6ˆØˆr   Nc                 ó^  • [        U[        5      (       a  [        U5      OSnU R                  USSSSSSS9nUR                  nU R                  USSS9R                  n	U	R
                  S	   UR
                  S	   :¼  a…  [        R                  " X‰5      (       dj  U R                  R                  U	S S 2U R                  R                  S-
  S	24   5      n
[        R                  S
U R                  R                   SU
 35        UR                  U5      nUR                  R                  U5      nU R                  X‹S9u  pÍUR                  USS9nUR                  USS9nUR                  USS9nU(       Ga²  Uc  S/U-  nO†[!        U5      [!        U5      La$  [#        S[!        U5       S[!        U5       S35      e[        U[$        5      (       a  U/nO2U[        U5      :w  a!  ['        SU S[        U5       SU SU S3	5      eUnU R                  USSSSSSS9nUR                  R                  U5      nUR                  R                  U5      nU R                  UUS9u  nnUR
                  S   nUR)                  SU5      nUR+                  Xc-  U5      nUR
                  S   nUR)                  SUS5      nUR+                  Xc-  US	5      nUR                  USS9n[        R,                  " UU/5      n[        R,                  " UU/5      n[        R,                  " UU/5      nXÍU4$ )Nr   Ú
max_lengthTéM   Úpt)ÚpaddingÚ
truncationr?   Úreturn_attention_maskÚadd_special_tokensÚreturn_tensorsÚlongest)rB   rF   éÿÿÿÿz\The following part of your input was truncated because CLIP can only handle sequences up to z	 tokens: )Ú	input_idsÚattention_maskr   ©ÚdimÚ z?`negative_prompt` should be the same type to `prompt`, but got z != Ú.z`negative_prompt`: z has batch size z, but `prompt`: zT. Please make sure that passed `negative_prompt` matches the batch size of `prompt`.)rB   r?   rC   rD   rE   rF   )Ú
isinstanceÚlistr,   r$   rI   r7   ÚtorchÚequalÚbatch_decodeÚmodel_max_lengthÚloggerÚwarningr9   rJ   r#   Úrepeat_interleaveÚtypeÚ	TypeErrorÚstrr8   ÚrepeatÚviewÚcat)r0   Úpromptr5   Únum_images_per_promptÚdo_classifier_free_guidanceÚnegative_promptÚ
batch_sizeÚtext_inputsÚtext_input_idsÚuntruncated_idsÚremoved_textÚ	text_maskÚprompt_embedsÚtext_encoder_hidden_statesÚuncond_tokensÚuncond_inputÚuncond_text_input_idsÚuncond_text_maskÚnegative_prompt_embedsÚ!uncond_text_encoder_hidden_statesÚseq_lens                        r   Ú_encode_promptÚ KandinskyPipeline._encode_promptŠ   s§  € ô %/¨v´t×$<Ñ$<”S˜”[À!ˆ
à—n‘nØØ ØØØ"&Ø#Øð %ð 
ˆð %×.Ñ.ˆØŸ.™.¨¸ÐSW˜.ÐX×bÑbˆà× Ñ  Ñ$¨×(<Ñ(<¸RÑ(@Ó@ÌÏÊÐUc×IuÑIuØŸ>™>×6Ñ6°ÂqÈ$Ï.É.×JiÑJiÐlmÑJmÐprÐJrÐGrÑ7sÓtˆLÜN‰NðØ—N‘N×3Ñ3Ð4°I¸l¸^ðMôð
 (×*Ñ*¨6Ó2ˆØ×.Ñ.×1Ñ1°&Ó9ˆ	à48×4EÑ4EØ$ð 5Fð 5
Ñ1ˆð &×7Ñ7Ð8MÐSTÐ7ÐUˆØ%?×%QÑ%QÐRgÐmnÐ%QÐ%oÐ"Ø×/Ñ/Ð0EÈ1Ð/ÐMˆ	ç&àÑ&Ø!#  zÑ 1‘Üf“¤T¨/Ó%:Ò:ÜØUÔVZÐ[jÓVkÐUlð mÜ˜V›~ Qð(óð ô ˜O¬S×1Ñ1Ø!0Ð 1‘Øœs ?Ó3Ó3Ü Ø)¨/Ð):Ð:JÌ3ÈÓK_ÐJ`ð aØxÐ/°
¨|ð <3ð3óð ð !0àŸ>™>ØØ$ØØØ&*Ø#'Ø#ð *ð ˆLð %1×$:Ñ$:×$=Ñ$=¸fÓ$EÐ!Ø+×:Ñ:×=Ñ=¸fÓEÐàHL×HYÑHYØ/Ð@Pð IZð IÑEÐ"Ð$Eð -×2Ñ2°1Ñ5ˆGØ%;×%BÑ%BÀ1ÐF[Ó%\Ð"Ø%;×%@Ñ%@ÀÑAcÐelÓ%mÐ"à7×=Ñ=¸aÑ@ˆGØ0Q×0XÑ0XÐYZÐ\qÐstÓ0uÐ-Ø0Q×0VÑ0VØÑ2°G¸Ró1Ð-ð  0×AÑAÐBWÐ]^ÐAÐ_Ðô "ŸIšIÐ'=¸}Ð&MÓNˆMÜ).¯ªÐ4UÐWqÐ3rÓ)sÐ&äŸ	š	Ð#3°YÐ"?Ó@ˆIà¸)ÐCÐCr   r^   Úimage_embedsÚnegative_image_embedsra   ÚheightÚwidthÚnum_inference_stepsÚguidance_scaler_   r4   r;   Úoutput_typeÚcallbackÚcallback_stepsÚreturn_dictc           	      ó|  • [        U[        5      (       a  SnO8[        U[        5      (       a  [        U5      nO[	        S[        U5       35      eU R                  nUU	-  nUS:„  nU R                  UUU	UU5      u  nnn[        U[        5      (       a  [        R                  " USS9n[        U[        5      (       a  [        R                  " USS9nU(       aN  UR                  U	SS9nUR                  U	SS9n[        R                  " X2/SS9R                  UR                  US9nU R                  R                  UUS9  U R                  R                  nU R                   R"                  R$                  n['        XVU R(                  5      u  pVU R+                  UUXV4UR                  UU
UU R                  5      n[-        U R/                  U5      5       GH˜  u  nnU(       a  [        R                  " U/S-  5      OUnUUS	.nU R!                  UUUUS
S9S   nU(       aj  UR1                  UR2                  S   SS9u  nnUR5                  S5      u  nnUR5                  S5      u  nn UUUU-
  -  -   n[        R                  " UU /SS9n[7        U R                  R"                  S5      (       a$  U R                  R"                  R8                  S;   d   UR1                  UR2                  S   SS9u  nnU R                  R;                  UUUU
S9R<                  nUb-  UU-  S:X  a$  U[?        U R                  SS5      -  n!U" U!UU5        [@        (       d  GMƒ  [B        RD                  " 5         GM›     U RF                  RI                  USS9S   n"U RK                  5         US;  a  [	        SU 35      eUS;   aX  U"S-  S-   n"U"RM                  SS5      n"U"RO                  5       RQ                  SSSS5      RS                  5       RU                  5       n"US:X  a  U RW                  U"5      n"U(       d  U"4$ [Y        U"S9$ )at  
Function invoked when calling the pipeline for generation.

Args:
    prompt (`str` or `List[str]`):
        The prompt or prompts to guide the image generation.
    image_embeds (`torch.Tensor` or `List[torch.Tensor]`):
        The clip image embeddings for text prompt, that will be used to condition the image generation.
    negative_image_embeds (`torch.Tensor` or `List[torch.Tensor]`):
        The clip image embeddings for negative text prompt, will be used to condition the image generation.
    negative_prompt (`str` or `List[str]`, *optional*):
        The prompt or prompts not to guide the image generation. Ignored when not using guidance (i.e., ignored
        if `guidance_scale` is less than `1`).
    height (`int`, *optional*, defaults to 512):
        The height in pixels of the generated image.
    width (`int`, *optional*, defaults to 512):
        The width in pixels of the generated image.
    num_inference_steps (`int`, *optional*, defaults to 100):
        The number of denoising steps. More denoising steps usually lead to a higher quality image at the
        expense of slower inference.
    guidance_scale (`float`, *optional*, defaults to 4.0):
        Guidance scale as defined in [Classifier-Free Diffusion
        Guidance](https://huggingface.co/papers/2207.12598). `guidance_scale` is defined as `w` of equation 2.
        of [Imagen Paper](https://huggingface.co/papers/2205.11487). Guidance scale is enabled by setting
        `guidance_scale > 1`. Higher guidance scale encourages to generate images that are closely linked to
        the text `prompt`, usually at the expense of lower image quality.
    num_images_per_prompt (`int`, *optional*, defaults to 1):
        The number of images to generate per prompt.
    generator (`torch.Generator` or `List[torch.Generator]`, *optional*):
        One or a list of [torch generator(s)](https://pytorch.org/docs/stable/generated/torch.Generator.html)
        to make generation deterministic.
    latents (`torch.Tensor`, *optional*):
        Pre-generated noisy latents, sampled from a Gaussian distribution, to be used as inputs for image
        generation. Can be used to tweak the same generation with different prompts. If not provided, a latents
        tensor will ge generated by sampling using the supplied random `generator`.
    output_type (`str`, *optional*, defaults to `"pil"`):
        The output format of the generate image. Choose between: `"pil"` (`PIL.Image.Image`), `"np"`
        (`np.array`) or `"pt"` (`torch.Tensor`).
    callback (`Callable`, *optional*):
        A function that calls every `callback_steps` steps during inference. The function is called with the
        following arguments: `callback(step: int, timestep: int, latents: torch.Tensor)`.
    callback_steps (`int`, *optional*, defaults to 1):
        The frequency at which the `callback` function is called. If not specified, the callback is called at
        every step.
    return_dict (`bool`, *optional*, defaults to `True`):
        Whether or not to return a [`~pipelines.ImagePipelineOutput`] instead of a plain tuple.

Examples:

Returns:
    [`~pipelines.ImagePipelineOutput`] or `tuple`
r   z2`prompt` has to be of type `str` or `list` but is g      ð?r   rK   )r6   r5   )r5   r   )Útext_embedsrs   F)ÚsampleÚtimestepÚencoder_hidden_statesÚadded_cond_kwargsr|   Úvariance_type)ÚlearnedÚlearned_range)r4   ÚorderT)Úforce_not_quantizer   )rA   ÚnpÚpilzIOnly the output types `pt`, `pil` and `np` are supported not output_type=)rˆ   r‰   g      à?r   r‰   )Úimages)-rO   rZ   rP   r,   r8   rX   Ú_execution_devicerq   rQ   r]   rW   r9   r6   r&   Úset_timestepsÚ	timestepsr%   r-   Úin_channelsr   r/   r<   Ú	enumerateÚprogress_barÚsplitr7   ÚchunkÚhasattrrƒ   ÚstepÚprev_sampleÚgetattrÚXLA_AVAILABLEÚxmÚ	mark_stepr'   ÚdecodeÚmaybe_free_model_hooksÚclampÚcpuÚpermuteÚfloatÚnumpyÚnumpy_to_pilr   )#r0   r^   rs   rt   ra   ru   rv   rw   rx   r_   r4   r;   ry   rz   r{   r|   rb   r5   r`   rh   ri   Ú_Útimesteps_tensorÚnum_channels_latentsÚiÚtÚlatent_model_inputr‚   Ú
noise_predÚvariance_predÚnoise_pred_uncondÚnoise_pred_textÚvariance_pred_textÚstep_idxÚimages#                                      r   Ú__call__ÚKandinskyPipeline.__call__ð   sE  € ôR fœc×"Ñ"Ø‰JÜ˜¤×%Ñ%Ü˜V›‰JäÐQÔRVÐW]ÓR^ÐQ_Ð`ÓaÐaà×'Ñ'ˆàÐ"7Ñ7ˆ
Ø&4°sÑ&:Ð#à7;×7JÑ7JØFÐ1Ð3NÐP_ó8
Ñ4ˆÐ1°1ô l¤D×)Ñ)Ü Ÿ9š9 \°qÑ9ˆLÜÐ+¬T×2Ñ2Ü$)§I¢IÐ.CÈÑ$KÐ!æ&Ø'×9Ñ9Ð:OÐUVÐ9ÐWˆLØ$9×$KÑ$KÐLaÐghÐ$KÐ$iÐ!ä Ÿ9š9Ð&;Ð%JÐPQÑR×UÑUØ#×)Ñ)°&ð Vð ˆLð 	‰×$Ñ$Ð%8ÀÐ$ÑHØŸ>™>×3Ñ3Ðà#Ÿy™y×/Ñ/×;Ñ;Ðä# F°4×3IÑ3IÓJ‰ˆð ×&Ñ&ØÐ-¨vÐ=Ø&×,Ñ,ØØØØN‰Nó
ˆô ˜d×/Ñ/Ð0@ÓA×B‰DˆAˆqæ=X¤§¢¨G¨9°q©=Ô!9Ð^eÐà0=È|Ñ \ÐØŸ™Ø)ØØ&@Ø"3Ø!ð #ð ð ñˆJö +Ø,6×,<Ñ,<¸W¿]¹]È1Ñ=MÐSTÐ,<Ð,UÑ)
˜MØ5?×5EÑ5EÀaÓ5HÑ2Ð! ?Ø(5×(;Ñ(;¸AÓ(>Ñ%Ð%Ø.°À?ÐUfÑCfÑ1gÑg
Ü"ŸYšY¨
Ð4FÐ'GÈQÑO
ô ˜Ÿ™×-Ñ-¨×?Ñ?Ø—N‘N×)Ñ)×7Ñ7Ð;WÓWà *× 0Ñ 0°·±¸qÑ1AÀqÐ 0Ð I‘
˜Að —n‘n×)Ñ)ØØØØ#ð	 *ð ÷
 ‰kð ð Ñ#¨¨NÑ(:¸aÓ(?Ø¤¨¯©¸ÀÓ CÑCÙ˜ 1 gÔ.ç}Ü—’—ñO CðT —	‘	× Ñ  ¸TÐ ÐBÀ8ÑLˆà×#Ñ#Ô%àÐ1Ó1ÜÐhÐitÐhuÐvÓwÐwà˜-Ó'Ø˜C‘K #Ñ%ˆEØ—K‘K  1Ó%ˆEØ—I‘I“K×'Ñ'¨¨1¨a°Ó3×9Ñ9Ó;×AÑAÓCˆEà˜%ÓØ×%Ñ% eÓ,ˆEæØ8ˆOä"¨%Ñ0Ð0r   )r/   )N)Né   r±   éd   g      @r   NNr‰   Nr   T) Ú__name__Ú
__module__Ú__qualname__Ú__firstlineno__Ú__doc__Úmodel_cpu_offload_seqr   r   r	   r   r   r   r
   r*   r<   rq   rQ   Úno_gradr   ÚEXAMPLE_DOC_STRINGrZ   r   ÚTensorr   ÚintrŸ   Ú	Generatorr   Úboolr¯   Ú__static_attributes__Ú__classcell__)r1   s   @r   r!   r!   U   së  ø† ñð& 7ÐðUà&ðUð 'ðUð #ð	Uð
 ˜¨Ð5Ñ6ðUð ÷Uò(	ð" ôdDðL ‡]‚]ƒ_ÙÐ1Ó2ð <@ØØØ#&Ø #Ø%&ØMQØ*.Ø%*ØGKØØ ñ!q1àc˜4 ™9nÑ%ðq1ð ˜EŸL™L¨$¨u¯|©|Ñ*<Ð<Ñ=ðq1ð  % U§\¡\°4¸¿¹Ñ3EÐ%EÑFð	q1ð
 " %¨¨T°#©Y¨Ñ"7Ñ8ðq1ð ðq1ð ðq1ð !ðq1ð ðq1ð  #ðq1ð ˜E %§/¡/°4¸¿¹Ñ3HÐ"HÑIÑJðq1ð ˜%Ÿ,™,Ñ'ðq1ð ˜c‘]ðq1ð ˜8 S¨#¨u¯|©|Ð$<¸dÐ$BÑCÑDðq1ð ðq1ð  ô!q1ó 3ó öq1r   r!   )é   )$Útypingr   r   r   r   rQ   Útransformersr   Úmodelsr	   r
   Ú
schedulersr   r   Úutilsr   r   r   Úutils.torch_utilsr   Úpipeline_utilsr   r   r#   r   Útorch_xla.core.xla_modelÚcoreÚ	xla_modelr˜   r—   Ú
get_loggerr³   rU   rº   r   r!   r   r   r   Ú<module>rÍ      sy   ð÷ 3Ó 2ã õ÷ 4ß 6÷ñ õ
 .ß CÝ *ñ ×Ñß)Ð)àMà€Mà	×	Ò	˜HÓ	%€ðÐ ô>6ôN1Ð)õ N1r   