
from typing import Any, Callable, Dict, List, Optional, Tuple, Union

import torch
from transformers import CLIPTextModelWithProjection, CLIPTokenizer

from ...image_processor import PipelineImageInput, VaeImageProcessor
from ...models import UVit2DModel, VQModel
from ...schedulers import AmusedScheduler
from ...utils import is_torch_xla_available, replace_example_docstring
from ..pipeline_utils import DeprecatedPipelineMixin, DiffusionPipeline, ImagePipelineOutput


if is_torch_xla_available():
    import torch_xla.core.xla_model as xm

    XLA_AVAILABLE = True
else:
    XLA_AVAILABLE = False

EXAMPLE_DOC_STRING = """
    Examples:
        ```py
        >>> import torch
        >>> from diffusers import AmusedImg2ImgPipeline
        >>> from diffusers.utils import load_image

        >>> pipe = AmusedImg2ImgPipeline.from_pretrained(
        ...     "amused/amused-512", variant="fp16", torch_dtype=torch.float16
        ... )
        >>> pipe = pipe.to("cuda")

        >>> prompt = "winter mountains"
        >>> input_image = (
        ...     load_image(
        ...         "https://huggingface.co/datasets/diffusers/docs-images/resolve/main/open_muse/mountains.jpg"
        ...     )
        ...     .resize((512, 512))
        ...     .convert("RGB")
        ... )
        >>> image = pipe(prompt, input_image).images[0]
        ```
"""


class AmusedImg2ImgPipeline(DeprecatedPipelineMixin, DiffusionPipeline):
    _last_supported_version = "0.33.1"

    image_processor: VaeImageProcessor
    vqvae: VQModel
    tokenizer: CLIPTokenizer
    text_encoder: CLIPTextModelWithProjection
    transformer: UVit2DModel
    scheduler: AmusedScheduler

    model_cpu_offload_seq = "text_encoder->transformer->vqvae"

    # `vqvae.quantize` reads its embedding weights outside of a regular forward call, so the offload
    # hooks cannot move them back off the meta device; keep the VQ-VAE out of CPU offload.
    _exclude_from_cpu_offload = ["vqvae"]

    def __init__(
        self,
        vqvae: VQModel,
        tokenizer: CLIPTokenizer,
        text_encoder: CLIPTextModelWithProjection,
        transformer: UVit2DModel,
        scheduler: AmusedScheduler,
    ):
        super().__init__()

        self.register_modules(
            vqvae=vqvae,
            tokenizer=tokenizer,
            text_encoder=text_encoder,
            transformer=transformer,
            scheduler=scheduler,
        )
        self.vae_scale_factor = (
            2 ** (len(self.vqvae.config.block_out_channels) - 1) if getattr(self, "vqvae", None) else 8
        )
        self.image_processor = VaeImageProcessor(vae_scale_factor=self.vae_scale_factor, do_normalize=False)

    @torch.no_grad()
    @replace_example_docstring(EXAMPLE_DOC_STRING)
    def __call__(
        self,
        prompt: Optional[Union[List[str], str]] = None,
        image: PipelineImageInput = None,
        strength: float = 0.5,
        num_inference_steps: int = 12,
        guidance_scale: float = 10.0,
        negative_prompt: Optional[Union[str, List[str]]] = None,
        num_images_per_prompt: Optional[int] = 1,
        generator: Optional[torch.Generator] = None,
        prompt_embeds: Optional[torch.Tensor] = None,
        encoder_hidden_states: Optional[torch.Tensor] = None,
        negative_prompt_embeds: Optional[torch.Tensor] = None,
        negative_encoder_hidden_states: Optional[torch.Tensor] = None,
        output_type="pil",
        return_dict: bool = True,
        callback: Optional[Callable[[int, int, torch.Tensor], None]] = None,
        callback_steps: int = 1,
        cross_attention_kwargs: Optional[Dict[str, Any]] = None,
        micro_conditioning_aesthetic_score: int = 6,
        micro_conditioning_crop_coord: Tuple[int, int] = (0, 0),
        temperature: Union[int, Tuple[int, int], List[int]] = (2, 0),
    ):
        r"""
        The call function to the pipeline for generation.

        Args:
            prompt (`str` or `List[str]`, *optional*):
                The prompt or prompts to guide image generation. If not defined, you need to pass `prompt_embeds`.
            image (`torch.Tensor`, `PIL.Image.Image`, `np.ndarray`, `List[torch.Tensor]`, `List[PIL.Image.Image]`, or `List[np.ndarray]`):
                `Image`, numpy array or tensor representing an image batch to be used as the starting point. For both
                numpy array and pytorch tensor, the expected value range is between `[0, 1]`. If it's a tensor or a
                list of tensors, the expected shape should be `(B, C, H, W)` or `(C, H, W)`. If it is a numpy array or
                a list of arrays, the expected shape should be `(B, H, W, C)` or `(H, W, C)`. It can also accept image
                latents as `image`, but if passing latents directly it is not encoded again.
            strength (`float`, *optional*, defaults to 0.5):
                Indicates the extent to transform the reference `image`. Must be between 0 and 1. `image` is used as a
                starting point and more noise is added the higher the `strength`. The number of denoising steps depends
                on the amount of noise initially added. When `strength` is 1, added noise is maximum and the denoising
                process runs for the full number of iterations specified in `num_inference_steps`. A value of 1
                essentially ignores `image`.
            num_inference_steps (`int`, *optional*, defaults to 12):
                The number of denoising steps. More denoising steps usually lead to a higher quality image at the
                expense of slower inference.
            guidance_scale (`float`, *optional*, defaults to 10.0):
                A higher guidance scale value encourages the model to generate images closely linked to the text
                `prompt` at the expense of lower image quality. Guidance scale is enabled when `guidance_scale > 1`.
            negative_prompt (`str` or `List[str]`, *optional*):
                The prompt or prompts to guide what to not include in image generation. If not defined, you need to
                pass `negative_prompt_embeds` instead. Ignored when not using guidance (`guidance_scale < 1`).
            num_images_per_prompt (`int`, *optional*, defaults to 1):
                The number of images to generate per prompt.
            generator (`torch.Generator`, *optional*):
                A [`torch.Generator`](https://pytorch.org/docs/stable/generated/torch.Generator.html) to make
                generation deterministic.
            prompt_embeds (`torch.Tensor`, *optional*):
                Pre-generated text embeddings. Can be used to easily tweak text inputs (prompt weighting). If not
                provided, text embeddings are generated from the `prompt` input argument. A single vector from the
                pooled and projected final hidden states.
            encoder_hidden_states (`torch.Tensor`, *optional*):
                Pre-generated penultimate hidden states from the text encoder providing additional text conditioning.
            negative_prompt_embeds (`torch.Tensor`, *optional*):
                Pre-generated negative text embeddings. Can be used to easily tweak text inputs (prompt weighting). If
                not provided, `negative_prompt_embeds` are generated from the `negative_prompt` input argument.
            negative_encoder_hidden_states (`torch.Tensor`, *optional*):
                Analogous to `encoder_hidden_states` for the positive prompt.
            output_type (`str`, *optional*, defaults to `"pil"`):
                The output format of the generated image. Choose between `PIL.Image` or `np.array`.
            return_dict (`bool`, *optional*, defaults to `True`):
                Whether or not to return an [`~pipelines.pipeline_utils.ImagePipelineOutput`] instead of a plain
                tuple.
            callback (`Callable`, *optional*):
                A function that is called every `callback_steps` steps during inference. The function is called with
                the following arguments: `callback(step: int, timestep: int, latents: torch.Tensor)`.
            callback_steps (`int`, *optional*, defaults to 1):
                The frequency at which the `callback` function is called. If not specified, the callback is called at
                every step.
            cross_attention_kwargs (`dict`, *optional*):
                A kwargs dictionary that, if specified, is passed along to the [`AttentionProcessor`] as defined in
                [`self.processor`](https://github.com/huggingface/diffusers/blob/main/src/diffusers/models/attention_processor.py).
            micro_conditioning_aesthetic_score (`int`, *optional*, defaults to 6):
                The targeted aesthetic score according to the LAION aesthetic classifier. See
                https://laion.ai/blog/laion-aesthetics/ and the micro-conditioning section of
                https://huggingface.co/papers/2307.01952.
            micro_conditioning_crop_coord (`Tuple[int]`, *optional*, defaults to (0, 0)):
                The targeted height, width crop coordinates. See the micro-conditioning section of
                https://huggingface.co/papers/2307.01952.
            temperature (`Union[int, Tuple[int, int], List[int]]`, *optional*, defaults to (2, 0)):
                Configures the temperature scheduler on `self.scheduler`; see `AmusedScheduler#set_timesteps`.

        Examples:

        Returns:
            [`~pipelines.pipeline_utils.ImagePipelineOutput`] or `tuple`:
                If `return_dict` is `True`, [`~pipelines.pipeline_utils.ImagePipelineOutput`] is returned, otherwise a
                `tuple` is returned where the first element is a list with the generated images.
        """
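        # Added note (worked example, assuming `set_timesteps` yields exactly `num_inference_steps`
        # timesteps, as `AmusedScheduler` does): with the defaults num_inference_steps=12 and
        # strength=0.5, the loop below runs int(12 * 0.5) = 6 denoising steps, starting at timestep
        # index 12 - 6 = 6 of the schedule.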
        if (prompt_embeds is not None and encoder_hidden_states is None) or (
            prompt_embeds is None and encoder_hidden_states is not None
        ):
            raise ValueError("pass either both `prompt_embeds` and `encoder_hidden_states` or neither")

        if (negative_prompt_embeds is not None and negative_encoder_hidden_states is None) or (
            negative_prompt_embeds is None and negative_encoder_hidden_states is not None
        ):
            raise ValueError(
                "pass either both `negative_prompt_embeds` and `negative_encoder_hidden_states` or neither"
            )

        if (prompt is None and prompt_embeds is None) or (prompt is not None and prompt_embeds is not None):
            raise ValueError("pass only one of `prompt` or `prompt_embeds`")

        if isinstance(prompt, str):
            prompt = [prompt]

        if prompt is not None:
            batch_size = len(prompt)
        else:
            batch_size = prompt_embeds.shape[0]

        batch_size = batch_size * num_images_per_prompt

        # Encode the prompt (pooled embedding + penultimate hidden states) unless embeddings were passed in.
        if prompt_embeds is None:
            input_ids = self.tokenizer(
                prompt,
                return_tensors="pt",
                padding="max_length",
                truncation=True,
                max_length=self.tokenizer.model_max_length,
            ).input_ids.to(self._execution_device)

            outputs = self.text_encoder(input_ids, return_dict=True, output_hidden_states=True)
            prompt_embeds = outputs.text_embeds
            encoder_hidden_states = outputs.hidden_states[-2]

        prompt_embeds = prompt_embeds.repeat(num_images_per_prompt, 1)
        encoder_hidden_states = encoder_hidden_states.repeat(num_images_per_prompt, 1, 1)

        if guidance_scale > 1.0:
            if negative_prompt_embeds is None:
                if negative_prompt is None:
                    negative_prompt = [""] * len(prompt)

                if isinstance(negative_prompt, str):
                    negative_prompt = [negative_prompt]

                input_ids = self.tokenizer(
                    negative_prompt,
                    return_tensors="pt",
                    padding="max_length",
                    truncation=True,
                    max_length=self.tokenizer.model_max_length,
                ).input_ids.to(self._execution_device)

                outputs = self.text_encoder(input_ids, return_dict=True, output_hidden_states=True)
                negative_prompt_embeds = outputs.text_embeds
                negative_encoder_hidden_states = outputs.hidden_states[-2]

            negative_prompt_embeds = negative_prompt_embeds.repeat(num_images_per_prompt, 1)
            negative_encoder_hidden_states = negative_encoder_hidden_states.repeat(num_images_per_prompt, 1, 1)

            prompt_embeds = torch.concat([negative_prompt_embeds, prompt_embeds])
            encoder_hidden_states = torch.concat([negative_encoder_hidden_states, encoder_hidden_states])

        image = self.image_processor.preprocess(image)

        height, width = image.shape[-2:]

        # Note that the micro conditionings _do_ flip the order of width, height for the original size
        # and the crop coordinates. This is how it was done in the original code base.
        micro_conds = torch.tensor(
            [
                width,
                height,
                micro_conditioning_crop_coord[0],
                micro_conditioning_crop_coord[1],
                micro_conditioning_aesthetic_score,
            ],
            device=self._execution_device,
            dtype=encoder_hidden_states.dtype,
        )

        micro_conds = micro_conds.unsqueeze(0)
        micro_conds = micro_conds.expand(2 * batch_size if guidance_scale > 1.0 else batch_size, -1)

        self.scheduler.set_timesteps(num_inference_steps, temperature, self._execution_device)
        num_inference_steps = int(len(self.scheduler.timesteps) * strength)
        start_timestep_idx = len(self.scheduler.timesteps) - num_inference_steps

        needs_upcasting = self.vqvae.dtype == torch.float16 and self.vqvae.config.force_upcast

        if needs_upcasting:
            self.vqvae.float()

        # Encode the input image to VQ token ids and partially mask them according to `strength`.
        latents = self.vqvae.encode(image.to(dtype=self.vqvae.dtype, device=self._execution_device)).latents
        latents_bsz, channels, latents_height, latents_width = latents.shape
        latents = self.vqvae.quantize(latents)[2][2].reshape(latents_bsz, latents_height, latents_width)
        latents = self.scheduler.add_noise(
            latents, self.scheduler.timesteps[start_timestep_idx - 1], generator=generator
        )
        latents = latents.repeat(num_images_per_prompt, 1, 1)

        with self.progress_bar(total=num_inference_steps) as progress_bar:
            for i in range(start_timestep_idx, len(self.scheduler.timesteps)):
                timestep = self.scheduler.timesteps[i]

                if guidance_scale > 1.0:
                    model_input = torch.cat([latents] * 2)
                else:
                    model_input = latents

                model_output = self.transformer(
                    model_input,
                    micro_conds=micro_conds,
                    pooled_text_emb=prompt_embeds,
                    encoder_hidden_states=encoder_hidden_states,
                    cross_attention_kwargs=cross_attention_kwargs,
                )

                if guidance_scale > 1.0:
                    uncond_logits, cond_logits = model_output.chunk(2)
                    model_output = uncond_logits + guidance_scale * (cond_logits - uncond_logits)

                latents = self.scheduler.step(
                    model_output=model_output,
                    timestep=timestep,
                    sample=latents,
                    generator=generator,
                ).prev_sample

                if i == len(self.scheduler.timesteps) - 1 or ((i + 1) % self.scheduler.order == 0):
                    progress_bar.update()
                    if callback is not None and i % callback_steps == 0:
                        step_idx = i // getattr(self.scheduler, "order", 1)
                        callback(step_idx, timestep, latents)

                if XLA_AVAILABLE:
                    xm.mark_step()

        if output_type == "latent":
            output = latents
        else:
            output = self.vqvae.decode(
                latents,
                force_not_quantize=True,
                shape=(
                    batch_size,
                    height // self.vae_scale_factor,
                    width // self.vae_scale_factor,
                    self.vqvae.config.latent_channels,
                ),
            ).sample.clip(0, 1)
            output = self.image_processor.postprocess(output, output_type)

        # cast back to fp16 if needed
        if needs_upcasting:
            self.vqvae.half()

        self.maybe_free_model_hooks()

        if not return_dict:
            return (output,)

        return ImagePipelineOutput(output)