
from typing import Optional, Tuple, Union

import torch

from ...cache_utils import Cache
from ...modeling_flash_attention_utils import FlashAttentionKwargs
from ...modeling_layers import GradientCheckpointingLayer
from ...modeling_outputs import CausalLMOutputWithPast
from ...processing_utils import Unpack
from ...utils import LossKwargs, logging
from ..glm.modeling_glm import (
    GlmAttention,
    GlmForCausalLM,
    GlmForSequenceClassification,
    GlmForTokenClassification,
)
from ..phi3.modeling_phi3 import Phi3MLP
from .configuration_glm4 import Glm4Config
from .modeling_glm4 import Glm4RMSNorm


logger = logging.get_logger(__name__)

_CHECKPOINT_FOR_DOC = "THUDM/GLM-4-9B-Chat-0414"


class Glm4MLP(Phi3MLP):
    pass


class Glm4DecoderLayer(GradientCheckpointingLayer):
    def __init__(self, config: Glm4Config, layer_idx: int):
        super().__init__()
        self.hidden_size = config.hidden_size
        self.self_attn = Glm4Attention(config=config, layer_idx=layer_idx)
        self.mlp = Glm4MLP(config)
        self.input_layernorm = Glm4RMSNorm(config.hidden_size, eps=config.rms_norm_eps)
        self.post_attention_layernorm = Glm4RMSNorm(config.hidden_size, eps=config.rms_norm_eps)
        self.post_self_attn_layernorm = Glm4RMSNorm(config.hidden_size, eps=config.rms_norm_eps)
        self.post_mlp_layernorm = Glm4RMSNorm(config.hidden_size, eps=config.rms_norm_eps)

    def forward(
        self,
        hidden_states: torch.Tensor,
        attention_mask: Optional[torch.Tensor] = None,
        position_ids: Optional[torch.LongTensor] = None,
        past_key_value: Optional[Cache] = None,
        output_attentions: Optional[bool] = False,
        use_cache: Optional[bool] = False,
        cache_position: Optional[torch.LongTensor] = None,
        position_embeddings: Optional[Tuple[torch.Tensor, torch.Tensor]] = None,
        **kwargs: Unpack[FlashAttentionKwargs],
    ) -> Tuple[torch.FloatTensor, Optional[Tuple[torch.FloatTensor, torch.FloatTensor]]]:
        residual = hidden_states

        hidden_states = self.input_layernorm(hidden_states)

        # Self-attention sub-block, followed by an extra post-attention RMSNorm
        # before the residual addition.
        hidden_states, self_attn_weights = self.self_attn(
            hidden_states=hidden_states,
            attention_mask=attention_mask,
            position_ids=position_ids,
            past_key_value=past_key_value,
            output_attentions=output_attentions,
            use_cache=use_cache,
            cache_position=cache_position,
            position_embeddings=position_embeddings,
            **kwargs,
        )
        hidden_states = self.post_self_attn_layernorm(hidden_states)
        hidden_states = residual + hidden_states

        # MLP sub-block, likewise wrapped in a pre-norm and a post-norm.
        residual = hidden_states
        hidden_states = self.post_attention_layernorm(hidden_states)
        hidden_states = self.mlp(hidden_states)
        hidden_states = self.post_mlp_layernorm(hidden_states)
        hidden_states = residual + hidden_states

        outputs = (hidden_states,)
        if output_attentions:
            outputs += (self_attn_weights,)

        return outputs


class Glm4Attention(GlmAttention):
    pass


class KwargsForCausalLM(FlashAttentionKwargs, LossKwargs): ...


class Glm4ForCausalLM(GlmForCausalLM):
    def forward(
        self,
        **super_kwargs: Unpack[KwargsForCausalLM],
    ) -> Union[Tuple, CausalLMOutputWithPast]:
        r"""
labels (`torch.LongTensor` of shape `(batch_size, sequence_length)`, *optional*):
    Labels for computing the masked language modeling loss. Indices should either be in `[0, ...,
    config.vocab_size]` or -100 (see `input_ids` docstring). Tokens with indices set to `-100` are ignored
    (masked), the loss is only computed for the tokens with labels in `[0, ..., config.vocab_size]`.

Example:

```python
>>> from transformers import AutoTokenizer, Glm4ForCausalLM

>>> model = Glm4ForCausalLM.from_pretrained("THUDM/GLM-4-9B-Chat-0414")
>>> tokenizer = AutoTokenizer.from_pretrained("THUDM/GLM-4-9B-Chat-0414")

>>> prompt = "Hey, are you conscious? Can you talk to me?"
>>> inputs = tokenizer(prompt, return_tensors="pt")

>>> # Generate
>>> generate_ids = model.generate(inputs.input_ids, max_length=30)
>>> tokenizer.batch_decode(generate_ids, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]
"Hey, are you conscious? Can you talk to me?\nI'm not conscious, but I can talk to you."
```"""
        return super().forward(**super_kwargs)


class Glm4ForSequenceClassification(GlmForSequenceClassification):
    pass


class Glm4ForTokenClassification(GlmForTokenClassification):
    pass


__all__ = [
    "Glm4PreTrainedModel",
    "Glm4Model",
    "Glm4ForCausalLM",
    "Glm4ForSequenceClassification",
    "Glm4ForTokenClassification",
]
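

# ---------------------------------------------------------------------------
# Illustrative sketch only, not part of the library: Glm4DecoderLayer above
# uses a "sandwich" pattern in which each sub-block (self-attention, MLP) is
# wrapped in a pre-RMSNorm *and* an extra post-RMSNorm before the residual
# addition. The toy shapes and the Linear stand-in for the sub-block are
# assumptions chosen only to make the pattern concrete; nn.RMSNorm
# (PyTorch >= 2.4) stands in for Glm4RMSNorm here.
if __name__ == "__main__":
    from torch import nn

    hidden_size = 8
    x = torch.randn(2, 4, hidden_size)  # (batch, seq_len, hidden)

    pre_norm = nn.RMSNorm(hidden_size)   # role of input_layernorm
    post_norm = nn.RMSNorm(hidden_size)  # role of post_self_attn_layernorm
    sub_block = nn.Linear(hidden_size, hidden_size)  # stand-in for self_attn / mlp

    residual = x
    out = pre_norm(x)
    out = sub_block(out)
    out = post_norm(out)
    out = residual + out
    print(out.shape)  # torch.Size([2, 4, 8])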