+
    ~j8                         R t ^ RIHt ^RIHt ^RIHt ^RIHt ^RI	H
t
 ]! RR7      ] ! R R	]4      4       4       tR	.tR
# )zLLaMA model configuration)strict)PreTrainedConfig)RopeParameters)auto_docstring)intervalzmeta-llama/Llama-2-7b-hf)
checkpointc                     a a ] tR t^t oRtRtR.tRRRRRRRR	R
RRRRR	/tRR.R.3RRR.R.3RR.R.3/tRt	Rt
Rt^ t^ tRtRtRt]! RRR7      ! RR7      tRtR tRt^t^t^tR!tRtR!tRtR!tRtV 3R" ltR# t V3R$ lt!R%t"Vt#V ;t$# )&LlamaConfigaP  
```python
>>> from transformers import LlamaModel, LlamaConfig

>>> # Initializing a LLaMA llama-7b style configuration
>>> configuration = LlamaConfig()

>>> # Initializing a model from the llama-7b style configuration
>>> model = LlamaModel(configuration)

>>> # Accessing the model configuration
>>> configuration = model.config
```llamapast_key_valueszlayers.*.self_attn.q_projcolwisezlayers.*.self_attn.k_projzlayers.*.self_attn.v_projzlayers.*.self_attn.o_projrowwisezlayers.*.mlp.gate_projzlayers.*.mlp.up_projzlayers.*.mlp.down_projembed_tokens	input_idsinputs_embedslayershidden_statesattention_masknormi }  i   i +  Nsilui   g        g      ?)minmaxg{Gz?)defaultgư>TFc                   < V P                   f#   V P                  V P                  ,          V n         V P                  f   V P                  V n        \        SV `  ! R/ VB  R # )N )head_dimhidden_sizenum_attention_headsnum_key_value_headssuper__post_init__)selfkwargs	__class__s   &,ڂ/Users/mitch_tango/dev/rabbit-r1-livekit/agent/.venv/lib/python3.14/site-packages/transformers/models/llama/configuration_llama.pyr    LlamaConfig.__post_init__V   sO    ==  ,,0H0HHDM##+'+'?'?D$''    c                    V P                   V P                  ,          ^ 8w  d'   \        RV P                    RV P                   R24      hR# )zOPart of `@strict`-powered validation. Validates the architecture of the config.zThe hidden size (z6) is not a multiple of the number of attention heads (z).N)r   r   
ValueError)r!   s   &r$   validate_architecture!LlamaConfig.validate_architecture^   sS    d666!;#D$4$4#5 622327  <r&   c                  < V ^8  d   Qh/ S[ ;R&   S[ ;R&   S[ ;R&   S[ ;R&   S[ ;R&   S[ R,          ;R&   S[;R&   S[ ;R	&   S[;R
&   S[;R&   S[;R&   S[ R,          ;R&   S[ R,          ;R&   S[ S[S[ ,          ,          R,          ;R&   S[ R,          ;R&   S[;R&   S[S[,          R,          ;R&   S[;R&   S[ S[,          R,          ;R&   S[;R&   S[ R,          ;R&   # )   
vocab_sizer   intermediate_sizenum_hidden_layersr   Nr   
hidden_actmax_position_embeddingsinitializer_rangerms_norm_eps	use_cachepad_token_idbos_token_ideos_token_idpretraining_tptie_word_embeddingsrope_parametersattention_biasattention_dropoutmlp_biasr   )intstrfloatboollistr   dict)format__classdict__s   "r$   __annotate__LlamaConfig.__annotate__   st    F G H I J "K L M N !O P t*Q R S T !'U V GW X Y Z [ \ *#] ^ * _ ` S	/D(,a b $J"c d %e f $d*T18g h  i j U{T)/k l m n Djo r&   )r   r   )%__name__
__module____qualname____firstlineno____doc__
model_typekeys_to_ignore_at_inferencebase_model_tp_planbase_model_pp_planr-   r   r.   r/   r   r   r0   r1   r   r2   r3   r4   r5   r6   r7   r8   r9   r:   r;   r<   r=   r   r    r)   __annotate_func____static_attributes____classdictcell____classcell__)r#   rE   s   @@r$   r	   r	      s     J#4"5 	$Y#Y#Y#Y )	 ) 	+(9:O%568IJ/"_$56 JK"!&*J#''CS9$GLI#L L+,L!"N %48O N,/HH(C  r&   r	   N)rL   huggingface_hub.dataclassesr   configuration_utilsr   modeling_rope_utilsr   utilsr   utils.type_validatorsr   r	   __all__r   r&   r$   <module>r[      sP   &   . 3 1 # - 56E" E  7EP /r&   