File tree Expand file tree Collapse file tree
tests/conversion/test_configs Expand file tree Collapse file tree Original file line number Diff line number Diff line change 1313 ffn_hidden : 1024
1414 n_embd : 768
1515 dropout : 0.0
16- bias : false # true # True: bias in Linears, like GPT-2. False: a bit better and faster
16+ bias : false # True: bias in Linears, like GPT-2. False: a bit better and faster
1717 attention_config :
1818 qkv_transforms :
1919 - type_hint : RotaryTransform
@@ -30,21 +30,21 @@ model:
3030 config :
3131 normalized_shape : ${model.config.n_embd}
3232 eps : 1e-5
33- # bias: true
33+ bias : true
3434 ffn_norm :
3535 component_key : layer_norm
3636 variant_key : layer_norm
3737 config :
3838 normalized_shape : ${model.config.n_embd}
3939 eps : 1e-5
40- # bias: true
40+ bias : false
4141 lm_head_norm :
4242 component_key : layer_norm
4343 variant_key : layer_norm
4444 config :
4545 normalized_shape : ${model.config.n_embd}
4646 eps : 1e-5
47- # bias: true
47+ bias : true
4848
4949checkpointed_model :
5050 component_key : model
You can’t perform that action at this time.
0 commit comments