small fix on idefics (#954)

transposing the fixes from
https://github.com/huggingface/transformers/pull/25787
Victor SANH 2023-09-01 12:44:34 -04:00 committed by GitHub
parent 4f5d93ecd0
commit 2bc287bfcd
1 changed file with 2 additions and 2 deletions

@@ -51,7 +51,7 @@ class IdeficsVisionConfig(PretrainedConfig):
             Number of attention heads for each attention layer in the Transformer encoder.
         image_num_channels (`int`, *optional*, defaults to `3`):
             Number of image channels.
-        hidden_act (`str` or `function`, *optional*, defaults to `"quick_gelu"`):
+        hidden_act (`str` or `function`, *optional*, defaults to `"gelu"`):
             The non-linear activation function (function or string) in the encoder and pooler. If string, `"gelu"`,
             `"relu"`, `"selu"` and `"gelu_new"` ``"quick_gelu"` are supported.
         layer_norm_eps (`float`, *optional*, defaults to 1e-5):
@@ -80,7 +80,7 @@ class IdeficsVisionConfig(PretrainedConfig):
         num_hidden_layers=32,
         num_attention_heads=16,
         num_channels=3,
-        hidden_act="quick_gelu",
+        hidden_act="gelu",
         layer_norm_eps=1e-5,
         attention_dropout=0.0,
         initializer_range=0.02,
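
For context, the practical effect of this change is that a freshly constructed vision config now defaults to the standard GELU activation rather than `quick_gelu`. A minimal sketch of checking the new default, assuming the upstream Transformers `IdeficsVisionConfig` (this view does not show which file the commit actually touched):

# Minimal sketch: verify the new default activation.
# The import path is an assumption; the changed file's path is not shown in this diff.
from transformers.models.idefics.configuration_idefics import IdeficsVisionConfig

config = IdeficsVisionConfig()
# Before this commit the default was "quick_gelu"; it now matches
# https://github.com/huggingface/transformers/pull/25787.
print(config.hidden_act)  # -> "gelu"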