Skip to content

Commit 0411151

Browse files
committed
Add large variations of electra in presets
1 parent b268e26 commit 0411151

File tree

2 files changed

+32
-4
lines changed

2 files changed

+32
-4
lines changed

keras_nlp/models/electra/electra_presets.py

Lines changed: 30 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
"path": "electra",
2626
"model_card": "https://github.com/google-research/electra",
2727
},
28-
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_base_discriminator_en/1",
28+
"kaggle_handle": "kaggle://keras/electra/keras/electra_base_discriminator_en/1",
2929
},
3030
"electra_small_discriminator_en": {
3131
"metadata": {
@@ -38,7 +38,7 @@
3838
"path": "electra",
3939
"model_card": "https://github.com/google-research/electra",
4040
},
41-
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_small_discriminator_en/1",
41+
"kaggle_handle": "kaggle://keras/electra/keras/electra_small_discriminator_en/1",
4242
},
4343
"electra_small_generator_en": {
4444
"metadata": {
@@ -51,7 +51,7 @@
5151
"path": "electra",
5252
"model_card": "https://github.com/google-research/electra",
5353
},
54-
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_small_generator_en/1",
54+
"kaggle_handle": "kaggle://keras/electra/keras/electra_small_generator_en/1",
5555
},
5656
"electra_base_generator_en": {
5757
"metadata": {
@@ -64,6 +64,32 @@
6464
"path": "electra",
6565
"model_card": "https://github.com/google-research/electra",
6666
},
67-
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_base_generator_en/1",
67+
"kaggle_handle": "kaggle://keras/electra/keras/electra_base_generator_en/1",
68+
},
69+
"electra_large_generator_en": {
70+
"metadata": {
71+
"description": (
72+
"ELECTRA: Pre-training Text Encoders as Discriminators Rather Than Generators. "
73+
"This is a large generator model with 24 layers."
74+
),
75+
"params": 51065344,
76+
"official_name": "ELECTRA",
77+
"path": "electra",
78+
"model_card": "https://github.com/google-research/electra",
79+
},
80+
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_large_generator_en/1",
81+
},
82+
"electra_large_discriminator_en": {
83+
"metadata": {
84+
"description": (
85+
"ELECTRA: Pre-training Text Encoders as Discriminators Rather Than Generators"
86+
"This is large discriminator model with 24 layers."
87+
),
88+
"params": 335141888,
89+
"official_name": "ELECTRA",
90+
"path": "electra",
91+
"model_card": "https://github.com/google-research/electra",
92+
},
93+
"kaggle_handle": "kaggle://pranavprajapati16/electra/keras/electra_large_discriminator_en/1",
6894
},
6995
}

tools/checkpoint_conversion/convert_electra_checkpoints.py

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,8 @@
3737
"electra_small_generator_en": "google/electra-small-generator",
3838
"electra_base_discriminator_en": "google/electra-base-discriminator",
3939
"electra_small_discriminator_en": "google/electra-small-discriminator",
40+
"electra_large_discriminator_en": "google/electra-large-discriminator",
41+
"electra_large_generator_en": "google/electra-large-generator",
4042
}
4143

4244
EXTRACT_DIR = "./model"

0 commit comments

Comments
 (0)