Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
Show all changes
27 commits
Select commit Hold shift + click to select a range
62eaf03
Start landing code for Kaggle integration (#1320)
mattdangerw Nov 20, 2023
21fb04c
Switch byte pair tokenizer to save_assets/load_assets (#1322)
mattdangerw Nov 21, 2023
0e3c674
Convert SentencePieceTokenizer and associated models to new assets pa…
nkovela1 Nov 21, 2023
3619a6a
Add tests for Presets workflow, Add Metadata (#1326)
nkovela1 Nov 23, 2023
38806fd
Automatically add the keras framework to kaggle handles (#1331)
mattdangerw Nov 29, 2023
e0d34dc
Fix a failing byte pair tokenizer test (#1336)
mattdangerw Nov 30, 2023
0820d62
Use set comparison for assets (#1335)
mattdangerw Nov 30, 2023
c4b0c3c
Fix whisper tokenizer saving (#1334)
mattdangerw Nov 30, 2023
e3f8d06
Remove special case Bart from_preset (#1333)
mattdangerw Nov 30, 2023
dbb6487
Fix t5 tokenizer presets (#1339)
mattdangerw Nov 30, 2023
6130253
Script to convert presets (#1340)
mattdangerw Nov 30, 2023
814959b
Switch all preset to the new Kaggle format (#1338)
mattdangerw Dec 1, 2023
2aced24
Let kagglehub select latest version (#1342)
mattdangerw Dec 4, 2023
245b7e9
Use the proper title for example (#1346)
Philmod Dec 5, 2023
6ad8a30
Update conversion script (#1347)
mattdangerw Dec 6, 2023
7cc4323
Improve preset error messages (#1349)
mattdangerw Dec 7, 2023
9cc8110
Use subclass checking check_preset_class (#1344)
mattdangerw Dec 7, 2023
4606f32
Add a hacky fix for TF 2.13 and 2.14 weights.h5 loading (#1353)
mattdangerw Dec 7, 2023
9cb5838
Another fix for saving on Keras 2 (#1354)
mattdangerw Dec 7, 2023
039ff45
Switch our preset to their final kaggle location (#1345)
mattdangerw Dec 7, 2023
9cc3f84
Fix rebase issue in bytepair tokenizer (#1366)
nkovela1 Dec 12, 2023
6f7f9a0
Change encoding to utf-8 to fix Kaggle branch test failure for PyTorc…
sampathweb Dec 13, 2023
ddfca77
Fix GPU test issue with Keras 2 (#1368)
nkovela1 Dec 14, 2023
0e43f09
Add in-place modification of file keys for backwards compatibility (#…
nkovela1 Dec 15, 2023
4d84eb1
Add file renaming logic for modification (#1370)
nkovela1 Dec 16, 2023
29a0ae5
Fix task pre-processor in tasks (#1373)
sampathweb Dec 20, 2023
401e569
Backwards compatible fix for functional model saving (#1378)
mattdangerw Jan 4, 2024
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
Prev Previous commit
Next Next commit
Switch our preset to their final kaggle location (#1345)
  • Loading branch information
mattdangerw committed Jan 4, 2024
commit 039ff4520bde904999ae6246309712a68a8ec85b
8 changes: 4 additions & 4 deletions keras_nlp/models/albert/albert_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/albert_base_en_uncased",
"kaggle_handle": "kaggle://keras/albert/albert_base_en_uncased/1",
},
"albert_large_en_uncased": {
"metadata": {
Expand All @@ -39,7 +39,7 @@
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/albert_large_en_uncased",
"kaggle_handle": "kaggle://keras/albert/albert_large_en_uncased/1",
},
"albert_extra_large_en_uncased": {
"metadata": {
Expand All @@ -52,7 +52,7 @@
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/albert_extra_large_en_uncased",
"kaggle_handle": "kaggle://keras/albert/albert_extra_large_en_uncased/1",
},
"albert_extra_extra_large_en_uncased": {
"metadata": {
Expand All @@ -65,6 +65,6 @@
"path": "albert",
"model_card": "https://github.com/google-research/albert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/albert_extra_extra_large_en_uncased",
"kaggle_handle": "kaggle://keras/albert/albert_extra_extra_large_en_uncased/1",
},
}
6 changes: 3 additions & 3 deletions keras_nlp/models/bart/bart_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"path": "bart",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/bart/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bart_base_en",
"kaggle_handle": "kaggle://keras/bart/bart_base_en/1",
},
"bart_large_en": {
"metadata": {
Expand All @@ -47,7 +47,7 @@
"dropout": 0.1,
"max_sequence_length": 1024,
},
"kaggle_handle": "gs://keras-nlp-kaggle/bart_large_en",
"kaggle_handle": "kaggle://keras/bart/bart_large_en/1",
},
"bart_large_en_cnn": {
"metadata": {
Expand All @@ -69,6 +69,6 @@
"dropout": 0.1,
"max_sequence_length": 1024,
},
"kaggle_handle": "gs://keras-nlp-kaggle/bart_large_en_cnn",
"kaggle_handle": "kaggle://keras/bart/bart_large_en_cnn/1",
},
}
22 changes: 10 additions & 12 deletions keras_nlp/models/bert/bert_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,8 +13,6 @@
# limitations under the License.
"""BERT model preset configurations."""

# TODO(jbischof): document presets in keras.io and use URL in docstrings
# Metadata for loading pretrained model weights.
backbone_presets = {
"bert_tiny_en_uncased": {
"metadata": {
Expand All @@ -27,7 +25,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_tiny_en_uncased",
"kaggle_handle": "kaggle://keras/bert/bert_tiny_en_uncased/1",
},
"bert_small_en_uncased": {
"metadata": {
Expand All @@ -40,7 +38,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_small_en_uncased",
"kaggle_handle": "kaggle://keras/bert/bert_small_en_uncased/1",
},
"bert_medium_en_uncased": {
"metadata": {
Expand All @@ -53,7 +51,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_medium_en_uncased",
"kaggle_handle": "kaggle://keras/bert/bert_medium_en_uncased/1",
},
"bert_base_en_uncased": {
"metadata": {
Expand All @@ -66,7 +64,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_base_en_uncased",
"kaggle_handle": "kaggle://keras/bert/bert_base_en_uncased/1",
},
"bert_base_en": {
"metadata": {
Expand All @@ -79,7 +77,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_base_en",
"kaggle_handle": "kaggle://keras/bert/bert_base_en/1",
},
"bert_base_zh": {
"metadata": {
Expand All @@ -91,7 +89,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_base_zh",
"kaggle_handle": "kaggle://keras/bert/bert_base_zh/1",
},
"bert_base_multi": {
"metadata": {
Expand All @@ -103,7 +101,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_base_multi",
"kaggle_handle": "kaggle://keras/bert/bert_base_multi/1",
},
"bert_large_en_uncased": {
"metadata": {
Expand All @@ -116,7 +114,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_large_en_uncased",
"kaggle_handle": "kaggle://keras/bert/bert_large_en_uncased/1",
},
"bert_large_en": {
"metadata": {
Expand All @@ -129,7 +127,7 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_large_en",
"kaggle_handle": "kaggle://keras/bert/bert_large_en/1",
},
}

Expand All @@ -144,6 +142,6 @@
"path": "bert",
"model_card": "https://github.com/google-research/bert/blob/master/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/bert_tiny_en_uncased_sst2",
"kaggle_handle": "kaggle://keras/bert/bert_tiny_en_uncased_sst2/1",
}
}
10 changes: 5 additions & 5 deletions keras_nlp/models/deberta_v3/deberta_v3_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-xsmall",
},
"kaggle_handle": "gs://keras-nlp-kaggle/deberta_v3_extra_small_en",
"kaggle_handle": "kaggle://keras/deberta_v3/deberta_v3_extra_small_en/1",
},
"deberta_v3_small_en": {
"metadata": {
Expand All @@ -38,7 +38,7 @@
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-small",
},
"kaggle_handle": "gs://keras-nlp-kaggle/deberta_v3_small_en",
"kaggle_handle": "kaggle://keras/deberta_v3/deberta_v3_small_en/1",
},
"deberta_v3_base_en": {
"metadata": {
Expand All @@ -51,7 +51,7 @@
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-base",
},
"kaggle_handle": "gs://keras-nlp-kaggle/deberta_v3_base_en",
"kaggle_handle": "kaggle://keras/deberta_v3/deberta_v3_base_en/1",
},
"deberta_v3_large_en": {
"metadata": {
Expand All @@ -64,7 +64,7 @@
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/deberta-v3-large",
},
"kaggle_handle": "gs://keras-nlp-kaggle/deberta_v3_large_en",
"kaggle_handle": "kaggle://keras/deberta_v3/deberta_v3_large_en/1",
},
"deberta_v3_base_multi": {
"metadata": {
Expand All @@ -77,6 +77,6 @@
"path": "deberta_v3",
"model_card": "https://huggingface.co/microsoft/mdeberta-v3-base",
},
"kaggle_handle": "gs://keras-nlp-kaggle/deberta_v3_base_multi",
"kaggle_handle": "kaggle://keras/deberta_v3/deberta_v3_base_multi/1",
},
}
6 changes: 3 additions & 3 deletions keras_nlp/models/distil_bert/distil_bert_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@
"path": "distil_bert",
"model_card": "https://huggingface.co/distilbert-base-uncased",
},
"kaggle_handle": "gs://keras-nlp-kaggle/distil_bert_base_en_uncased",
"kaggle_handle": "kaggle://keras/distil_bert/distil_bert_base_en_uncased/1",
},
"distil_bert_base_en": {
"metadata": {
Expand All @@ -40,7 +40,7 @@
"path": "distil_bert",
"model_card": "https://huggingface.co/distilbert-base-cased",
},
"kaggle_handle": "gs://keras-nlp-kaggle/distil_bert_base_en",
"kaggle_handle": "kaggle://keras/distil_bert/distil_bert_base_en/1",
},
"distil_bert_base_multi": {
"metadata": {
Expand All @@ -52,6 +52,6 @@
"path": "distil_bert",
"model_card": "https://huggingface.co/distilbert-base-multilingual-cased",
},
"kaggle_handle": "gs://keras-nlp-kaggle/distil_bert_base_multi",
"kaggle_handle": "kaggle://keras/distil_bert/distil_bert_base_multi/1",
},
}
4 changes: 2 additions & 2 deletions keras_nlp/models/f_net/f_net_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"path": "f_net",
"model_card": "https://github.com/google-research/google-research/blob/master/f_net/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/f_net_base_en",
"kaggle_handle": "kaggle://keras/f_net/f_net_base_en/1",
},
"f_net_large_en": {
"metadata": {
Expand All @@ -38,6 +38,6 @@
"path": "f_net",
"model_card": "https://github.com/google-research/google-research/blob/master/f_net/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/f_net_large_en",
"kaggle_handle": "kaggle://keras/f_net/f_net_large_en/1",
},
}
10 changes: 5 additions & 5 deletions keras_nlp/models/gpt2/gpt2_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@
"path": "gpt2",
"model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/gpt2_base_en",
"kaggle_handle": "kaggle://keras/gpt2/gpt2_base_en/1",
},
"gpt2_medium_en": {
"metadata": {
Expand All @@ -39,7 +39,7 @@
"path": "gpt2",
"model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/gpt2_medium_en",
"kaggle_handle": "kaggle://keras/gpt2/gpt2_medium_en/1",
},
"gpt2_large_en": {
"metadata": {
Expand All @@ -52,7 +52,7 @@
"path": "gpt2",
"model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/gpt2_large_en",
"kaggle_handle": "kaggle://keras/gpt2/gpt2_large_en/1",
},
"gpt2_extra_large_en": {
"metadata": {
Expand All @@ -65,7 +65,7 @@
"path": "gpt2",
"model_card": "https://github.com/openai/gpt-2/blob/master/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/gpt2_extra_large_en",
"kaggle_handle": "kaggle://keras/gpt2/gpt2_extra_large_en/1",
},
"gpt2_base_en_cnn_dailymail": {
"metadata": {
Expand All @@ -77,6 +77,6 @@
"official_name": "GPT-2",
"path": "gpt2",
},
"kaggle_handle": "gs://keras-nlp-kaggle/gpt2_base_en_cnn_dailymail",
"kaggle_handle": "kaggle://keras/gpt2/gpt2_base_en_cnn_dailymail/1",
},
}
8 changes: 4 additions & 4 deletions keras_nlp/models/opt/opt_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -26,7 +26,7 @@
"path": "opt",
"model_card": "https://github.com/facebookresearch/metaseq/blob/main/projects/OPT/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/opt_125m_en",
"kaggle_handle": "kaggle://keras/opt/opt_125m_en/1",
},
# We skip the 350m checkpoint because it does not match the structure of
# other checkpoints.
Expand All @@ -41,7 +41,7 @@
"path": "opt",
"model_card": "https://github.com/facebookresearch/metaseq/blob/main/projects/OPT/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/opt_1.3b_en",
"kaggle_handle": "kaggle://keras/opt/opt_1.3b_en/1",
},
"opt_2.7b_en": {
"metadata": {
Expand All @@ -54,7 +54,7 @@
"path": "opt",
"model_card": "https://github.com/facebookresearch/metaseq/blob/main/projects/OPT/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/opt_2.7b_en",
"kaggle_handle": "kaggle://keras/opt/opt_2.7b_en/1",
},
"opt_6.7b_en": {
"metadata": {
Expand All @@ -67,6 +67,6 @@
"path": "opt",
"model_card": "https://github.com/facebookresearch/metaseq/blob/main/projects/OPT/model_card.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/opt_6.7b_en",
"kaggle_handle": "kaggle://keras/opt/opt_6.7b_en/1",
},
}
4 changes: 2 additions & 2 deletions keras_nlp/models/roberta/roberta_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"path": "roberta",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/roberta/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/roberta_base_en",
"kaggle_handle": "kaggle://keras/roberta/roberta_base_en/1",
},
"roberta_large_en": {
"metadata": {
Expand All @@ -38,6 +38,6 @@
"path": "roberta",
"model_card": "https://github.com/facebookresearch/fairseq/blob/main/examples/roberta/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/roberta_large_en",
"kaggle_handle": "kaggle://keras/roberta/roberta_large_en/1",
},
}
12 changes: 6 additions & 6 deletions keras_nlp/models/t5/t5_presets.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,7 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/t5_small_multi",
"kaggle_handle": "kaggle://keras/t5/t5_small_multi/1",
},
"t5_base_multi": {
"metadata": {
Expand All @@ -38,7 +38,7 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/t5_base_multi",
"kaggle_handle": "kaggle://keras/t5/t5_base_multi/1",
},
"t5_large_multi": {
"metadata": {
Expand All @@ -51,7 +51,7 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/t5_large_multi",
"kaggle_handle": "kaggle://keras/t5/t5_large_multi/1",
},
"flan_small_multi": {
"metadata": {
Expand All @@ -64,7 +64,7 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/flan_small_multi",
"kaggle_handle": "kaggle://keras/t5/flan_small_multi/1",
},
"flan_base_multi": {
"metadata": {
Expand All @@ -77,7 +77,7 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/flan_base_multi",
"kaggle_handle": "kaggle://keras/t5/flan_base_multi/1",
},
"flan_large_multi": {
"metadata": {
Expand All @@ -90,6 +90,6 @@
"path": "t5",
"model_card": "https://github.com/google-research/text-to-text-transfer-transformer/blob/main/README.md",
},
"kaggle_handle": "gs://keras-nlp-kaggle/flan_large_multi",
"kaggle_handle": "kaggle://keras/t5/flan_large_multi/1",
},
}
Loading