|
| 1 | +MODELS_MASTER = { |
| 2 | + "path": "models/", |
| 3 | + "title": "Models", |
| 4 | + "toc": True, |
| 5 | + "children": [ |
| 6 | + { |
| 7 | + "path": "bert/", |
| 8 | + "title": "Bert", |
| 9 | + "toc": True, |
| 10 | + "children": [ |
| 11 | + { |
| 12 | + "path": "bert_tokenizer", |
| 13 | + "title": "BertTokenizer", |
| 14 | + "generate": [ |
| 15 | + "keras_nlp.models.BertTokenizer", |
| 16 | + "keras_nlp.models.BertTokenizer.from_preset", |
| 17 | + ], |
| 18 | + }, |
| 19 | + { |
| 20 | + "path": "bert_preprocessor", |
| 21 | + "title": "BertPreprocessor layer", |
| 22 | + "generate": [ |
| 23 | + "keras_nlp.models.BertPreprocessor", |
| 24 | + "keras_nlp.models.BertPreprocessor.from_preset", |
| 25 | + "keras_nlp.models.BertPreprocessor.tokenizer", |
| 26 | + ], |
| 27 | + }, |
| 28 | + { |
| 29 | + "path": "bert_backbone", |
| 30 | + "title": "BertBackbone model", |
| 31 | + "generate": [ |
| 32 | + "keras_nlp.models.BertBackbone", |
| 33 | + "keras_nlp.models.BertBackbone.from_preset", |
| 34 | + ], |
| 35 | + }, |
| 36 | + { |
| 37 | + "path": "bert_classifier", |
| 38 | + "title": "BertClassifier model", |
| 39 | + "generate": [ |
| 40 | + "keras_nlp.models.BertClassifier", |
| 41 | + "keras_nlp.models.BertClassifier.from_preset", |
| 42 | + "keras_nlp.models.BertClassifier.backbone", |
| 43 | + "keras_nlp.models.BertClassifier.preprocessor", |
| 44 | + ], |
| 45 | + }, |
| 46 | + ], |
| 47 | + }, |
| 48 | + { |
| 49 | + "path": "distil_bert/", |
| 50 | + "title": "DistilBert", |
| 51 | + "toc": True, |
| 52 | + "children": [ |
| 53 | + { |
| 54 | + "path": "distil_bert_tokenizer", |
| 55 | + "title": "DistilBertTokenizer", |
| 56 | + "generate": [ |
| 57 | + "keras_nlp.models.DistilBertTokenizer", |
| 58 | + "keras_nlp.models.DistilBertTokenizer.from_preset", |
| 59 | + ], |
| 60 | + }, |
| 61 | + { |
| 62 | + "path": "distil_bert_preprocessor", |
| 63 | + "title": "DistilBertPreprocessor layer", |
| 64 | + "generate": [ |
| 65 | + "keras_nlp.models.DistilBertPreprocessor", |
| 66 | + "keras_nlp.models.DistilBertPreprocessor.from_preset", |
| 67 | + "keras_nlp.models.DistilBertPreprocessor.tokenizer", |
| 68 | + ], |
| 69 | + }, |
| 70 | + { |
| 71 | + "path": "distil_bert_backbone", |
| 72 | + "title": "DistilBertBackbone model", |
| 73 | + "generate": [ |
| 74 | + "keras_nlp.models.DistilBertBackbone", |
| 75 | + "keras_nlp.models.DistilBertBackbone.from_preset", |
| 76 | + ], |
| 77 | + }, |
| 78 | + { |
| 79 | + "path": "distil_bert_classifier", |
| 80 | + "title": "DistilBertClassifier model", |
| 81 | + "generate": [ |
| 82 | + "keras_nlp.models.DistilBertClassifier", |
| 83 | + "keras_nlp.models.DistilBertClassifier.from_preset", |
| 84 | + "keras_nlp.models.DistilBertClassifier.backbone", |
| 85 | + "keras_nlp.models.DistilBertClassifier.preprocessor", |
| 86 | + ], |
| 87 | + }, |
| 88 | + ], |
| 89 | + }, |
| 90 | + { |
| 91 | + "path": "roberta/", |
| 92 | + "title": "Roberta", |
| 93 | + "toc": True, |
| 94 | + "children": [ |
| 95 | + { |
| 96 | + "path": "roberta_tokenizer", |
| 97 | + "title": "RobertaTokenizer", |
| 98 | + "generate": [ |
| 99 | + "keras_nlp.models.RobertaTokenizer", |
| 100 | + "keras_nlp.models.RobertaTokenizer.from_preset", |
| 101 | + ], |
| 102 | + }, |
| 103 | + { |
| 104 | + "path": "roberta_preprocessor", |
| 105 | + "title": "RobertaPreprocessor layer", |
| 106 | + "generate": [ |
| 107 | + "keras_nlp.models.RobertaPreprocessor", |
| 108 | + "keras_nlp.models.RobertaPreprocessor.from_preset", |
| 109 | + "keras_nlp.models.RobertaPreprocessor.tokenizer", |
| 110 | + ], |
| 111 | + }, |
| 112 | + { |
| 113 | + "path": "roberta_backbone", |
| 114 | + "title": "RobertaBackbone model", |
| 115 | + "generate": [ |
| 116 | + "keras_nlp.models.RobertaBackbone", |
| 117 | + "keras_nlp.models.RobertaBackbone.from_preset", |
| 118 | + ], |
| 119 | + }, |
| 120 | + { |
| 121 | + "path": "roberta_classifier", |
| 122 | + "title": "RobertaClassifier model", |
| 123 | + "generate": [ |
| 124 | + "keras_nlp.models.RobertaClassifier", |
| 125 | + "keras_nlp.models.RobertaClassifier.from_preset", |
| 126 | + "keras_nlp.models.RobertaClassifier.backbone", |
| 127 | + "keras_nlp.models.RobertaClassifier.preprocessor", |
| 128 | + ], |
| 129 | + }, |
| 130 | + ], |
| 131 | + }, |
| 132 | + { |
| 133 | + "path": "xlm_roberta/", |
| 134 | + "title": "XLMRoberta", |
| 135 | + "toc": True, |
| 136 | + "children": [ |
| 137 | + { |
| 138 | + "path": "xlm_roberta_tokenizer", |
| 139 | + "title": "XLMRobertaTokenizer", |
| 140 | + "generate": [ |
| 141 | + "keras_nlp.models.XLMRobertaTokenizer", |
| 142 | + "keras_nlp.models.XLMRobertaTokenizer.from_preset", |
| 143 | + ], |
| 144 | + }, |
| 145 | + { |
| 146 | + "path": "xlm_roberta_preprocessor", |
| 147 | + "title": "XLMRobertaPreprocessor layer", |
| 148 | + "generate": [ |
| 149 | + "keras_nlp.models.XLMRobertaPreprocessor", |
| 150 | + "keras_nlp.models.XLMRobertaPreprocessor.from_preset", |
| 151 | + "keras_nlp.models.XLMRobertaPreprocessor.tokenizer", |
| 152 | + ], |
| 153 | + }, |
| 154 | + { |
| 155 | + "path": "xlm_roberta_backbone", |
| 156 | + "title": "XLMRobertaBackbone model", |
| 157 | + "generate": [ |
| 158 | + "keras_nlp.models.XLMRobertaBackbone", |
| 159 | + "keras_nlp.models.XLMRobertaBackbone.from_preset", |
| 160 | + ], |
| 161 | + }, |
| 162 | + { |
| 163 | + "path": "xlm_roberta_classifier", |
| 164 | + "title": "XLMRobertaClassifier model", |
| 165 | + "generate": [ |
| 166 | + "keras_nlp.models.XLMRobertaClassifier", |
| 167 | + "keras_nlp.models.XLMRobertaClassifier.from_preset", |
| 168 | + "keras_nlp.models.XLMRobertaClassifier.backbone", |
| 169 | + "keras_nlp.models.XLMRobertaClassifier.preprocessor", |
| 170 | + ], |
| 171 | + }, |
| 172 | + ], |
| 173 | + }, |
| 174 | + ], |
| 175 | +} |
| 176 | + |
1 | 177 | TOKENIZERS_MASTER = { |
2 | 178 | "path": "tokenizers/", |
3 | 179 | "title": "Tokenizers", |
|
69 | 245 | ], |
70 | 246 | }, |
71 | 247 | { |
72 | | - "path": "unicode_character_tokenizer", |
73 | | - "title": "UnicodeCharacterTokenizer", |
| 248 | + "path": "unicode_codepoint_tokenizer", |
| 249 | + "title": "UnicodeCodepointTokenizer", |
74 | 250 | "generate": [ |
75 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer", |
76 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.tokenize", |
77 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.detokenize", |
78 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.get_vocabulary", |
79 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.vocabulary_size", |
80 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.token_to_id", |
81 | | - "keras_nlp.tokenizers.UnicodeCharacterTokenizer.id_to_token", |
| 251 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer", |
| 252 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.tokenize", |
| 253 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.detokenize", |
| 254 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.get_vocabulary", |
| 255 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.vocabulary_size", |
| 256 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.token_to_id", |
| 257 | + "keras_nlp.tokenizers.UnicodeCodepointTokenizer.id_to_token", |
82 | 258 | ], |
83 | 259 | }, |
| 260 | + { |
| 261 | + "path": "compute_word_piece_vocabulary", |
| 262 | + "title": "compute_word_piece_vocabulary function", |
| 263 | + "generate": ["keras_nlp.tokenizers.compute_word_piece_vocabulary"], |
| 264 | + }, |
| 265 | + { |
| 266 | + "path": "compute_sentence_piece_proto", |
| 267 | + "title": "compute_sentence_piece_proto function", |
| 268 | + "generate": ["keras_nlp.tokenizers.compute_sentence_piece_proto"], |
| 269 | + }, |
84 | 270 | ], |
85 | 271 | } |
86 | 272 |
|
87 | | -LAYERS_MASTER = { |
88 | | - "path": "layers/", |
89 | | - "title": "Layers", |
| 273 | +PREPROCESSING_LAYERS_MASTER = { |
| 274 | + "path": "preprocessing_layers/", |
| 275 | + "title": "Preprocessing Layers", |
| 276 | + "toc": True, |
| 277 | + "children": [ |
| 278 | + { |
| 279 | + "path": "start_end_packer", |
| 280 | + "title": "StartEndPacker layer", |
| 281 | + "generate": ["keras_nlp.layers.StartEndPacker"], |
| 282 | + }, |
| 283 | + { |
| 284 | + "path": "multi_segment_packer", |
| 285 | + "title": "MultiSegmentPacker layer", |
| 286 | + "generate": ["keras_nlp.layers.MultiSegmentPacker"], |
| 287 | + }, |
| 288 | + { |
| 289 | + "path": "random_swap", |
| 290 | + "title": "RandomSwap layer", |
| 291 | + "generate": ["keras_nlp.layers.RandomSwap"], |
| 292 | + }, |
| 293 | + { |
| 294 | + "path": "random_deletion", |
| 295 | + "title": "RandomDeletion layer", |
| 296 | + "generate": ["keras_nlp.layers.RandomDeletion"], |
| 297 | + }, |
| 298 | + { |
| 299 | + "path": "masked_lm_mask_generator", |
| 300 | + "title": "MaskedLMMaskGenerator layer", |
| 301 | + "generate": ["keras_nlp.layers.MaskedLMMaskGenerator"], |
| 302 | + }, |
| 303 | + ], |
| 304 | +} |
| 305 | + |
| 306 | +MODELING_LAYERS_MASTER = { |
| 307 | + "path": "modeling_layers/", |
| 308 | + "title": "Modeling Layers", |
90 | 309 | "toc": True, |
91 | 310 | "children": [ |
92 | 311 | { |
|
126 | 345 | "generate": ["keras_nlp.layers.TokenAndPositionEmbedding"], |
127 | 346 | }, |
128 | 347 | { |
129 | | - "path": "mlm_mask_generator", |
130 | | - "title": "MLMMaskGenerator layer", |
131 | | - "generate": ["keras_nlp.layers.MLMMaskGenerator"], |
132 | | - }, |
133 | | - { |
134 | | - "path": "mlm_head", |
135 | | - "title": "MLMHead layer", |
136 | | - "generate": ["keras_nlp.layers.MLMHead"], |
137 | | - }, |
138 | | - { |
139 | | - "path": "start_end_packer", |
140 | | - "title": "StartEndPacker layer", |
141 | | - "generate": ["keras_nlp.layers.StartEndPacker"], |
142 | | - }, |
143 | | - { |
144 | | - "path": "multi_segment_packer", |
145 | | - "title": "MultiSegmentPacker layer", |
146 | | - "generate": ["keras_nlp.layers.MultiSegmentPacker"], |
| 348 | + "path": "masked_lm_head", |
| 349 | + "title": "MaskedLMHead layer", |
| 350 | + "generate": ["keras_nlp.layers.MaskedLMHead"], |
147 | 351 | }, |
148 | 352 | ], |
149 | 353 | } |
|
169 | 373 | "title": "RougeN metric", |
170 | 374 | "generate": ["keras_nlp.metrics.RougeN"], |
171 | 375 | }, |
| 376 | + { |
| 377 | + "path": "bleu", |
| 378 | + "title": "Bleu metric", |
| 379 | + "generate": ["keras_nlp.metrics.Bleu"], |
| 380 | + }, |
| 381 | + { |
| 382 | + "path": "edit_distance", |
| 383 | + "title": "EditDistance metric", |
| 384 | + "generate": ["keras_nlp.metrics.EditDistance"], |
| 385 | + }, |
| 386 | + |
172 | 387 | ], |
173 | 388 | } |
174 | 389 |
|
|
210 | 425 | "title": "KerasNLP", |
211 | 426 | "toc": True, |
212 | 427 | "children": [ |
| 428 | + MODELS_MASTER, |
213 | 429 | TOKENIZERS_MASTER, |
214 | | - LAYERS_MASTER, |
| 430 | + PREPROCESSING_LAYERS_MASTER, |
| 431 | + MODELING_LAYERS_MASTER, |
215 | 432 | METRICS_MASTER, |
216 | 433 | UTILS_MASTER, |
217 | 434 | ], |
|
0 commit comments