|
| 1 | +# Parameters for Adam: |
| 2 | +# ============================================================================== |
| 3 | +Adam.b1 = 0.9 |
| 4 | +Adam.b2 = 0.999 |
| 5 | +Adam.clip_grad_norm = None |
| 6 | +Adam.eps = 1e-05 |
| 7 | +Adam.weight_decay_rate = 1e-05 |
| 8 | + |
| 9 | +# Parameters for AddLossWeights: |
| 10 | +# ============================================================================== |
| 11 | +# None. |
| 12 | + |
| 13 | +# Parameters for backend: |
| 14 | +# ============================================================================== |
| 15 | +backend.name = 'jax' |
| 16 | + |
| 17 | +# Parameters for BucketByLength: |
| 18 | +# ============================================================================== |
| 19 | +BucketByLength.length_axis = 0 |
| 20 | +BucketByLength.strict_pad_on_len = False |
| 21 | + |
| 22 | +# Parameters for FilterByLength: |
| 23 | +# ============================================================================== |
| 24 | +FilterByLength.length_axis = 0 |
| 25 | + |
| 26 | +# Parameters for LogSoftmax: |
| 27 | +# ============================================================================== |
| 28 | +LogSoftmax.axis = -1 |
| 29 | + |
| 30 | +# Parameters for random_spans_helper: |
| 31 | +# ============================================================================== |
| 32 | +# None. |
| 33 | + |
| 34 | +# Parameters for SentencePieceVocabulary: |
| 35 | +# ============================================================================== |
| 36 | +# None. |
| 37 | + |
| 38 | +# Parameters for data.TFDS: |
| 39 | +# ============================================================================== |
| 40 | +# None. |
| 41 | + |
| 42 | +# Parameters for tf_inputs.TFDS: |
| 43 | +# ============================================================================== |
| 44 | +# None. |
| 45 | + |
| 46 | +# Parameters for data.Tokenize: |
| 47 | +# ============================================================================== |
| 48 | +# None. |
| 49 | + |
| 50 | +# Parameters for tf_inputs.Tokenize: |
| 51 | +# ============================================================================== |
| 52 | +tf_inputs.Tokenize.keys = None |
| 53 | +tf_inputs.Tokenize.n_reserved_ids = 0 |
| 54 | +tf_inputs.Tokenize.vocab_type = 'subword' |
| 55 | + |
| 56 | +# Parameters for Vocabulary: |
| 57 | +# ============================================================================== |
| 58 | +# None. |
| 59 | + |
| 60 | +# Parameters for warmup_and_rsqrt_decay: |
| 61 | +# ============================================================================== |
| 62 | +# None. |
0 commit comments