|
4 | 4 | POST: > |
5 | 5 | s['global_batch_size'] = v['value'] |
6 | 6 |
|
7 | | -# TODO: Update with official compliance requirements |
| 7 | +- KEY: |
| 8 | + NAME: max_sequence_length |
| 9 | + REQ: EXACTLY_ONE |
| 10 | + CHECK: " v['value'] == 8192 " |
| 11 | + |
| 12 | +- KEY: |
| 13 | + NAME: opt_name |
| 14 | + REQ: EXACTLY_ONE |
| 15 | + CHECK: " v['value'] == 'adamw' " |
| 16 | + |
8 | 17 | - KEY: |
9 | 18 | NAME: opt_base_learning_rate |
10 | 19 | REQ: EXACTLY_ONE |
11 | 20 |
|
12 | 21 | - KEY: |
13 | | - NAME: opt_lamb_epsilon |
| 22 | + NAME: opt_end_learning_rate |
14 | 23 | REQ: EXACTLY_ONE |
15 | 24 |
|
16 | 25 | - KEY: |
17 | | - NAME: opt_learning_rate_training_steps |
| 26 | + NAME: opt_learning_rate_decay_steps |
18 | 27 | REQ: EXACTLY_ONE |
| 28 | + CHECK: " v['value'] * s['global_batch_size'] == 1.2e6 " |
19 | 29 |
|
20 | 30 | - KEY: |
21 | 31 | NAME: opt_learning_rate_warmup_steps |
22 | 32 | REQ: EXACTLY_ONE |
23 | 33 |
|
24 | 34 | - KEY: |
25 | | - NAME: num_warmup_steps |
| 35 | + NAME: opt_learning_rate_decay_schedule |
| 36 | + REQ: EXACTLY_ONE |
| 37 | + CHECK: " v['value'] == 'cosine with linear warmup' " |
| 38 | + |
| 39 | +- KEY: |
| 40 | + NAME: opt_adamw_beta_1 |
26 | 41 | REQ: EXACTLY_ONE |
| 42 | + CHECK: " v['value'] == 0.9 " |
27 | 43 |
|
28 | 44 | - KEY: |
29 | | - NAME: start_warmup_step |
| 45 | + NAME: opt_adamw_beta_2 |
30 | 46 | REQ: EXACTLY_ONE |
| 47 | + CHECK: " v['value'] == 0.95 " |
31 | 48 |
|
32 | 49 | - KEY: |
33 | | - NAME: opt_lamb_beta_1 |
| 50 | + NAME: opt_adamw_epsilon |
34 | 51 | REQ: EXACTLY_ONE |
| 52 | + CHECK: " v['value'] == 1e-05 " |
35 | 53 |
|
36 | 54 | - KEY: |
37 | | - NAME: opt_lamb_beta_2 |
| 55 | + NAME: opt_adamw_weight_decay |
38 | 56 | REQ: EXACTLY_ONE |
| 57 | + CHECK: " v['value'] == 0.1 " |
39 | 58 |
|
40 | 59 | - KEY: |
41 | | - NAME: opt_lamb_weight_decay_rate |
| 60 | + NAME: opt_gradient_clip_norm |
42 | 61 | REQ: EXACTLY_ONE |
| 62 | + CHECK: " v['value'] == 1.0 " |
| 63 | + |
| 64 | +- KEY: |
| 65 | + NAME: gradient_accumulation_steps |
| 66 | + REQ: EXACTLY_ONE |
| 67 | + CHECK: " v['value'] > 0 " |
| 68 | + |
| 69 | +- KEY: |
| 70 | + NAME: eval_samples |
| 71 | + REQ: EXACTLY_ONE |
| 72 | + CHECK: " v['value'] == 5760 " |
43 | 73 |
|
44 | 74 | - KEY: |
45 | 75 | NAME: eval_accuracy |
46 | 76 | REQ: AT_LEAST_ONE |
47 | 77 | CHECK: |
48 | | - - "'epoch_num' in v['metadata']" |
49 | | - ATLEAST_ONE_CHECK: "(v['value'] >= 0.720) and v['value'] < 1.0" |
| 78 | + - "'samples_count' in v['metadata']" |
| 79 | + ATLEAST_ONE_CHECK: "(v['value'] <= 3.3) and v['value'] > 0.0" |
| 80 | + |
| 81 | +- KEY: |
| 82 | + NAME: MAX_STEPS |
| 83 | + REQ: EXACTLY_ONE |
| 84 | + CHECK: " v['value'] == 1200000 " |
| 85 | + |
0 commit comments