Update README.md
Browse files
README.md
CHANGED
@@ -22,7 +22,7 @@ tags:
|
|
22 |
1. Model:
|
23 |
- Dropout rate: 0.0
|
24 |
- Activations: `silu`, `gated-silu`
|
25 |
-
-
|
26 |
|
27 |
2. Data processing:
|
28 |
- Input length: 1024
|
@@ -44,7 +44,6 @@ tags:
|
|
44 |
- Device: GPU
|
45 |
- Precision: bfloat16, tf32
|
46 |
|
47 |
-
|
48 |
## plots
|
49 |
|
50 |
|
|
|
22 |
1. Model:
|
23 |
- Dropout rate: 0.0
|
24 |
- Activations: `silu`, `gated-silu`
|
25 |
+
- torch compile: true
|
26 |
|
27 |
2. Data processing:
|
28 |
- Input length: 1024
|
|
|
44 |
- Device: GPU
|
45 |
- Precision: bfloat16, tf32
|
46 |
|
|
|
47 |
## plots
|
48 |
|
49 |
|