Spaces:
Runtime error
Runtime error
Upload folder using huggingface_hub
Browse files
- run_transformers_training.py +6 -2
- transformers_config.json +11 -4
run_transformers_training.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
-
#!/usr/bin/env
|
2 |
-
# coding
|
3 |
|
4 |
# Basic Python imports
|
5 |
import os
|
@@ -12,6 +12,10 @@ import time
|
|
12 |
import warnings
|
13 |
from importlib.util import find_spec
|
14 |
import multiprocessing
|
|
|
|
|
|
|
|
|
15 |
|
16 |
# Check hardware capabilities first
|
17 |
CUDA_AVAILABLE = "CUDA_VISIBLE_DEVICES" in os.environ or os.environ.get("NVIDIA_VISIBLE_DEVICES") != ""
|
|
|
1 |
+
#!/usr/bin/env python3
|
2 |
+
# -*- coding: utf-8 -*-
|
3 |
|
4 |
# Basic Python imports
|
5 |
import os
|
|
|
12 |
import warnings
|
13 |
from importlib.util import find_spec
|
14 |
import multiprocessing
|
15 |
+
import torch
|
16 |
+
import random
|
17 |
+
import numpy as np
|
18 |
+
from tqdm import tqdm
|
19 |
|
20 |
# Check hardware capabilities first
|
21 |
CUDA_AVAILABLE = "CUDA_VISIBLE_DEVICES" in os.environ or os.environ.get("NVIDIA_VISIBLE_DEVICES") != ""
|
transformers_config.json
CHANGED
@@ -67,7 +67,14 @@
|
|
67 |
"offload_params": false
|
68 |
},
|
69 |
"ddp_find_unused_parameters": false,
|
70 |
-
"dataloader_num_workers": 2
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
71 |
},
|
72 |
|
73 |
"logging": {
|
@@ -112,11 +119,11 @@
|
|
112 |
"use_gradient_checkpointing": true,
|
113 |
"use_flash_attention": true
|
114 |
},
|
115 |
-
"multi_gpu_strategy": "
|
116 |
},
|
117 |
"system_settings": {
|
118 |
-
"cuda_memory_fraction": 0.
|
119 |
-
"dataloader_num_workers":
|
120 |
"dataloader_pin_memory": true
|
121 |
},
|
122 |
"memory_breakdown": {
|
|
|
67 |
"offload_params": false
|
68 |
},
|
69 |
"ddp_find_unused_parameters": false,
|
70 |
+
"dataloader_num_workers": 2,
|
71 |
+
"ddp_config": {
|
72 |
+
"enabled": true,
|
73 |
+
"backend": "nccl",
|
74 |
+
"find_unused_parameters": false,
|
75 |
+
"broadcast_buffers": false,
|
76 |
+
"gradient_as_bucket_view": true
|
77 |
+
}
|
78 |
},
|
79 |
|
80 |
"logging": {
|
|
|
119 |
"use_gradient_checkpointing": true,
|
120 |
"use_flash_attention": true
|
121 |
},
|
122 |
+
"multi_gpu_strategy": "ddp"
|
123 |
},
|
124 |
"system_settings": {
|
125 |
+
"cuda_memory_fraction": 0.75,
|
126 |
+
"dataloader_num_workers": 4,
|
127 |
"dataloader_pin_memory": true
|
128 |
},
|
129 |
"memory_breakdown": {
|