Add files using upload-large-folder tool
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +7 -0
- llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/logs/debug-internal.log +3 -0
- llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/run-jep2n358.wandb +3 -0
- llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/logs/debug-internal.log +3 -0
- llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/run-jep2n358.wandb +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_05_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_07_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_11_mp_rank_06_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_1_mp_rank_07_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_5_mp_rank_06_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_01-model_01-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_05-model_00-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_08-model_00-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_10-model_01-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_13-model_00-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_14-model_01-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_15-model_01-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_15-model_02-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_16-model_02-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_17-model_03-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_21-model_02-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_22-model_01-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_27-model_00-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_29-model_03-model_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_10_mp_rank_04_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_11_mp_rank_04_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_04_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_05_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_06_optim_states.pt +3 -0
- llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_07_optim_states.pt +3 -0
.gitattributes
CHANGED
@@ -36,3 +36,10 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
|
|
36 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_125809-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
37 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130023-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
38 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_131856-1kmt9fpr/run-1kmt9fpr.wandb filter=lfs diff=lfs merge=lfs -text
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
36 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_125809-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
37 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130023-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
38 |
llama3b/Megatron-DeepSpeed/wandb/run-20240906_131856-1kmt9fpr/run-1kmt9fpr.wandb filter=lfs diff=lfs merge=lfs -text
|
39 |
+
llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
40 |
+
llama3b/results/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/2024-09-04_03-33/run.log filter=lfs diff=lfs merge=lfs -text
|
41 |
+
llama3b/results/llamav2-3b/128/sangraha-hindi-TI135000-TP4PP2DP16-MBS8/2024-09-02_07-16/run.log filter=lfs diff=lfs merge=lfs -text
|
42 |
+
llama3b/results/llamav2-3b/128/sangraha-hindi-TI260500-TP4PP2DP16-MBS8/2024-09-03_16-10/run.log filter=lfs diff=lfs merge=lfs -text
|
43 |
+
llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/logs/debug-internal.log filter=lfs diff=lfs merge=lfs -text
|
44 |
+
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/run-jep2n358.wandb filter=lfs diff=lfs merge=lfs -text
|
45 |
+
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/logs/debug-internal.log filter=lfs diff=lfs merge=lfs -text
|
llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/logs/debug-internal.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6846dd37bd3e71189471f5a4783b9214f39ed40d6c0fdfb13ebc6eb4e2de1154
|
3 |
+
size 36041636
|
llama3b/Megatron-DeepSpeed/wandb/run-20240906_124210-jep2n358/run-jep2n358.wandb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2c4c02306f09aacd8029f70cc118277854ec689974802afe60728362c7db4dba
|
3 |
+
size 22707822
|
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/logs/debug-internal.log
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:074b427d4880d769b46539155aaa6ffed20e90d472d8d6fbeda7ee727d8ca83d
|
3 |
+
size 59550809
|
llama3b/Megatron-DeepSpeed/wandb/run-20240906_130234-jep2n358/run-jep2n358.wandb
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:688fce8f6f06e13f2e2121025d9d66b12021ed7c0c502d6d4a31246ee7424e69
|
3 |
+
size 37957929
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4129bcf5b6b3eea649fcd6403b6e4f257f9d2bf6789a1f4af4449eb423223d1c
|
3 |
+
size 334793712
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3a56941ad2f669e9d7417665953b249a79d84109530333fc455ab8e0557ac704
|
3 |
+
size 334793712
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6f44b5fa390c455ee2f1f362372f74fc5747badf181c3e6f61b888ef37145d66
|
3 |
+
size 334794042
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_02_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6610fdb90b458b83e8304048493864ac799d02543cccd4e9933de6b0d9c7d8a8
|
3 |
+
size 334794042
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:197d0abb7c5784734e82916b2d1b2f048bac92d6946150c9f7b89adf65f1c1c7
|
3 |
+
size 334794042
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_05_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9148463efcfffc37c3bd22ee1b258ffc0e0e076b8f607db5214c34548ed26c83
|
3 |
+
size 334796282
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_10_mp_rank_07_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ec1eed271899ce8bb6872096ffffcf344a6d73ad833bb47374ecc830da5fac22
|
3 |
+
size 334796282
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e873a9136f2e07bb63c3616037546f86d5232914a1dbee4bbf5e4c71862b6dd1
|
3 |
+
size 334793914
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_11_mp_rank_06_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1906853fef935a1f8580fed28bde19999b24cd0dc172dd0da25525abe6b3c741
|
3 |
+
size 334796346
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_12_mp_rank_02_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:04ee89432361b052f0b06c689bcb5f3824d843148492ceb22777160142356c5b
|
3 |
+
size 334793978
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_14_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0c27b7dc81f43cce749f9fe36744a40e71050488edcf3d432f5941f6b10bf239
|
3 |
+
size 334794042
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6d6414b40593be90dff4798758dd03f8ba7a6ec7859a0e2bb22a8051a349070
|
3 |
+
size 334793914
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_15_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:64a932ddb5ac7046322e31ef0d3629632936fb4ae1d4c65b6608874c5e74789c
|
3 |
+
size 334793914
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_1_mp_rank_02_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:693383210cfad37ec874e7902e827b40fd12c9377868d9914411e31aad454409
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_1_mp_rank_07_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91d33b0e200c83125776c3cfbc2f452396bab27138e5cdc91b81de19cc3b316b
|
3 |
+
size 334796336
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89ce92625f00ade2a22edf801da729bd003b6c6f2cfc10e589548e8488d7c801
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_2_mp_rank_02_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3f4585ea184b5dcfc8824ab0a331a5c00b9d4033f44b7ebf0a4cf0980f66b773
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:91f7f979e707b46fcc66ed051a6517215e0c3886674343f2bc0a6c06a1cb556b
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4f6975ed6561e2e276b1738aef6900c1ab8ca60eced7193e940119db7921635a
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_5_mp_rank_06_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fc7c5decc426c6002d04d5babc76fa7518d7b90fcd84678cb96d25aac6c306d0
|
3 |
+
size 334796272
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/bf16_zero_pp_rank_8_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1d1a4c42b761ab31793056439562aa8a544683fddbd159c57eaecb0f0f8427b
|
3 |
+
size 334793968
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_01-model_01-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:da51138f8ec0ce87e79e888227bbf777f4c530b66709e7289c018412a35ab739
|
3 |
+
size 77858191
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_05-model_00-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:95ae95e9e703655e8f78396ba5a0a51fdf164ef8ea169a75ad99bc27e5a145c9
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_08-model_00-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f721c14245add9aad01845712ecab7ce8377be94a4ec6ebda50f5ab9aad63c3
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_10-model_01-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0242d77f3084f0d3816bd01c5cf99231db8d6ab3631992f57b38810e161a43d5
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_13-model_00-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:472cfa5950c8d290aeaecbef2a7f0ad110906be56d2b081c2cd7d0768df3779b
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_14-model_01-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a2224222ae97970ad8e9f6e103b59198a79d2619a2f1263ca615086382707b0c
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_15-model_01-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:226ff65c9077fd4f4de78dc3a3eded2cf410b7d904493d83cc46308e35393dbd
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_15-model_02-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eca917849e40668fd0b8de80482d82185673865714563f5e8e9458c7a503ead4
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_16-model_02-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e327eb9ee3a6f72bc4997c725a9b5201ec7e28bc02baa6f79d665618782857af
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_17-model_03-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee2f346eaeac2f1be52beac2c43dc8e8b61fe3385a0e80582c88e4dcff7ef904
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_21-model_02-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b8fd42276ff85b92fe3a1d8d0d5fba8f5b464a6ba40a42d9239c42c438cf0d8f
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_22-model_01-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fbc191bc11e189e3e1ed49eb84d71e49eb89ee7396731d1a5228444428d945ad
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_27-model_00-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c9997746062796264cbee016eab4036a6c5fd191e05829b30823b6a9eadbcd65
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step3000/layer_29-model_03-model_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e708d46f990d79db46c7fa613c9570fd14eb22ab41ba81b7cffa8890841840c8
|
3 |
+
size 58211118
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d984210b9837d2931c1892924f6bb7aad2f2d1f2329a089824e8f89e74cba1
|
3 |
+
size 334793712
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_0_mp_rank_03_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:779dae82be2ea91129b51779cb7ad8ddce8b1f23b3656a974f33fd4c2ceb19d9
|
3 |
+
size 334793712
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_10_mp_rank_04_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9dae86b2f10bcfa7ab6c1742b83d01fba63fa7008720bdd0a824383e26f01e66
|
3 |
+
size 334796282
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_11_mp_rank_02_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a31b6cf1387184dbb5fe11eb2b1fecbbf68377924b36814f9d42c2f48b92822b
|
3 |
+
size 334793914
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_11_mp_rank_04_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:07371fa140da5a4cad4eb001caf4455b0530f3bfca2ae17ce04a6d150e574ea3
|
3 |
+
size 334796346
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7644c555a437fcebdad8bdcb69efdba440f915ebae15810191592e8fc79b4e01
|
3 |
+
size 334793978
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_04_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c20b03f506de53a659ce0b78aa128483745e9bf3275082be01dfb38abbcc61aa
|
3 |
+
size 334796346
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_05_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:54e15c9d4d84dc8553b785cbe2e649c4cba7feec69b0686cee3b44f430a0e6ee
|
3 |
+
size 334796346
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_06_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ef1c970d60f0ccee8fc8d7c1fe2ac44c03aa00d5ff63f0a694ce53a255250d70
|
3 |
+
size 334796346
|
llama3b/checkpoint/llamav2-3b/128/sangraha-hindi-TI15500-TP4PP2DP16-MBS8/global_step8000/bf16_zero_pp_rank_12_mp_rank_07_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bf859a0c6da91b3af34dc04747d21c4c05270a1904e4a2c96f8d34d9674396ea
|
3 |
+
size 334796346
|