mzhaoshuai
committed on
Upload CLIP4STR Pre-trained on DataComp-1B, LAION-2B, and DFN-5B
Browse files
clip4str_base_6e9fe947ac.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:15f9c480e8db69cf8c7436d918dc3867e9055234f2f55f4c2de31cf0cc6b119c
|
3 |
+
size 633162005
|
clip4str_base_6e9fe947ac_log.txt
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Benchmark (Subset) set:
|
2 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
3 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
4 |
+
| IIIT5k | 3000 | 99.50 | 99.88 | 97.98 | 5.09 |
|
5 |
+
| SVT | 647 | 98.30 | 99.59 | 97.05 | 5.86 |
|
6 |
+
| IC13_1015 | 1015 | 98.62 | 99.59 | 97.81 | 5.32 |
|
7 |
+
| IC15_1811 | 1811 | 91.39 | 97.19 | 95.21 | 5.38 |
|
8 |
+
| IC15_2077 | 2077 | 91.14 | 96.97 | 94.71 | 5.33 |
|
9 |
+
| SVTP | 645 | 97.98 | 99.50 | 96.99 | 5.87 |
|
10 |
+
| CUTE80 | 288 | 98.96 | 99.36 | 98.09 | 5.53 |
|
11 |
+
| HOST | 2416 | 79.30 | 94.30 | 88.73 | 5.37 |
|
12 |
+
| WOST | 2416 | 88.78 | 96.82 | 92.93 | 5.40 |
|
13 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
14 |
+
| Combined | 14315 | 91.85 | 97.60 | 94.65 | 5.35 |
|
15 |
+
|
16 |
+
|
17 |
+
Benchmark set:
|
18 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
19 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
20 |
+
| IIIT5k | 3000 | 99.50 | 99.88 | 97.98 | 5.09 |
|
21 |
+
| SVT | 647 | 98.30 | 99.59 | 97.05 | 5.86 |
|
22 |
+
| IC13_1015 | 1015 | 98.62 | 99.59 | 97.81 | 5.32 |
|
23 |
+
| IC15_1811 | 1811 | 91.39 | 97.19 | 95.21 | 5.38 |
|
24 |
+
| IC15_2077 | 2077 | 91.14 | 96.97 | 94.71 | 5.33 |
|
25 |
+
| SVTP | 645 | 97.98 | 99.50 | 96.99 | 5.87 |
|
26 |
+
| CUTE80 | 288 | 98.96 | 99.36 | 98.09 | 5.53 |
|
27 |
+
| HOST | 2416 | 79.30 | 94.30 | 88.73 | 5.37 |
|
28 |
+
| WOST | 2416 | 88.78 | 96.82 | 92.93 | 5.40 |
|
29 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
30 |
+
| Combined | 14315 | 91.85 | 97.60 | 94.65 | 5.35 |
|
31 |
+
|
32 |
+
|
33 |
+
New set:
|
34 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
35 |
+
|:--------:|----------:|---------:|--------:|-----------:|-------------:|
|
36 |
+
| ArT | 35149 | 85.81 | 95.34 | 93.74 | 5.41 |
|
37 |
+
| COCOv1.4 | 9825 | 81.29 | 93.94 | 88.58 | 5.92 |
|
38 |
+
| Uber | 80551 | 92.05 | 96.71 | 93.27 | 5.36 |
|
39 |
+
|----------|-----------|----------|---------|------------|--------------|
|
40 |
+
| Combined | 125525 | 89.46 | 96.11 | 93.03 | 5.42 |
|
41 |
+
|
42 |
+
|
43 |
+
Time: Total 654.3242173194885s, Average 4.6790919430741456ms. Total samples 139840.
|
clip4str_huge_3e942729b1.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ae6808c0c0af0c0b679653597c0214d0c0eb504b8d84df1ac030023b0a0215c
|
3 |
+
size 4080917077
|
clip4str_huge_3e942729b1_log.txt
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Benchmark (Subset) set:
|
2 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
3 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
4 |
+
| IIIT5k | 3000 | 99.53 | 99.86 | 97.82 | 5.09 |
|
5 |
+
| SVT | 647 | 99.07 | 99.78 | 97.26 | 5.86 |
|
6 |
+
| IC13_1015 | 1015 | 98.92 | 99.52 | 97.64 | 5.32 |
|
7 |
+
| IC15_1811 | 1811 | 91.72 | 97.41 | 94.43 | 5.37 |
|
8 |
+
| IC15_2077 | 2077 | 90.95 | 97.11 | 93.75 | 5.33 |
|
9 |
+
| SVTP | 645 | 97.98 | 99.46 | 96.43 | 5.86 |
|
10 |
+
| CUTE80 | 288 | 98.96 | 99.67 | 97.30 | 5.53 |
|
11 |
+
| HOST | 2416 | 82.57 | 95.34 | 87.73 | 5.38 |
|
12 |
+
| WOST | 2416 | 90.94 | 97.41 | 92.50 | 5.39 |
|
13 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
14 |
+
| Combined | 14315 | 92.84 | 97.93 | 94.09 | 5.35 |
|
15 |
+
|
16 |
+
|
17 |
+
Benchmark set:
|
18 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
19 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
20 |
+
| IIIT5k | 3000 | 99.53 | 99.86 | 97.82 | 5.09 |
|
21 |
+
| SVT | 647 | 99.07 | 99.78 | 97.26 | 5.86 |
|
22 |
+
| IC13_1015 | 1015 | 98.92 | 99.52 | 97.64 | 5.32 |
|
23 |
+
| IC15_1811 | 1811 | 91.72 | 97.41 | 94.43 | 5.37 |
|
24 |
+
| IC15_2077 | 2077 | 90.95 | 97.11 | 93.75 | 5.33 |
|
25 |
+
| SVTP | 645 | 97.98 | 99.46 | 96.43 | 5.86 |
|
26 |
+
| CUTE80 | 288 | 98.96 | 99.67 | 97.30 | 5.53 |
|
27 |
+
| HOST | 2416 | 82.57 | 95.34 | 87.73 | 5.38 |
|
28 |
+
| WOST | 2416 | 90.94 | 97.41 | 92.50 | 5.39 |
|
29 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
30 |
+
| Combined | 14315 | 92.84 | 97.93 | 94.09 | 5.35 |
|
31 |
+
|
32 |
+
|
33 |
+
New set:
|
34 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
35 |
+
|:--------:|----------:|---------:|--------:|-----------:|-------------:|
|
36 |
+
| ArT | 35149 | 86.41 | 95.64 | 93.20 | 5.41 |
|
37 |
+
| COCOv1.4 | 9825 | 82.96 | 94.56 | 87.63 | 5.91 |
|
38 |
+
| Uber | 80551 | 91.71 | 96.59 | 92.23 | 5.36 |
|
39 |
+
|----------|-----------|----------|---------|------------|--------------|
|
40 |
+
| Combined | 125525 | 89.54 | 96.17 | 92.14 | 5.42 |
|
41 |
+
|
42 |
+
|
43 |
+
Time: Total 4051.573532819748s, Average 28.97292286055312ms. Total samples 139840.
|
clip4str_huge_5eef9f86e2.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c0d3f67d337c70d4b46a418ca296fdbe5b178f6712664872f1a1495eea248e8c
|
3 |
+
size 4080917141
|
clip4str_huge_5eef9f86e2_log.txt
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Benchmark (Subset) set:
|
2 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
3 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
4 |
+
| IIIT5k | 3000 | 99.67 | 99.94 | 97.54 | 5.09 |
|
5 |
+
| SVT | 647 | 98.61 | 99.64 | 96.93 | 5.87 |
|
6 |
+
| IC13_1015 | 1015 | 98.92 | 99.59 | 97.82 | 5.32 |
|
7 |
+
| IC15_1811 | 1811 | 91.61 | 97.55 | 94.25 | 5.37 |
|
8 |
+
| IC15_2077 | 2077 | 91.09 | 97.14 | 93.47 | 5.33 |
|
9 |
+
| SVTP | 645 | 98.45 | 99.61 | 96.26 | 5.86 |
|
10 |
+
| CUTE80 | 288 | 99.65 | 99.65 | 97.26 | 5.53 |
|
11 |
+
| HOST | 2416 | 80.55 | 94.82 | 86.80 | 5.37 |
|
12 |
+
| WOST | 2416 | 89.98 | 97.16 | 91.79 | 5.39 |
|
13 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
14 |
+
| Combined | 14315 | 92.39 | 97.84 | 93.68 | 5.35 |
|
15 |
+
|
16 |
+
|
17 |
+
Benchmark set:
|
18 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
19 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
20 |
+
| IIIT5k | 3000 | 99.67 | 99.94 | 97.54 | 5.09 |
|
21 |
+
| SVT | 647 | 98.61 | 99.64 | 96.93 | 5.87 |
|
22 |
+
| IC13_1015 | 1015 | 98.92 | 99.59 | 97.82 | 5.32 |
|
23 |
+
| IC15_1811 | 1811 | 91.61 | 97.55 | 94.25 | 5.37 |
|
24 |
+
| IC15_2077 | 2077 | 91.09 | 97.14 | 93.47 | 5.33 |
|
25 |
+
| SVTP | 645 | 98.45 | 99.61 | 96.26 | 5.86 |
|
26 |
+
| CUTE80 | 288 | 99.65 | 99.65 | 97.26 | 5.53 |
|
27 |
+
| HOST | 2416 | 80.55 | 94.82 | 86.80 | 5.37 |
|
28 |
+
| WOST | 2416 | 89.98 | 97.16 | 91.79 | 5.39 |
|
29 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
30 |
+
| Combined | 14315 | 92.39 | 97.84 | 93.68 | 5.35 |
|
31 |
+
|
32 |
+
|
33 |
+
New set:
|
34 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
35 |
+
|:--------:|----------:|---------:|--------:|-----------:|-------------:|
|
36 |
+
| ArT | 35149 | 86.24 | 95.52 | 92.95 | 5.41 |
|
37 |
+
| COCOv1.4 | 9825 | 82.47 | 94.29 | 87.33 | 5.91 |
|
38 |
+
| Uber | 80551 | 91.19 | 96.40 | 91.74 | 5.36 |
|
39 |
+
|----------|-----------|----------|---------|------------|--------------|
|
40 |
+
| Combined | 125525 | 89.12 | 95.99 | 91.73 | 5.42 |
|
41 |
+
|
42 |
+
|
43 |
+
Time: Total 4061.6468493938446s, Average 29.044957447038364ms. Total samples 139840.
|
clip4str_large_3c9d881b88.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4d1638c057c6cd827c7a048715179f1a7af6a678ae2c9c75ee7fd72b1a1eccc
|
3 |
+
size 1787639049
|
clip4str_large_3c9d881b88_log.txt
ADDED
@@ -0,0 +1,43 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
Benchmark (Subset) set:
|
2 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
3 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
4 |
+
| IIIT5k | 3000 | 99.60 | 99.88 | 97.77 | 5.09 |
|
5 |
+
| SVT | 647 | 98.61 | 99.63 | 97.18 | 5.87 |
|
6 |
+
| IC13_1015 | 1015 | 99.01 | 99.63 | 97.73 | 5.32 |
|
7 |
+
| IC15_1811 | 1811 | 91.88 | 97.52 | 94.77 | 5.37 |
|
8 |
+
| IC15_2077 | 2077 | 91.43 | 97.33 | 94.19 | 5.33 |
|
9 |
+
| SVTP | 645 | 98.14 | 99.44 | 96.42 | 5.86 |
|
10 |
+
| CUTE80 | 288 | 99.65 | 99.94 | 97.37 | 5.54 |
|
11 |
+
| HOST | 2416 | 81.08 | 94.91 | 88.33 | 5.38 |
|
12 |
+
| WOST | 2416 | 90.60 | 97.26 | 93.04 | 5.39 |
|
13 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
14 |
+
| Combined | 14315 | 92.64 | 97.88 | 94.38 | 5.35 |
|
15 |
+
|
16 |
+
|
17 |
+
Benchmark set:
|
18 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
19 |
+
|:---------:|----------:|---------:|--------:|-----------:|-------------:|
|
20 |
+
| IIIT5k | 3000 | 99.60 | 99.88 | 97.77 | 5.09 |
|
21 |
+
| SVT | 647 | 98.61 | 99.63 | 97.18 | 5.87 |
|
22 |
+
| IC13_1015 | 1015 | 99.01 | 99.63 | 97.73 | 5.32 |
|
23 |
+
| IC15_1811 | 1811 | 91.88 | 97.52 | 94.77 | 5.37 |
|
24 |
+
| IC15_2077 | 2077 | 91.43 | 97.33 | 94.19 | 5.33 |
|
25 |
+
| SVTP | 645 | 98.14 | 99.44 | 96.42 | 5.86 |
|
26 |
+
| CUTE80 | 288 | 99.65 | 99.94 | 97.37 | 5.54 |
|
27 |
+
| HOST | 2416 | 81.08 | 94.91 | 88.33 | 5.38 |
|
28 |
+
| WOST | 2416 | 90.60 | 97.26 | 93.04 | 5.39 |
|
29 |
+
|-----------|-----------|----------|---------|------------|--------------|
|
30 |
+
| Combined | 14315 | 92.64 | 97.88 | 94.38 | 5.35 |
|
31 |
+
|
32 |
+
|
33 |
+
New set:
|
34 |
+
| Dataset | # samples | Accuracy | 1 - NED | Confidence | Label Length |
|
35 |
+
|:--------:|----------:|---------:|--------:|-----------:|-------------:|
|
36 |
+
| ArT | 35149 | 86.43 | 95.62 | 93.62 | 5.41 |
|
37 |
+
| COCOv1.4 | 9825 | 82.68 | 94.43 | 88.30 | 5.92 |
|
38 |
+
| Uber | 80551 | 92.20 | 96.79 | 92.85 | 5.37 |
|
39 |
+
|----------|-----------|----------|---------|------------|--------------|
|
40 |
+
| Combined | 125525 | 89.84 | 96.28 | 92.71 | 5.42 |
|
41 |
+
|
42 |
+
|
43 |
+
Time: Total 2185.2176456451416s, Average 15.626556390482992ms. Total samples 139840.
|