tirthadagr8
committed on
Update README.md
Browse files
README.md
CHANGED
@@ -1,8 +1,20 @@
|
|
1 |
---
|
2 |
-
license:
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3 |
---
|
4 |
Made using GPT-Small from scratch for learning purposes.
|
5 |
The tokenizer used is from Gemma 2-2B-JPN-IT, which is trained on a Japanese dataset from JESC.
|
|
|
|
|
|
|
|
|
6 |
```bibtex
|
7 |
@ARTICLE{pryzant_jesc_2018,
|
8 |
author = {{Pryzant}, R. and {Chung}, Y. and {Jurafsky}, D. and {Britz}, D.},
|
@@ -10,4 +22,4 @@ Tokenizer used is from Gemma 2-2B-JPN-IT which is trained on japanese dataset fr
|
|
10 |
journal = {Language Resources and Evaluation Conference (LREC)},
|
11 |
keywords = {Computer Science - Computation and Language},
|
12 |
year = 2018
|
13 |
-
}
|
|
|
1 |
---
|
2 |
+
license: mit
|
3 |
+
datasets:
|
4 |
+
- Hoshikuzu/JESC
|
5 |
+
language:
|
6 |
+
- en
|
7 |
+
- ja
|
8 |
+
base_model:
|
9 |
+
- openai-community/gpt2
|
10 |
+
- google/gemma-2-2b-jpn-it
|
11 |
---
|
12 |
Made using GPT-Small from scratch for learning purposes.
|
13 |
The tokenizer used is from Gemma 2-2B-JPN-IT, which is trained on a Japanese dataset from JESC.
|
14 |
+
|
15 |
+
Model usage:
|
16 |
+
|
17 |
+
|
18 |
```bibtex
|
19 |
@ARTICLE{pryzant_jesc_2018,
|
20 |
author = {{Pryzant}, R. and {Chung}, Y. and {Jurafsky}, D. and {Britz}, D.},
|
|
|
22 |
journal = {Language Resources and Evaluation Conference (LREC)},
|
23 |
keywords = {Computer Science - Computation and Language},
|
24 |
year = 2018
|
25 |
+
}
|