Update README.md
Browse files
README.md
CHANGED
|
@@ -8,8 +8,8 @@ license: apache-2.0
|
|
| 8 |
|
| 9 |
### cpp-cpp
|
| 10 |
|
| 11 |
-
* source languages: cpp
|
| 12 |
-
* target languages: cpp
|
| 13 |
* OPUS readme: [cpp-cpp](https://github.com/Helsinki-NLP/Tatoeba-Challenge/tree/master/models/cpp-cpp/README.md)
|
| 14 |
|
| 15 |
* dataset: opus
|
|
@@ -32,3 +32,60 @@ license: apache-2.0
|
|
| 32 |
| Tatoeba-test.multi.multi | 21.1 | 0.369 |
|
| 33 |
| Tatoeba-test.pap-msa.pap.msa | 17.7 | 0.197 |
|
| 34 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8 |
|
| 9 |
### cpp-cpp
|
| 10 |
|
| 11 |
+
* source languages: cpp, (Creoles and pidgins, Portuguese-based)
|
| 12 |
+
* target languages: cpp, (Creoles and pidgins, Portuguese-based)
|
| 13 |
* OPUS readme: [cpp-cpp](https://github.com/Helsinki-NLP/Tatoeba-Challenge/tree/master/models/cpp-cpp/README.md)
|
| 14 |
|
| 15 |
* dataset: opus
|
|
|
|
| 32 |
| Tatoeba-test.multi.multi | 21.1 | 0.369 |
|
| 33 |
| Tatoeba-test.pap-msa.pap.msa | 17.7 | 0.197 |
|
| 34 |
|
| 35 |
+
|
| 36 |
+
### System Info:
|
| 37 |
+
- hf_name: cpp-cpp
|
| 38 |
+
|
| 39 |
+
- source_languages: cpp
|
| 40 |
+
|
| 41 |
+
- target_languages: cpp
|
| 42 |
+
|
| 43 |
+
- opus_readme_url: https://github.com/Helsinki-NLP/Tatoeba-Challenge/tree/master/models/cpp-cpp/README.md
|
| 44 |
+
|
| 45 |
+
- original_repo: Tatoeba-Challenge
|
| 46 |
+
|
| 47 |
+
- tags: ['translation']
|
| 48 |
+
|
| 49 |
+
- prepro: normalization + SentencePiece (spm32k,spm32k)
|
| 50 |
+
|
| 51 |
+
- url_model: https://object.pouta.csc.fi/Tatoeba-MT-models/cpp-cpp/opus-2020-07-26.zip
|
| 52 |
+
|
| 53 |
+
- url_test_set: https://object.pouta.csc.fi/Tatoeba-MT-models/cpp-cpp/opus-2020-07-26.test.txt
|
| 54 |
+
|
| 55 |
+
- src_alpha3: cpp
|
| 56 |
+
|
| 57 |
+
- tgt_alpha3: cpp
|
| 58 |
+
|
| 59 |
+
- short_pair: cpp-cpp
|
| 60 |
+
|
| 61 |
+
- chrF2_score: 0.369
|
| 62 |
+
|
| 63 |
+
- bleu: 21.1
|
| 64 |
+
|
| 65 |
+
- brevity_penalty: 0.882
|
| 66 |
+
|
| 67 |
+
- ref_len: 18.0
|
| 68 |
+
|
| 69 |
+
- src_name: Creoles and pidgins, Portuguese-based
|
| 70 |
+
|
| 71 |
+
- tgt_name: Creoles and pidgins, Portuguese-based
|
| 72 |
+
|
| 73 |
+
- 2m: False
|
| 74 |
+
|
| 75 |
+
- train_date: 2020-07-26 00:00:00
|
| 76 |
+
|
| 77 |
+
- src_alpha2: cpp
|
| 78 |
+
|
| 79 |
+
- tgt_alpha2: cpp
|
| 80 |
+
|
| 81 |
+
- prefer_old: False
|
| 82 |
+
|
| 83 |
+
- long_pair: cpp-cpp
|
| 84 |
+
|
| 85 |
+
- helsinki_git_sha: 480fcbe0ee1bf4774bcbe6226ad9f58e63f6c535
|
| 86 |
+
|
| 87 |
+
- transformers_git_sha: 46e9f53347bbe9e989f0335f98465f30886d8173
|
| 88 |
+
|
| 89 |
+
- port_machine: brutasse
|
| 90 |
+
|
| 91 |
+
- port_time: 2020-08-17-23:07
|