Update README.md
Browse files
README.md
CHANGED
|
@@ -1276,27 +1276,35 @@ The following hyperparameters were used during training:
|
|
| 1276 |
|
| 1277 |
### NERmembert-base-3entities
|
| 1278 |
```
|
| 1279 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1280 |
```
|
| 1281 |
|
| 1282 |
### multiconer
|
| 1283 |
-
|
| 1284 |
-
|
| 1285 |
title={{SemEval-2023 Task 2: Fine-grained Multilingual Named Entity Recognition (MultiCoNER 2)}},
|
| 1286 |
author={Fetahu, Besnik and Kar, Sudipta and Chen, Zhiyu and Rokhlenko, Oleg and Malmasi, Shervin},
|
| 1287 |
booktitle={Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023)},
|
| 1288 |
year={2023},
|
| 1289 |
publisher={Association for Computational Linguistics}}
|
| 1290 |
|
| 1291 |
-
|
| 1292 |
title={{MultiCoNER v2: a Large Multilingual dataset for Fine-grained and Noisy Named Entity Recognition}},
|
| 1293 |
author={Fetahu, Besnik and Chen, Zhiyu and Kar, Sudipta and Rokhlenko, Oleg and Malmasi, Shervin},
|
| 1294 |
year={2023}}
|
| 1295 |
-
|
| 1296 |
|
| 1297 |
### multinerd
|
| 1298 |
-
|
| 1299 |
-
|
| 1300 |
title = "{M}ulti{NERD}: A Multilingual, Multi-Genre and Fine-Grained Dataset for Named Entity Recognition (and Disambiguation)",
|
| 1301 |
author = "Tedeschi, Simone and Navigli, Roberto",
|
| 1302 |
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2022",
|
|
@@ -1307,21 +1315,22 @@ TODO
|
|
| 1307 |
url = "https://aclanthology.org/2022.findings-naacl.60",
|
| 1308 |
doi = "10.18653/v1/2022.findings-naacl.60",
|
| 1309 |
pages = "801--812"}
|
| 1310 |
-
|
| 1311 |
|
| 1312 |
### pii-masking-200k
|
| 1313 |
-
|
| 1314 |
-
|
| 1315 |
-
author = { {ai4Privacy} },
|
| 1316 |
-
title = { pii-masking-200k (Revision 1d4c0a1) },
|
| 1317 |
-
year = 2023,
|
| 1318 |
-
url = { https://huggingface.co/datasets/ai4privacy/pii-masking-200k },
|
| 1319 |
-
doi = { 10.57967/hf/1532 },
|
| 1320 |
-
publisher = { Hugging Face }}
|
|
|
|
| 1321 |
|
| 1322 |
### wikiann
|
| 1323 |
-
|
| 1324 |
-
|
| 1325 |
title = "Massively Multilingual Transfer for {NER}",
|
| 1326 |
author = "Rahimi, Afshin and Li, Yuan and Cohn, Trevor",
|
| 1327 |
booktitle = "Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics",
|
|
@@ -1331,34 +1340,44 @@ publisher = { Hugging Face }}
|
|
| 1331 |
publisher = "Association for Computational Linguistics",
|
| 1332 |
url = "https://www.aclweb.org/anthology/P19-1015",
|
| 1333 |
pages = "151--164"}
|
|
|
|
| 1334 |
|
| 1335 |
### wikiner
|
| 1336 |
-
|
| 1337 |
-
|
| 1338 |
-
title = {Learning multilingual named entity recognition from Wikipedia},
|
| 1339 |
-
journal = {Artificial Intelligence},
|
| 1340 |
-
volume = {194},
|
| 1341 |
-
pages = {151-175},
|
| 1342 |
-
year = {2013},
|
| 1343 |
-
note = {Artificial Intelligence, Wikipedia and Semi-Structured Resources},
|
| 1344 |
-
issn = {0004-3702},
|
| 1345 |
-
doi = {https://doi.org/10.1016/j.artint.2012.03.006},
|
| 1346 |
-
url = {https://www.sciencedirect.com/science/article/pii/S0004370212000276},
|
| 1347 |
-
author = {Joel Nothman and Nicky Ringland and Will Radford and Tara Murphy and James R. Curran}}
|
| 1348 |
-
|
| 1349 |
|
| 1350 |
### frenchNER_3entities
|
| 1351 |
```
|
| 1352 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1353 |
```
|
| 1354 |
|
| 1355 |
### CamemBERT
|
| 1356 |
-
|
|
|
|
| 1357 |
title={CamemBERT: a Tasty French Language Model},
|
| 1358 |
author={Martin, Louis and Muller, Benjamin and Su{\'a}rez, Pedro Javier Ortiz and Dupont, Yoann and Romary, Laurent and de la Clergerie, {\'E}ric Villemonte and Seddah, Djam{\'e} and Sagot, Beno{\^\i}t},
|
| 1359 |
booktitle={Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
|
| 1360 |
year={2020}}
|
| 1361 |
-
|
| 1362 |
|
| 1363 |
## License
|
| 1364 |
[cc-by-4.0](https://creativecommons.org/licenses/by/4.0/deed.en)
|
|
|
|
| 1276 |
|
| 1277 |
### NERmembert-base-3entities
|
| 1278 |
```
|
| 1279 |
+
@misc {NERmembert2024,
|
| 1280 |
+
author = { BOURDOIS, Loïck },
|
| 1281 |
+
organization = { {Centre Aquitain des Technologies de l'Information et Electroniques} },
|
| 1282 |
+
title = { NERmembert-base-3entities },
|
| 1283 |
+
year = 2024,
|
| 1284 |
+
url = { https://huggingface.co/CATIE-AQ/NERmembert-base-3entities },
|
| 1285 |
+
doi = { 10.57967/hf/1752 },
|
| 1286 |
+
publisher = { Hugging Face }
|
| 1287 |
+
}
|
| 1288 |
```
|
| 1289 |
|
| 1290 |
### multiconer
|
| 1291 |
+
```
|
| 1292 |
+
@inproceedings{multiconer2-report,
|
| 1293 |
title={{SemEval-2023 Task 2: Fine-grained Multilingual Named Entity Recognition (MultiCoNER 2)}},
|
| 1294 |
author={Fetahu, Besnik and Kar, Sudipta and Chen, Zhiyu and Rokhlenko, Oleg and Malmasi, Shervin},
|
| 1295 |
booktitle={Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023)},
|
| 1296 |
year={2023},
|
| 1297 |
publisher={Association for Computational Linguistics}}
|
| 1298 |
|
| 1299 |
+
@article{multiconer2-data,
|
| 1300 |
title={{MultiCoNER v2: a Large Multilingual dataset for Fine-grained and Noisy Named Entity Recognition}},
|
| 1301 |
author={Fetahu, Besnik and Chen, Zhiyu and Kar, Sudipta and Rokhlenko, Oleg and Malmasi, Shervin},
|
| 1302 |
year={2023}}
|
| 1303 |
+
```
|
| 1304 |
|
| 1305 |
### multinerd
|
| 1306 |
+
```
|
| 1307 |
+
@inproceedings{tedeschi-navigli-2022-multinerd,
|
| 1308 |
title = "{M}ulti{NERD}: A Multilingual, Multi-Genre and Fine-Grained Dataset for Named Entity Recognition (and Disambiguation)",
|
| 1309 |
author = "Tedeschi, Simone and Navigli, Roberto",
|
| 1310 |
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2022",
|
|
|
|
| 1315 |
url = "https://aclanthology.org/2022.findings-naacl.60",
|
| 1316 |
doi = "10.18653/v1/2022.findings-naacl.60",
|
| 1317 |
pages = "801--812"}
|
| 1318 |
+
```
|
| 1319 |
|
| 1320 |
### pii-masking-200k
|
| 1321 |
+
```
|
| 1322 |
+
@misc {ai4privacy_2023,
|
| 1323 |
+
author = { {ai4Privacy} },
|
| 1324 |
+
title = { pii-masking-200k (Revision 1d4c0a1) },
|
| 1325 |
+
year = 2023,
|
| 1326 |
+
url = { https://huggingface.co/datasets/ai4privacy/pii-masking-200k },
|
| 1327 |
+
doi = { 10.57967/hf/1532 },
|
| 1328 |
+
publisher = { Hugging Face }}
|
| 1329 |
+
```
|
| 1330 |
|
| 1331 |
### wikiann
|
| 1332 |
+
```
|
| 1333 |
+
@inproceedings{rahimi-etal-2019-massively,
|
| 1334 |
title = "Massively Multilingual Transfer for {NER}",
|
| 1335 |
author = "Rahimi, Afshin and Li, Yuan and Cohn, Trevor",
|
| 1336 |
booktitle = "Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics",
|
|
|
|
| 1340 |
publisher = "Association for Computational Linguistics",
|
| 1341 |
url = "https://www.aclweb.org/anthology/P19-1015",
|
| 1342 |
pages = "151--164"}
|
| 1343 |
+
```
|
| 1344 |
|
| 1345 |
### wikiner
|
| 1346 |
+
```
|
| 1347 |
+
@article{NOTHMAN2013151,
|
| 1348 |
+
title = {Learning multilingual named entity recognition from Wikipedia},
|
| 1349 |
+
journal = {Artificial Intelligence},
|
| 1350 |
+
volume = {194},
|
| 1351 |
+
pages = {151--175},
|
| 1352 |
+
year = {2013},
|
| 1353 |
+
note = {Artificial Intelligence, Wikipedia and Semi-Structured Resources},
|
| 1354 |
+
issn = {0004-3702},
|
| 1355 |
+
doi = {10.1016/j.artint.2012.03.006},
|
| 1356 |
+
url = {https://www.sciencedirect.com/science/article/pii/S0004370212000276},
|
| 1357 |
+
author = {Joel Nothman and Nicky Ringland and Will Radford and Tara Murphy and James R. Curran}}
|
| 1358 |
+
```
|
| 1359 |
|
| 1360 |
### frenchNER_3entities
|
| 1361 |
```
|
| 1362 |
+
@misc {frenchNER2024,
|
| 1363 |
+
author = { BOURDOIS, Loïck },
|
| 1364 |
+
organization = { {Centre Aquitain des Technologies de l'Information et Electroniques} },
|
| 1365 |
+
title = { frenchNER_3entities },
|
| 1366 |
+
year = 2024,
|
| 1367 |
+
url = { https://huggingface.co/CATIE-AQ/frenchNER_3entities },
|
| 1368 |
+
doi = { 10.57967/hf/1751 },
|
| 1369 |
+
publisher = { Hugging Face }
|
| 1370 |
+
}
|
| 1371 |
```
|
| 1372 |
|
| 1373 |
### CamemBERT
|
| 1374 |
+
```
|
| 1375 |
+
@inproceedings{martin2020camembert,
|
| 1376 |
title={CamemBERT: a Tasty French Language Model},
|
| 1377 |
author={Martin, Louis and Muller, Benjamin and Su{\'a}rez, Pedro Javier Ortiz and Dupont, Yoann and Romary, Laurent and de la Clergerie, {\'E}ric Villemonte and Seddah, Djam{\'e} and Sagot, Beno{\^\i}t},
|
| 1378 |
booktitle={Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
|
| 1379 |
year={2020}}
|
| 1380 |
+
```
|
| 1381 |
|
| 1382 |
## License
|
| 1383 |
[cc-by-4.0](https://creativecommons.org/licenses/by/4.0/deed.en)
|