bourdoiscatie
committed on
Commit
•
f87838c
1
Parent(s):
d35847e
Update README.md
Browse files
README.md
CHANGED
@@ -1276,27 +1276,35 @@ The following hyperparameters were used during training:
|
|
1276 |
|
1277 |
### NERmembert-base-3entities
|
1278 |
```
|
1279 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1280 |
```
|
1281 |
|
1282 |
### multiconer
|
1283 |
-
|
1284 |
-
|
1285 |
title={{SemEval-2023 Task 2: Fine-grained Multilingual Named Entity Recognition (MultiCoNER 2)}},
|
1286 |
author={Fetahu, Besnik and Kar, Sudipta and Chen, Zhiyu and Rokhlenko, Oleg and Malmasi, Shervin},
|
1287 |
booktitle={Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023)},
|
1288 |
year={2023},
|
1289 |
publisher={Association for Computational Linguistics}}
|
1290 |
|
1291 |
-
|
1292 |
title={{MultiCoNER v2: a Large Multilingual dataset for Fine-grained and Noisy Named Entity Recognition}},
|
1293 |
author={Fetahu, Besnik and Chen, Zhiyu and Kar, Sudipta and Rokhlenko, Oleg and Malmasi, Shervin},
|
1294 |
year={2023}}
|
1295 |
-
|
1296 |
|
1297 |
### multinerd
|
1298 |
-
|
1299 |
-
|
1300 |
title = "{M}ulti{NERD}: A Multilingual, Multi-Genre and Fine-Grained Dataset for Named Entity Recognition (and Disambiguation)",
|
1301 |
author = "Tedeschi, Simone and Navigli, Roberto",
|
1302 |
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2022",
|
@@ -1307,21 +1315,22 @@ TODO
|
|
1307 |
url = "https://aclanthology.org/2022.findings-naacl.60",
|
1308 |
doi = "10.18653/v1/2022.findings-naacl.60",
|
1309 |
pages = "801--812"}
|
1310 |
-
|
1311 |
|
1312 |
### pii-masking-200k
|
1313 |
-
|
1314 |
-
|
1315 |
-
author = { {ai4Privacy} },
|
1316 |
-
title = { pii-masking-200k (Revision 1d4c0a1) },
|
1317 |
-
year = 2023,
|
1318 |
-
url = { https://huggingface.co/datasets/ai4privacy/pii-masking-200k },
|
1319 |
-
doi = { 10.57967/hf/1532 },
|
1320 |
-
publisher = { Hugging Face }}
|
|
|
1321 |
|
1322 |
### wikiann
|
1323 |
-
|
1324 |
-
|
1325 |
title = "Massively Multilingual Transfer for {NER}",
|
1326 |
author = "Rahimi, Afshin and Li, Yuan and Cohn, Trevor",
|
1327 |
booktitle = "Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics",
|
@@ -1331,34 +1340,44 @@ publisher = { Hugging Face }}
|
|
1331 |
publisher = "Association for Computational Linguistics",
|
1332 |
url = "https://www.aclweb.org/anthology/P19-1015",
|
1333 |
pages = "151--164"}
|
|
|
1334 |
|
1335 |
### wikiner
|
1336 |
-
|
1337 |
-
|
1338 |
-
title = {Learning multilingual named entity recognition from Wikipedia},
|
1339 |
-
journal = {Artificial Intelligence},
|
1340 |
-
volume = {194},
|
1341 |
-
pages = {151-175},
|
1342 |
-
year = {2013},
|
1343 |
-
note = {Artificial Intelligence, Wikipedia and Semi-Structured Resources},
|
1344 |
-
issn = {0004-3702},
|
1345 |
-
doi = {https://doi.org/10.1016/j.artint.2012.03.006},
|
1346 |
-
url = {https://www.sciencedirect.com/science/article/pii/S0004370212000276},
|
1347 |
-
author = {Joel Nothman and Nicky Ringland and Will Radford and Tara Murphy and James R. Curran}}
|
1348 |
-
|
1349 |
|
1350 |
### frenchNER_3entities
|
1351 |
```
|
1352 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1353 |
```
|
1354 |
|
1355 |
### CamemBERT
|
1356 |
-
|
|
|
1357 |
title={CamemBERT: a Tasty French Language Model},
|
1358 |
author={Martin, Louis and Muller, Benjamin and Su{\'a}rez, Pedro Javier Ortiz and Dupont, Yoann and Romary, Laurent and de la Clergerie, {\'E}ric Villemonte and Seddah, Djam{\'e} and Sagot, Beno{\^\i}t},
|
1359 |
booktitle={Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
|
1360 |
year={2020}}
|
1361 |
-
|
1362 |
|
1363 |
## License
|
1364 |
[cc-by-4.0](https://creativecommons.org/licenses/by/4.0/deed.en)
|
|
|
1276 |
|
1277 |
### NERmembert-base-3entities
|
1278 |
```
|
1279 |
+
@misc {NERmembert2024,
|
1280 |
+
author = { BOURDOIS, Loïck },
|
1281 |
+
organization = { {Centre Aquitain des Technologies de l'Information et Electroniques} },
|
1282 |
+
title = { NERmembert-base-3entities },
|
1283 |
+
year = 2024,
|
1284 |
+
url = { https://huggingface.co/CATIE-AQ/NERmembert-base-3entities },
|
1285 |
+
doi = { 10.57967/hf/1752 },
|
1286 |
+
publisher = { Hugging Face }
|
1287 |
+
}
|
1288 |
```
|
1289 |
|
1290 |
### multiconer
|
1291 |
+
```
|
1292 |
+
@inproceedings{multiconer2-report,
|
1293 |
title={{SemEval-2023 Task 2: Fine-grained Multilingual Named Entity Recognition (MultiCoNER 2)}},
|
1294 |
author={Fetahu, Besnik and Kar, Sudipta and Chen, Zhiyu and Rokhlenko, Oleg and Malmasi, Shervin},
|
1295 |
booktitle={Proceedings of the 17th International Workshop on Semantic Evaluation (SemEval-2023)},
|
1296 |
year={2023},
|
1297 |
publisher={Association for Computational Linguistics}}
|
1298 |
|
1299 |
+
@article{multiconer2-data,
|
1300 |
title={{MultiCoNER v2: a Large Multilingual dataset for Fine-grained and Noisy Named Entity Recognition}},
|
1301 |
author={Fetahu, Besnik and Chen, Zhiyu and Kar, Sudipta and Rokhlenko, Oleg and Malmasi, Shervin},
|
1302 |
year={2023}}
|
1303 |
+
```
|
1304 |
|
1305 |
### multinerd
|
1306 |
+
```
|
1307 |
+
@inproceedings{tedeschi-navigli-2022-multinerd,
|
1308 |
title = "{M}ulti{NERD}: A Multilingual, Multi-Genre and Fine-Grained Dataset for Named Entity Recognition (and Disambiguation)",
|
1309 |
author = "Tedeschi, Simone and Navigli, Roberto",
|
1310 |
booktitle = "Findings of the Association for Computational Linguistics: NAACL 2022",
|
|
|
1315 |
url = "https://aclanthology.org/2022.findings-naacl.60",
|
1316 |
doi = "10.18653/v1/2022.findings-naacl.60",
|
1317 |
pages = "801--812"}
|
1318 |
+
```
|
1319 |
|
1320 |
### pii-masking-200k
|
1321 |
+
```
|
1322 |
+
@misc {ai4privacy_2023,
|
1323 |
+
author = { {ai4Privacy} },
|
1324 |
+
title = { pii-masking-200k (Revision 1d4c0a1) },
|
1325 |
+
year = 2023,
|
1326 |
+
url = { https://huggingface.co/datasets/ai4privacy/pii-masking-200k },
|
1327 |
+
doi = { 10.57967/hf/1532 },
|
1328 |
+
publisher = { Hugging Face }}
|
1329 |
+
```
|
1330 |
|
1331 |
### wikiann
|
1332 |
+
```
|
1333 |
+
@inproceedings{rahimi-etal-2019-massively,
|
1334 |
title = "Massively Multilingual Transfer for {NER}",
|
1335 |
author = "Rahimi, Afshin and Li, Yuan and Cohn, Trevor",
|
1336 |
booktitle = "Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics",
|
|
|
1340 |
publisher = "Association for Computational Linguistics",
|
1341 |
url = "https://www.aclweb.org/anthology/P19-1015",
|
1342 |
pages = "151--164"}
|
1343 |
+
```
|
1344 |
|
1345 |
### wikiner
|
1346 |
+
```
|
1347 |
+
@article{NOTHMAN2013151,
|
1348 |
+
title = {Learning multilingual named entity recognition from Wikipedia},
|
1349 |
+
journal = {Artificial Intelligence},
|
1350 |
+
volume = {194},
|
1351 |
+
pages = {151--175},
|
1352 |
+
year = {2013},
|
1353 |
+
note = {Artificial Intelligence, Wikipedia and Semi-Structured Resources},
|
1354 |
+
issn = {0004-3702},
|
1355 |
+
doi = {10.1016/j.artint.2012.03.006},
|
1356 |
+
url = {https://www.sciencedirect.com/science/article/pii/S0004370212000276},
|
1357 |
+
author = {Joel Nothman and Nicky Ringland and Will Radford and Tara Murphy and James R. Curran}}
|
1358 |
+
```
|
1359 |
|
1360 |
### frenchNER_3entities
|
1361 |
```
|
1362 |
+
@misc {frenchNER2024,
|
1363 |
+
author = { BOURDOIS, Loïck },
|
1364 |
+
organization = { {Centre Aquitain des Technologies de l'Information et Electroniques} },
|
1365 |
+
title = { frenchNER_3entities },
|
1366 |
+
year = 2024,
|
1367 |
+
url = { https://huggingface.co/CATIE-AQ/frenchNER_3entities },
|
1368 |
+
doi = { 10.57967/hf/1751 },
|
1369 |
+
publisher = { Hugging Face }
|
1370 |
+
}
|
1371 |
```
|
1372 |
|
1373 |
### CamemBERT
|
1374 |
+
```
|
1375 |
+
@inproceedings{martin2020camembert,
|
1376 |
title={CamemBERT: a Tasty French Language Model},
|
1377 |
author={Martin, Louis and Muller, Benjamin and Su{\'a}rez, Pedro Javier Ortiz and Dupont, Yoann and Romary, Laurent and de la Clergerie, {\'E}ric Villemonte and Seddah, Djam{\'e} and Sagot, Beno{\^\i}t},
|
1378 |
booktitle={Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics},
|
1379 |
year={2020}}
|
1380 |
+
```
|
1381 |
|
1382 |
## License
|
1383 |
[cc-by-4.0](https://creativecommons.org/licenses/by/4.0/deed.en)
|