The Sequoia corpus contains French sentences annotated with several kinds of linguistic information: (i) part-of-speech tags, (ii) surface syntactic representations (both constituency trees and dependency trees) and (iii) deep syntactic representations (in the form of deep syntactic dependency graphs).
The Sequoia corpus is distributed under the following licence: LGPL-LR.
If you use this work, please cite the following:
@inproceedings{Candito_Le-corpus-Sequoia-:_2012,
  author    = {Candito, Marie and Seddah, Djam{\'e}},
  title     = {Le corpus {Sequoia} : annotation syntaxique et exploitation pour l'adaptation d'analyseur par pont lexical},
  booktitle = {{TALN} 2012 - 19e conf{\'e}rence sur le Traitement Automatique des Langues Naturelles},
  address   = {Grenoble, France},
  year      = {2012},
  url       = {https://inria.hal.science/hal-00698938},
  hal_pdf   = {https://inria.hal.science/hal-00698938v1/file/canditoseddah-taln2012-final.pdf},
}
@inproceedings{Candito_Effectively-long-distance-dependencies-in_2012,
  author    = {Candito, Marie and Seddah, Djam{\'e}},
  title     = {Effectively long-distance dependencies in {French}: annotation and parsing evaluation},
  booktitle = {{TLT} 11 - The 11th International Workshop on Treebanks and Linguistic Theories},
  address   = {Lisbon, Portugal},
  year      = {2012},
  url       = {https://inria.hal.science/hal-00769625},
  hal_pdf   = {https://inria.hal.science/hal-00769625v1/file/tlt_extraction_final.pdf},
}
@inproceedings{Candito_Deep-Syntax-Annotation-of_2014,
  author    = {Candito, Marie and Perrier, Guy and Guillaume, Bruno and Ribeyre, Corentin and Fort, Karen and Seddah, Djam{\'e} and {Villemonte de La Clergerie}, {\'E}ric},
  title     = {Deep Syntax Annotation of the {Sequoia} {French} Treebank},
  booktitle = {International Conference on Language Resources and Evaluation ({LREC})},
  address   = {Reykjavik, Iceland},
  year      = {2014},
  url       = {https://inria.hal.science/hal-00969191},
  hal_pdf   = {https://inria.hal.science/hal-00969191v2/file/deep_sequoia.final_with_keywords.pdf},
}
@inproceedings{Perrier_Un-sch\'ema-d'annotation-en_2014,
  author    = {Perrier, Guy and Candito, Marie and Guillaume, Bruno and Ribeyre, Corentin and Fort, Karen and Seddah, Djam{\'e}},
  title     = {Un sch{\'e}ma d'annotation en d{\'e}pendances syntaxiques profondes pour le fran{\c c}ais},
  booktitle = {{TALN} - Traitement Automatique des Langues Naturelles},
  address   = {Marseille, France},
  year      = {2014},
  pages     = {574--579},
  url       = {https://inria.hal.science/hal-01054407},
  hal_pdf   = {https://inria.hal.science/hal-01054407v1/file/Paper_P-C.4.pdf},
}