% Bibliography of S. Paumier (IGM linguistics group entries, keys prefixed IGML_).
%
% Conventions used in this file:
%   - one field per line, values delimited by braces;
%   - recurring journal / publisher / conference names are string macros;
%   - accented letters in author and editor names use the BibTeX
%     special-character form, e.g. S{\'e}bastien, so that abbreviating
%     and labelling styles treat the accented letter as one character;
%   - page ranges use a double hyphen;
%   - fields named igm*, lang, pdf, days, labs, typeupe, directeur, encadrant,
%     rapporteur and examinateur are not standard BibTeX fields; standard
%     styles ignore them (presumably consumed by a local style or tool).

% ---------------------------------------------------------------------------
% String macros
% ---------------------------------------------------------------------------

@String{igm_electronic = {electronic version}}
@String{igm_phddoc     = {Th\`ese de doctorat}}
@String{igml           = {I.G.M., Universit\'e de Marne-la-Vall\'ee}}
@String{igml_amsterdam = {Amsterdam/Philadelphia : Benjamins}}
@String{igml_ial       = {Beijing: Institute of Applied Linguistics}}
@String{igmlc_lgc      = {International Conference on Lexis and Grammar}}
@String{igmlj_jap      = {Journal of Applied Linguistics}}
@String{igmlj_linv     = {Lingvisticae Investigationes}}
@String{igmlp_ucl      = {UCL, Presses Universitaires de Louvain}}

% ---------------------------------------------------------------------------
% Journal articles
% ---------------------------------------------------------------------------

@Article{IGML_Pau00,
  author  = {Paumier, S{\'e}bastien},
  title   = {{Nouvelles m\'ethodes pour la recherche d'expressions dans de grands corpus}},
  journal = {Revue {I}nformatique et {S}tatistique dans les {S}ciences humaines},
  year    = {2000},
  volume  = {36},
  pages   = {289--296},
  note    = {Actes des troisi\`emes journ\'ees INTEX, Li\`ege (2000)},
  lang    = {FR},
  editor  = {Dister, Anne}
}

@Article{IGML_Pau01,
  author    = {Paumier, S{\'e}bastien},
  title     = {{Some remarks on the application of a lexicon-grammar}},
  journal   = igmlj_linv,
  year      = {2001},
  volume    = {24},
  pages     = {245--256},
  number    = {2},
  lang      = {EN},
  publisher = igml_amsterdam
}

@Article{IGML_FaiPau07b,
  author  = {Fairon, C{\'e}drick and Paumier, S{\'e}bastien},
  title   = {{De la possibilit\'e de construire un dictionnaire \'electronique du langage SMS}},
  journal = {Cahiers de lexicologie},
  editor  = {Fairon, C{\'e}drick and Lamiroy, B{\'e}atrice},
  year    = {2007},
  volume  = {2},
  number  = {91},
  pages   = {65--72},
  lang    = {FR}
}

@Article{IGML_UllPau06,
  author    = {Ulland, Harald and Paumier, S{\'e}bastien},
  title     = {{Analyse automatique des mots polylexicaux en norv\'egien}},
  journal   = igmlj_linv,
  publisher = igml_amsterdam,
  year      = {2005},
  volume    = {28},
  number    = {2},
  pages     = {255--281},
  lang      = {FR},
  doi       = {10.1075/li.28.2.05ull},
  note      = {DOI: 10.1075/li.28.2.05ull}
}

@Article{IGML_Pau09,
  author    = {Paumier, S{\'e}bastien},
  title     = {{Why academic software should be Open Source}},
  journal   = {INFOtheca: Journal of informatics and librarianship},
  publisher = {Serbian Academic Library Association},
  editor    = {Sedmak, Aleksandar},
  year      = {2009},
  volume    = {X},
  number    = {1-2},
  pages     = {51--54},
  lang      = {EN},
  month     = jun,
  pdf       = {http://www.unilib.bg.ac.yu/zajednica01/english/izdanja/infoteka/br1_2_2009/INFOTHECA_X_1-2_June2009_51a-54a.pdf}
}

@Article{IGML_Pau04b,
  author         = {Paumier, S{\'e}bastien},
  title          = {{Recursive Automata for Syntactic Grammars}},
  journal        = igmlj_jap,
  publisher      = igml_ial,
  editor         = {Laporte, {\'E}ric and Cheng, Ting-Au},
  year           = {2004},
  pages          = {122--131},
  igmrefpreprint = {ISSN 1003-5397},
  igmnote        = {Special issue on Lexicon-Grammar. In Chinese.},
  lang           = {OT},
  note           = {Special issue on Lexicon-Grammar. In Chinese. ISSN 1003-5397}
}

% ---------------------------------------------------------------------------
% Books, book chapters and contributions to collections
% ---------------------------------------------------------------------------

@Book{IGML_FaiKlePau06,
  author    = {Fairon, C{\'e}drick and Klein, Jean-Ren{\'e} and Paumier, S{\'e}bastien},
  title     = {{Le langage SMS. \'Etude d'un corpus informatis\'e \`a partir de l'enqu\^ete ``Faites don de vos SMS \`a la science''}},
  series    = {Cahiers du CENTAL},
  publisher = igmlp_ucl,
  year      = {2006},
  volume    = {3.1},
  lang      = {FR},
  url       = {http://www.i6doc.com/doc/sms}
}

@Book{IGML_FaiKlePau06b,
  author    = {Fairon, C{\'e}drick and Klein, Jean-Ren{\'e} and Paumier, S{\'e}bastien},
  title     = {{SMS pour la science. Corpus de 30.000 SMS et logiciel de consultation}},
  series    = {Cahiers du CENTAL},
  publisher = igmlp_ucl,
  year      = {2006},
  volume    = {3.2},
  lang      = {FR},
  url       = {http://www.i6doc.com/doc/smscd}
}

@InBook{IGML_FaiKlePau06d,
  author     = {Fairon, C{\'e}drick and Klein, Jean-Ren{\'e} and Paumier, S{\'e}bastien},
  title      = {{Le fran\c cais m'a tuer}},
  publisher  = igmlp_ucl,
  year       = {2006},
  pages      = {33--42},
  lang       = {FR},
  igmchapter = {Le langage SMS, r\'ev\'elateur d'1comp\'etence?},
  note       = {Chapter title : Le langage SMS, r\'ev\'elateur d'1comp\'etence?}
}

@InBook{IGML_FaiKlePau08,
  author     = {Fairon, C{\'e}drick and Klein, Jean-Ren{\'e} and Paumier, S{\'e}bastien},
  title      = {{La langue du cyberespace : de la diversit\'e aux normes}},
  publisher  = {Editions L'Harmattan},
  editor     = {Gerbault, Jeannine},
  year       = {2008},
  pages      = {173--184},
  lang       = {FR},
  chapter    = {13},
  igmchapter = {Un corpus transcrit de 30000 SMS fran\c{c}ais},
  note       = {Chapter title : Un corpus transcrit de 30000 SMS fran\c{c}ais}
}

@InCollection{IGML_Pau10,
  author    = {Paumier, S{\'e}bastien},
  title     = {{L'hyper-verbe schtroumpfer}},
  booktitle = {Les tables. La grammaire du fran\c cais par le menu},
  series    = {Les cahiers du CENTAL},
  publisher = igmlp_ucl,
  editor    = {Nakamura, Takuya and Laporte, {\'E}ric and Dister, Anne and Fairon, C{\'e}drick},
  year      = {2010},
  volume    = {6},
  pages     = {309--314},
  lang      = {FR}
}

% ---------------------------------------------------------------------------
% Conference papers and posters
% ---------------------------------------------------------------------------

@InProceedings{IGML_LapPau06,
  author        = {Laporte, {\'E}ric and Paumier, S{\'e}bastien},
  title         = {{Graphes param\'etr\'es et outils de lexicalisation}},
  igmposter     = {true},
  booktitle     = {Poster session of 13eme Colloque sur le traitement automatique des langues naturelles (TALN'06)},
  igmnumconf    = {13},
  igmnumbisconf = {eme},
  igmacroconf   = {TALN},
  igmconf       = {Colloque sur le traitement automatique des langues naturelles},
  publisher     = igmlp_ucl,
  year          = {2006},
  pages         = {532--540},
  month         = apr,
  lang          = {FR},
  address       = {Leuven, Belgique},
  url           = {http://hal.archives-ouvertes.fr/hal-00189668/fr/},
  igmnote       = {Verbum ex Machina. Cahiers du CENTAL 2(1)},
  note          = {Verbum ex Machina. Cahiers du CENTAL 2(1)}
}

@InProceedings{IGML_FaiKlePau06c,
  author    = {Fairon, C{\'e}drick and Klein, Jean-Ren{\'e} and Paumier, S{\'e}bastien},
  title     = {{Un corpus transcrit de 30.000 SMS}},
  booktitle = {CMT},
  igmconf   = {CMT},
  year      = {2006},
  days      = {18-20},
  month     = may,
  lang      = {FR}
}

@InProceedings{IGML_FaiPau06,
  author    = {Fairon, C{\'e}drick and Paumier, S{\'e}bastien},
  title     = {{A framework for real time dictionary updating}},
  igmposter = {true},
  booktitle = {Poster session of LREC},
  igmconf   = {LREC},
  year      = {2006},
  days      = {24-26},
  month     = may,
  lang      = {EN}
}

@InProceedings{IGML_FaiPau06b,
  author    = {Fairon, C{\'e}drick and Paumier, S{\'e}bastien},
  title     = {{A translated corpus of 30,000 French SMS}},
  booktitle = {LREC},
  igmconf   = {LREC},
  year      = {2006},
  days      = {24-26},
  month     = may,
  lang      = {EN}
}

@InProceedings{IGML_FaiPauWat05,
  author        = {Fairon, C{\'e}drick and Paumier, S{\'e}bastien and Watrin, Patrick},
  title         = {{Can we parse without tagging ?}},
  booktitle     = {2nd Language \& Technology Conference (LTC'05)},
  igmnumconf    = {2},
  igmnumbisconf = {nd},
  igmacroconf   = {LTC},
  igmconf       = {Language \& Technology Conference},
  editor        = {Vetulani, Zygmunt},
  year          = {2005},
  pages         = {473--477},
  lang          = {EN},
  days          = {21-23},
  month         = apr,
  pdf           = {http://infolingu.univ-mlv.fr/english/Bibliographie/Articles/ltc_138_fairon.pdf}
}

@InProceedings{IGML_DumPau08,
  author      = {Dumitriu, Dana-Marina and Paumier, S{\'e}bastien},
  title       = {{Requ\^etes linguistiques sur alignements multilingues}},
  booktitle   = {Directia Terminologie si Inginerie Lingvistica (DTIL'08)},
  igmacroconf = {DTIL},
  igmconf     = {Directia Terminologie si Inginerie Lingvistica},
  year        = {2008},
  days        = {28-29},
  month       = feb,
  igmelec     = {true},
  lang        = {FR},
  pdf         = {http://dtil.unilat.org/seminar_bucuresti_2008/actes/paumier_dumitriu.htm},
  igmnote     = {ISBN: 978-9-291220-37-3},
  note        = {ISBN: 978-9-291220-37-3 } # igm_electronic
}

@InProceedings{IGML_FaiPau07,
  author        = {Fairon, C{\'e}drick and Paumier, S{\'e}bastien},
  title         = {{Un corpus SMS est-il un corpus comme les autres ?}},
  booktitle     = {26\`eme } # igmlc_lgc # { (LGC'07)},
  igmnumconf    = {26},
  igmnumbisconf = {\`eme},
  igmacroconf   = {LGC},
  igmconf       = igmlc_lgc,
  editor        = {Camugli Gallardo, Catherine and Constant, Matthieu and Dister, Anne},
  year          = {2007},
  pages         = {209--216},
  days          = {2-6},
  month         = oct,
  lang          = {FR},
  pdf           = {http://infolingu.univ-mlv.fr/Colloques/Bonifacio/proceedings/fairon.pdf}
}

@InProceedings{IGML_Pau04,
  author    = {Paumier, S{\'e}bastien},
  title     = {{Weak Greibach Normal Form of Recursive Transition Networks}},
  booktitle = {Proceedings of Journ\'ees Montoises d'Informatique Th\'eorique},
  igmconf   = {Proceedings of Journ\'ees Montoises d'Informatique Th\'eorique},
  year      = {2004},
  pages     = {304--324},
  lang      = {EN},
  address   = {Li\`ege}
}

@InProceedings{IGML_PauDum08,
  author        = {Paumier, S{\'e}bastien and Dumitriu, Dana-Marina},
  title         = {{Editable text alignments and powerful linguistic queries}},
  booktitle     = {27th } # igmlc_lgc # { (LGC'08)},
  igmnumconf    = {27},
  igmnumbisconf = {th},
  igmacroconf   = {LGC},
  igmconf       = igmlc_lgc,
  editor        = {Constant, Matthieu and Nakamura, Takuya and De Gioia, Michele and Vecchiato, Sara},
  year          = {2008},
  pages         = {117--125},
  lang          = {EN},
  days          = {10-13},
  month         = sep
}

@InProceedings{IGML_Pau03,
  author    = {Paumier, S{\'e}bastien},
  title     = {{A Time-Efficient Token Representation for Parsers}},
  booktitle = {Proceedings of the EACL Workshop on Finite-State Methods in Natural Language Processing},
  igmconf   = {Proceedings of the EACL Workshop on Finite-State Methods in Natural Language Processing},
  year      = {2003},
  pages     = {83--90},
  lang      = {EN},
  address   = {Budapest},
  pdf       = {http://igm.univ-mlv.fr/~paumier/paumier_EACL_2004.pdf}
}

@InProceedings{IGML_VoyNakPau09,
  author      = {Paumier, S{\'e}bastien and Nakamura, Takuya and Voyatzi, Stavroula},
  title       = {{UNITEX, a Corpus Processing System with Multi-Lingual Linguistic Resources}},
  booktitle   = {eLexicography in the 21st century: new challenges, new applications (eLEX'09)},
  igmacroconf = {eLEX},
  igmconf     = {eLexicography in the 21st century: new challenges, new applications},
  year        = {2009},
  pages       = {173--175},
  days        = {22-24},
  month       = oct,
  lang        = {EN}
}

% ---------------------------------------------------------------------------
% Manuals, thesis and reports
% ---------------------------------------------------------------------------

@Manual{IGML_Pau02,
  author  = {Paumier, S{\'e}bastien},
  title   = {{Unitex - Manuel d'utilisation}},
  year    = {2006},
  pages   = {1--217},
  pdf     = {http://igm.univ-mlv.fr/~unitex/ManuelUnitex.pdf},
  igmnote = {Premi\`ere version~: 2004.},
  lang    = {FR},
  note    = {Premi\`ere version~: 2004.}
}

@Misc{IGML_Pau08,
  author  = {Paumier, S{\'e}bastien},
  title   = {{Unitex 2.0 User Manual}},
  year    = {2008},
  month   = oct,
  igmelec = {true},
  pdf     = {http://www-igm.univ-mlv.fr/~unitex/UnitexManual2.0.pdf},
  lang    = {EN},
  note    = igm_electronic
}

@PhDThesis{IGML_Pau03b,
  typeupe     = {PHDTHESIS},
  author      = {Paumier, S{\'e}bastien},
  labs        = {3210},
  title       = {{De la reconnaissance de formes linguistiques \`a l'analyse syntaxique}},
  type        = igm_phddoc,
  igmtype     = {igm_phdDoc},
  igmlocal    = {true},
  school      = {Universit\'e de Marne-la-Vall\'ee},
  directeur   = {Gross, Maurice},
  encadrant   = {Guenthner, Franz},
  rapporteur  = {Choffrut, Christian and Guenthner, Franz},
  examinateur = {Laporte, \'Eric and Nam, Jee-sun and Perrin, Dominique},
  abstract    = {La plupart des descriptions des langues naturelles consistent en une accumulation de r\`{e}gles d\'{e}crivant le comportement des diff\'{e}rents \'{e}l\'{e}ments du langage.
    Cependant, si beaucoup de r\`{e}gles g\'{e}n\'{e}rales ont \'{e}t\'{e} \'{e}tablies, leurs exceptions n'ont pratiquement pas \'{e}t\'{e} \'{e}tudi\'{e}es, ce qui fait que ces descriptions sont incompl\`{e}tes, voire erron\'{e}es lorsque le nombre de cas particuliers n'est pas n\'{e}gligeable.
    Pour rem\'{e}dier \`{a} cela, un examen minutieux des phrases \'{e}l\'{e}mentaires du fran\c{c}ais a \'{e}t\'{e} men\'{e} au LADL.
    Ces travaux ont abouti \`{a} une description tr\`{e}s fine des propri\'{e}t\'{e}s syntaxiques de ces phrases, cod\'{e}e sous la forme de matrices appel\'{e}es tables de lexique-grammaire.
    En 1993, il a \'{e}t\'{e} montr\'{e} que l'on pouvait exploiter les donn\'{e}es de ces tables pour effectuer l'analyse automatique de phrases simples.
    Nous avons \'{e}tudi\'{e} un moyen d'\'{e}tendre ces travaux, de fa\c{c}on \`{a} traiter exhaustivement les donn\'{e}es du lexique-grammaire, afin de pouvoir analyser n'importe quelle phrase simple du fran\c{c}ais.
    Le traitement complet de toutes ces constructions est une op\'{e}ration qui prendra beaucoup de temps, ce qui nous a conduit \`{a} nous poser la question de la maintenance de donn\'{e}es \`{a} long terme.
    Nous avons ainsi pris le parti d'utiliser un formalisme de description tr\`{e}s simple, celui des grammaires locales, afin que les donn\'{e}es soient repr\'{e}sent\'{e}es d'une fa\c{c}on la plus claire possible, et qu'elles puissent \^{e}tre maintenues facilement.
    Dans un premier temps, nous avons test\'{e} la puissance de description de notre mod\`{e}le, \`{a} travers l'examen de diverses constructions.
    Bien que simple, il s'est av\'{e}r\'{e} bien adapt\'{e} \`{a} la description de structures syntaxiques, et a mis en \'{e}vidence le fait que la distinction entre la recherche de motifs et l'analyse syntaxique n'est qu'une question d'\'{e}chelle de description.
    En contrepartie de cette simplicit\'e, nous avons du faire face aux probl\`{e}mes informatique soulev\'{e}s par l'exploitation de nos grammaires, en particulier \`{a} cause des ordres de grandeur atteints par les donn\'{e}es accumul\'{e}es.
    Nous avons donc \'{e}tudi\'{e} dans un second temps diff\'{e}rentes m\'{e}thodes permettant de manipuler ces donn\'{e}es, les unes mettant en jeu des transformations op\'{e}rant sur les grammaires, les autres concernant les programmes destin\'{e}s \`{a} les appliquer.
    Les r\'{e}sultats que nous avons obtenus montrent que notre mod\`{e}le est viable, et que l'accumulation des grammaires d\'{e}crivant toutes les structures de phrases simples du fran\c{c}ais est r\'{e}alisable, ce qui devrait permettre, \`{a} terme, d'obtenir un analyseur syntaxique exact pour ces constructions.},
  year        = {2003},
  days        = {4},
  month       = jul,
  igmnbpages  = {197},
  pdf         = {http://www-igm.univ-mlv.fr/labinfo/theses/2003/paumier1.ps.gz},
  keywords    = {recherche de motifs, lexique-grammaire, analyse syntaxique, grammaires syntaxiques, transducteurs alg\'{e}briques \'{e}tendus, traitement des langues naturelles (TALN), forme normale de Greibach, r\'{e}seaux de transitions r\'{e}cursifs (RTN).},
  lang        = {FR},
  note        = {Jury : Gross, Maurice, Guenthner, Franz, Choffrut, Christian and Guenthner, Franz, Laporte, \'Eric and Nam, Jee-sun and Perrin, Dominique (197 pp.)}
}

@TechReport{IGML_Pau00b,
  author      = {Paumier, S{\'e}bastien},
  title       = {{Recherche d'expressions dans de grands corpus: le syst\`eme AGLAE}},
  institution = igml,
  year        = {2000},
  lang        = {FR},
  igmnote     = {M\'emoire de DEA},
  note        = {M\'emoire de DEA}
}