% Hathout, Sajous and Tanguy (2009): WAC5 workshop paper on collecting new
% French deverbal nouns from the Web.
%
% Maintenance notes:
%   - Case protection is applied to whole words only (proper nouns and
%     acronyms); names and the abstract need no protection.
%   - `month` uses the predefined three-letter macro so that styles can
%     localise it; `pages` uses the en-dash form (double hyphen).
%   - `day` is not a standard BibTeX field; it is kept as supplied for tools
%     that read it.
%   - NOTE(review): `address` records the place as given in the source record
%     (French spelling, presumably the conference venue) -- confirm whether it
%     should be normalised for the target bibliography language.
@inproceedings{HathoutEtAl2009-WAC5,
  author    = {Hathout, Nabil and Sajous, Franck and Tanguy, Ludovic},
  title     = {Looking for {French} deverbal nouns in an evolving {Web} (a short history of {WAC})},
  booktitle = {Proceedings of {WAC5}: {Fifth Workshop on Web As Corpus}},
  pages     = {37--44},
  address   = {San-Sebastian, Espagne},
  day       = {07},
  month     = sep,
  year      = {2009},
  abstract  = {This paper describes an 8-year-long research effort for automatically collecting new French deverbal nouns on the Web. The goal has remained the same: building an extensive and cumulative list of noun-verb pairs where the noun denotes the action expressed by the verb (e.g. production - produce). This list is used for both linguistic research and for NLP applications. The initial method consisted in taking advantage of the former Altavista search engine, allowing for a direct access to unknown word forms. The second technique led us to develop a specific crawler, which raised a number of technical difficulties. In the third experiment, we use a collection of web pages made available to us by a commercial search engine. Through all these stages, the general method has remained the same, and the results are similar and cumulative, although the technical environment has greatly evolved.},
}