@article{aup:/content/journals/10.5117/TVT2016.3.PAND, author = "Pander Maat, Henk and Dekker, Nick", title = "Tekstgenres analyseren op lexicale complexiteit met T‑Scan", journal= "Tijdschrift voor Taalbeheersing", year = "2016", volume = "38", number = "3", pages = "263-304", doi = "https://doi.org/10.5117/TVT2016.3.PAND", url = "https://www.aup-online.com/content/journals/10.5117/TVT2016.3.PAND", publisher = "Amsterdam University Press", issn = "2352-1236", type = "Journal Article", keywords = "stylistic variation", keywords = "automatic text analysis", keywords = "lexical complexity", keywords = "readability", keywords = "corpus research", abstract = "Abstract Using T-Scan to analyse the lexical complexity of text genres T-Scan is a tool for the automatic analysis of Dutch text. This paper presents the first large-scale corpus analysis with T-Scan, focusing on lexical complexity. A collection of nearly 1000 text specimens was assembled, containing ten genres: travel blogs, celebrity news features, novels, textbooks for vocational secondary schools, textbooks for general secondary schools, news reports, opinion pieces, political programs, medical advice texts and research articles. The lexical complexity features in the analysis include morphology, word frequency, various word concreteness indices, personal pronouns, names and verb tense. Systematic genre differences are found, such that a genre detection model comprising 18 T-Scan features correctly identifies 83 percent of the corpus texts. Most lexical features differentiating genres intuitively relate to text topic complexity. A closer analysis is offered of the contrast between the two textbook samples in the corpus, which differ only in the educational levels they cater for. Again, topic variation seems a more important factor than stylistic variation. We demonstrate a new method to examine stylistic variation, which consists of within-genre comparisons using the genre prediction; more specifically, ‘deviant’ texts are compared to ‘typical’ members of their genre.", }