Title : ( An Overview of Text Mining in Language Studies: The Computational Approach to Text Analytics )
Authors: Hadi Masjedy, Seyyed Mohammad Reza Adel, Seyyed Mohammad Reza Amirian, Gholamreza Zareian
Abstract
'Text mining' refers to the computational process of unstructured text analytics for extracting latent linguistic layers and themes. It is especially significant as a form of content or thematic analysis in descriptive and interpretive studies. This process begins with structuring simple texts and proceeds with summarizing, classifying, modelling, evaluating and interpreting the inherent textual concepts and patterns. Given that this method counts as an interdisciplinary innovation, especially in discoursal studies, it is to be pursued more intensively in academic studies. Despite the multitude of English studies in this area, there has been little interest to date in text mining amongst Iranian researchers, as evidenced by the critically limited number of local Persian and English studies. Thus, by looking into the theory and practice of text mining and its major analytic tools and methods in Persian and English, this paper aims to prepare the ground for utilizing this methodology in language studies.
Keywords
Text mining, unstructured texts, content analysis, thematic analysis, natural language processing

@comment{BibTeX record for the article described above. Author names are given
in "Last, First" form using the romanized spellings from the Authors line.}
@article{paperid:1105063,
  author   = {Masjedy, Hadi and Adel, Seyyed Mohammad Reza and Amirian, Seyyed Mohammad Reza and Zareian, Gholamreza},
  title    = {An Overview of Text Mining in Language Studies: The Computational Approach to Text Analytics},
  journal  = {جستارهای زبانی},
  year     = {2022},
  volume   = {12},
  number   = {6},
  month    = jan,
  issn     = {2322-3081},
  pages    = {499--531},
  numpages = {32},
  keywords = {Text mining; unstructured texts; content analysis; thematic analysis; natural language processing},
}
%0 Journal Article
%T An Overview of Text Mining in Language Studies: The Computational Approach to Text Analytics
%A Masjedy, Hadi
%A Adel, Seyyed Mohammad Reza
%A Amirian, Seyyed Mohammad Reza
%A Zareian, Gholamreza
%J جستارهای زبانی
%@ 2322-3081
%D 2022
%V 12
%N 6
%P 499-531
