dc.contributor.author |
Sumam, Mary Idicula |
|
dc.contributor.author |
Soumya, S |
|
dc.contributor.author |
Manju, K |
|
dc.date.accessioned |
2014-07-17T09:42:13Z |
|
dc.date.available |
2014-07-17T09:42:13Z |
|
dc.date.issued |
2009 |
|
dc.identifier.uri |
http://dyuthi.cusat.ac.in/purl/4090 |
|
dc.description |
2009 International Conference on Advances in Recent Technologies in Communication and Computing |
en_US |
dc.description.abstract |
A Parts of Speech tagger for Malayalam which uses
a stochastic approach has been proposed. The tagger makes
use of word frequencies and bigram statistics from a corpus.
The morphological analyzer is used to generate a tagged
corpus due to the unavailability of an annotated corpus in
Malayalam. Although the experiments have been performed on
a very small corpus, the results have shown that the statistical
approach works well with a highly agglutinative language like
Malayalam. |
en_US |
dc.description.sponsorship |
Cochin University of Science and Technology |
en_US |
dc.language.iso |
en |
en_US |
dc.publisher |
IEEE |
en_US |
dc.subject |
Dravidian Language |
en_US |
dc.subject |
Morphemes |
en_US |
dc.subject |
HMM |
en_US |
dc.subject |
Viterbi |
en_US |
dc.subject |
Tagset |
en_US |
dc.title |
Development Of A POS Tagger For Malayalam - An Experience |
en_US |
dc.type |
Article |
en_US |