|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |
java.lang.Object
  extended by kr.ac.kaist.swrc.jhannanum.share.TagSet
public class TagSet
Morpheme tag set.
Field Summary | |
---|---|
java.lang.String |
author
the author of tag set |
java.lang.String |
copyright
the copyright of tag set |
java.lang.String |
date
the last update date of tag set |
java.lang.String |
editor
the editor of the tag set |
int[] |
indexTags
the list of index tags |
int |
IRR_TYPE_B
'ㅂ' irregular |
int |
IRR_TYPE_D
'ㄷ' irregular |
int |
IRR_TYPE_H
'ㅎ' irregular |
int |
IRR_TYPE_REO
'러' irregular |
int |
IRR_TYPE_REU
'르' irregular |
int |
IRR_TYPE_S
'ㅅ' irregular |
private java.util.ArrayList<java.lang.String> |
irregularList
the irregular rule list |
int |
iwgTag
the start tag |
int |
numTag
the number tag |
static int |
PHONEME_TYPE_ALL
phoneme type - all |
static int |
TAG_SET_KAIST
KAIST tag set |
static int |
TAG_TYPE_ADJS
tag type - adjective |
static int |
TAG_TYPE_ALL
tag type - all |
static int |
TAG_TYPE_COUNT
the number of tag types |
static int |
TAG_TYPE_EOMIES
tag type - eomi(ending) |
static int |
TAG_TYPE_JOSA
tag type - josa(particle) |
static int |
TAG_TYPE_JP
tag type - predicative particle |
static int |
TAG_TYPE_NBNP
tag type - bound noun |
static int |
TAG_TYPE_NOUNS
tag type - noun |
static int |
TAG_TYPE_NPS
tag type - pronoun |
static int |
TAG_TYPE_VERBS
tag type - verb |
static int |
TAG_TYPE_YONGS
tag type - yongeon(verb, adjective) |
private java.util.ArrayList<java.lang.String> |
tagList
the morpheme tag list |
private java.util.HashMap<java.lang.String,int[]> |
tagSetMap
the hash map for the group of tags |
private int[][] |
tagTypeTable
the table for tag types |
java.lang.String |
title
the name of tag set |
int |
unkTag
the unknown tag |
int[] |
unkTags
the list of unknown tags |
java.lang.String |
version
the version of tag set |
Constructor Summary | |
---|---|
TagSet()
Constructor. |
Method Summary | |
---|---|
boolean |
checkPhonemeType(int phonemeType,
int phoneme)
Checks the phoneme type. |
boolean |
checkTagType(int tagType,
int tag)
Checks the morpheme tag type. |
void |
clear()
Clears the loaded data. |
int |
getIrregularID(java.lang.String irregular)
Returns the ID of the specified irregular rule. |
java.lang.String |
getIrregularName(int irregularID)
Returns the name of the irregular rule for the specified ID. |
int |
getTagCount()
Returns the number of morpheme tags loaded. |
int |
getTagID(java.lang.String tag)
Returns the ID of the morpheme tag. |
java.lang.String |
getTagName(int tagID)
Returns the tag name for the specified ID. |
int[] |
getTags(java.lang.String tagSetName)
Returns the morpheme tags in the specified tag group. |
void |
init(java.lang.String filePath,
int tagSetFlag)
Reads the tag set file, and initializes the object. |
void |
setTagTypes(int tagSetFlag)
Sets the tag types. |
Methods inherited from class java.lang.Object |
---|
clone, equals, finalize, getClass, hashCode, notify, notifyAll, toString, wait, wait, wait |
Field Detail |
---|
public static final int TAG_SET_KAIST
public static final int TAG_TYPE_ALL
public static final int TAG_TYPE_VERBS
public static final int TAG_TYPE_NOUNS
public static final int TAG_TYPE_NPS
public static final int TAG_TYPE_ADJS
public static final int TAG_TYPE_NBNP
public static final int TAG_TYPE_JOSA
public static final int TAG_TYPE_YONGS
public static final int TAG_TYPE_EOMIES
public static final int TAG_TYPE_JP
public static final int TAG_TYPE_COUNT
public static final int PHONEME_TYPE_ALL
public java.lang.String title
public java.lang.String version
public java.lang.String copyright
public java.lang.String author
public java.lang.String date
public java.lang.String editor
private java.util.ArrayList<java.lang.String> tagList
private java.util.ArrayList<java.lang.String> irregularList
private java.util.HashMap<java.lang.String,int[]> tagSetMap
private int[][] tagTypeTable
public int[] indexTags
public int[] unkTags
public int iwgTag
public int unkTag
public int numTag
public int IRR_TYPE_B
public int IRR_TYPE_S
public int IRR_TYPE_D
public int IRR_TYPE_H
public int IRR_TYPE_REU
public int IRR_TYPE_REO
Constructor Detail |
---|
public TagSet()
Method Detail |
---|
public boolean checkPhonemeType(int phonemeType, int phoneme)
phonemeType - phoneme type
phoneme - phoneme
public boolean checkTagType(int tagType, int tag)
tagType - tag type
tag - morpheme tag
public void clear()
public int getIrregularID(java.lang.String irregular)
irregular - irregular rule
public java.lang.String getIrregularName(int irregularID)
irregularID - the ID of the irregular rule
public int getTagCount()
public int getTagID(java.lang.String tag)
tag - morpheme tag
public java.lang.String getTagName(int tagID)
tagID - the morpheme tag ID
public int[] getTags(java.lang.String tagSetName)
tagSetName - the name of the tag group
public void init(java.lang.String filePath, int tagSetFlag) throws java.io.IOException
filePath - the file for morpheme tag set
Throws: java.io.IOException
public void setTagTypes(int tagSetFlag)
tagSetFlag - the flag for tag set (TAG_SET_KAIST, ..)
|
||||||||||
PREV CLASS NEXT CLASS | FRAMES NO FRAMES | |||||||||
SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD |