|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||
java.lang.Object
rita.support.Featured
rita.RiString
public class RiString
RiTa's version of the Java String object (both implement the CharSequence interface) with support for 'features': key-value pairs that contain additional information about the object. For example, you can add part-of-speech, phonemes, syllables, and stress features to a RiString object as follows:
RiString rs = new RiString("The dog was white");
RiAnalyzer ra = new RiAnalyzer();
ra.analyze(rs);
System.out.println(rs.getFeature("syllables"));
System.out.println(rs.getFeature("phonemes"));
System.out.println(rs.getFeature("stresses"));
System.out.println(rs.getFeature("pos"));
| Field Summary |
|---|
| Fields inherited from class rita.support.Featured |
|---|
CHUNKS, PARSE, VALUE_UNKNOWN |
| Fields inherited from interface processing.core.PConstants |
|---|
A, AB, ADD, AG, ALPHA, ALPHA_MASK, ALT, AMBIENT, AR, ARC, ARGB, ARROW, B, BACKSPACE, BASELINE, BEEN_LIT, BEVEL, BLEND, BLUE_MASK, BLUR, BOTTOM, BOX, BURN, CENTER, CENTER_DIAMETER, CENTER_RADIUS, CHATTER, CLOSE, CMYK, CODED, COMPLAINT, CONTROL, CORNER, CORNERS, CROSS, CUSTOM, DA, DARKEST, DB, DEG_TO_RAD, DELETE, DG, DIAMETER, DIFFERENCE, DILATE, DIRECTIONAL, DISABLE_ACCURATE_TEXTURES, DISABLE_DEPTH_SORT, DISABLE_DEPTH_TEST, DISABLE_OPENGL_2X_SMOOTH, DISABLE_OPENGL_ERROR_REPORT, DODGE, DOWN, DR, DXF, EB, EDGE, EG, ELLIPSE, ENABLE_ACCURATE_TEXTURES, ENABLE_DEPTH_SORT, ENABLE_DEPTH_TEST, ENABLE_NATIVE_FONTS, ENABLE_OPENGL_2X_SMOOTH, ENABLE_OPENGL_4X_SMOOTH, ENABLE_OPENGL_ERROR_REPORT, ENTER, EPSILON, ER, ERODE, ERROR_BACKGROUND_IMAGE_FORMAT, ERROR_BACKGROUND_IMAGE_SIZE, ERROR_PUSHMATRIX_OVERFLOW, ERROR_PUSHMATRIX_UNDERFLOW, ERROR_TEXTFONT_NULL_PFONT, ESC, EXCLUSION, G, GIF, GRAY, GREEN_MASK, HALF_PI, HAND, HARD_LIGHT, HINT_COUNT, HSB, IMAGE, INVERT, JAVA2D, JPEG, LEFT, LIGHTEST, LINE, LINES, LINUX, MACOSX, MAX_FLOAT, MAX_INT, MIN_FLOAT, MIN_INT, MITER, MODEL, MULTIPLY, NORMAL, NORMALIZED, NX, NY, NZ, OPAQUE, OPEN, OPENGL, ORTHOGRAPHIC, OTHER, OVERLAY, P2D, P3D, PATH, PDF, PERSPECTIVE, PI, platformNames, POINT, POINTS, POLYGON, POSTERIZE, PROBLEM, PROJECT, QUAD, QUAD_STRIP, QUADS, QUARTER_PI, R, RAD_TO_DEG, RADIUS, RECT, RED_MASK, REPLACE, RETURN, RGB, RIGHT, ROUND, SA, SB, SCREEN, SG, SHAPE, SHIFT, SHINE, SOFT_LIGHT, SPB, SPG, SPHERE, SPOT, SPR, SQUARE, SR, SUBTRACT, SW, TAB, TARGA, THIRD_PI, THRESHOLD, TIFF, TOP, TRIANGLE, TRIANGLE_FAN, TRIANGLE_STRIP, TRIANGLES, TWO_PI, TX, TY, TZ, U, UP, V, VERTEX_FIELD_COUNT, VW, VX, VY, VZ, WAIT, WHITESPACE, WINDOWS, X, Y, Z |
| Constructor Summary | |
|---|---|
RiString(java.lang.CharSequence s)
|
|
RiString(processing.core.PApplet p,
java.lang.CharSequence s)
Included only for consistency's sake |
|
| Method Summary | |
|---|---|
char |
charAt(int index)
|
int |
compareTo(java.lang.Object arg0)
|
int |
compareTo(java.lang.String anotherString)
|
int |
compareToIgnoreCase(java.lang.String str)
|
java.lang.String |
concat(java.lang.String str)
|
boolean |
contains(java.lang.CharSequence s)
|
boolean |
contentEquals(java.lang.StringBuilder sb)
|
RiString |
copy()
Creates and returns a copy of this object |
static RiString |
copy(RiString riString)
Creates and returns a copy of riString |
static void |
delete(RiString text)
|
void |
dump()
|
boolean |
endsWith(java.lang.String suffix)
|
boolean |
equals(java.lang.Object anObject)
|
boolean |
equalsIgnoreCase(java.lang.String anotherString)
|
int |
firstIndexOf(java.lang.String word)
Returns the index of the first token matching word
or -1 if not found |
static RiString[] |
fromCollection(java.util.Collection c)
|
static RiString[] |
fromStrings(java.lang.String[] s)
|
byte[] |
getBytes()
|
byte[] |
getBytes(java.lang.String charsetName)
|
void |
getChars(int srcBegin,
int srcEnd,
char[] dst,
int dstBegin)
|
java.lang.String |
getPos()
Returns a String of part-of-speech tags, 1 per word, using the default WordTokenizer & PosParser, delimited by spaces. |
java.lang.String |
getPos(boolean useWordNetTags)
|
java.lang.String |
getPos(java.lang.String delim)
Returns a String of part-of-speech tags, 1 per word, using the default WordTokenizer & PosParser, delimited by delim. |
java.lang.String |
getPos(java.lang.String delim,
boolean useWordNetTags)
Returns a String of part-of-speech tags, 1 per word, using the default WordTokenizer & PosParser, delimited by delim. |
java.lang.String[] |
getPosArr(boolean useWordNetTags)
Returns an array of part-of-speech tags, one per word, using the default WordTokenizer & PosParser... |
java.lang.String |
getPosAt(int wordIdx)
Returns the part-of-speech at wordIdx using the default
WordTokenizer & PosParser... |
java.lang.String |
getPosAt(int wordIdx,
boolean useWordNetTags)
Returns the part-of-speech at wordIdx using the default
WordTokenizer & PosParser... |
java.lang.String |
getText()
|
java.lang.String |
getWordAt(int wordIdx)
Returns the word at wordIdx using the default WordTokenizer. |
int |
getWordCount()
Returns the # of words in the object according to the default WordTokenizer. |
java.lang.String[] |
getWords()
Returns the array of words in the object, via a call to RiTa.tokenize(). |
int |
hashCode()
|
int |
indexOf(int ch)
|
int |
indexOf(int ch,
int fromIndex)
|
int |
indexOf(java.lang.String str)
|
int |
indexOf(java.lang.String str,
int fromIndex)
|
boolean |
insertWordAt(java.lang.String newWord,
int wordIdx)
Inserts newWord at wordIdx
and shifts each subsequent word accordingly. |
java.lang.String |
intern()
|
FeaturedIF |
join(RiString[] fstrs,
java.lang.String regex)
|
int |
lastIndexOf(int ch)
|
int |
lastIndexOf(int ch,
int fromIndex)
|
int |
lastIndexOf(java.lang.String str)
|
int |
lastIndexOf(java.lang.String str,
int fromIndex)
|
int |
length()
|
static void |
main(java.lang.String[] args)
|
boolean |
matches(java.lang.String regex)
|
static boolean |
regexMatch(java.lang.String patternStr,
java.lang.String fullStr)
Utility method to test whether a String partially matches a regex pattern. |
static java.lang.String |
regexReplace(java.lang.String patternStr,
java.lang.String fullStr,
java.lang.String replaceStr)
Utility method to do regex replacement on a String |
boolean |
regionMatches(boolean ignoreCase,
int toffset,
java.lang.String other,
int ooffset,
int len)
|
boolean |
regionMatches(int toffset,
java.lang.String other,
int ooffset,
int len)
|
java.lang.String |
replace(char oldChar,
char newChar)
|
java.lang.String |
replace(java.lang.CharSequence target,
java.lang.CharSequence replacement)
|
void |
replace(java.lang.String oldText,
java.lang.String newText)
Replaces all instances of oldText with
newText in the object. |
java.lang.String |
replaceAll(java.lang.String regex,
java.lang.String replacement)
|
java.lang.String |
replaceByPos(java.lang.String newWord,
java.lang.String pos)
Randomly chooses from all words matching pos
and replaces a random one with newWord. |
boolean |
replaceCharAt(int idx,
java.lang.String replaceWith)
Replaces the character at 'idx' with 'replaceWith'. |
java.lang.String |
replaceFirst(java.lang.String regex,
java.lang.String replacement)
|
boolean |
replaceWordAt(java.lang.String newWord,
int wordIdx)
Replaces the word at wordIdx
with newWord. |
void |
setString(java.lang.CharSequence[] words)
|
void |
setString(java.lang.String newWord)
|
void |
setText(java.lang.String _text)
Sets the current text to this String |
RiString[] |
split()
Splits the RiString as per String.split(), then checks for
any features with the same number of elements as the resulting String[] and adds
the appropriate feature to each newly created RiString in the array. Example: 'only a handful of responses' / {chunk=noun-phrase}, {pos=rb dt nn in nns} -> 'only' / {pos=rb} 'a' / {pos=dt} 'handful' / {pos=nn} 'of' / {pos=in} 'responses' / {pos=nns} |
RiString[] |
split(java.lang.String regex)
Splits the RiString as per String.split(regex), then checks for
any features with the same number of elements as the resulting String[] and adds
the appropriate feature to each individual RiString. Example: 'only a handful of responses' / {chunk=noun-phrase}, {pos=rb dt nn in nns} -> 'only' / {pos=rb} 'a' / {pos=dt} 'handful' / {pos=nn} 'of' / {pos=in} 'responses' / {pos=nns} |
boolean |
startsWith(java.lang.String prefix)
|
boolean |
startsWith(java.lang.String prefix,
int toffset)
|
java.lang.CharSequence |
subSequence(int beginIndex,
int endIndex)
|
java.lang.String |
substring(int beginIndex)
|
java.lang.String |
substring(int beginIndex,
int endIndex)
|
char[] |
toCharArray()
|
java.lang.String |
toLowerCase()
|
java.lang.String |
toLowerCase(java.util.Locale locale)
|
java.lang.String |
toString()
|
java.lang.String |
toUpperCase()
|
java.lang.String |
toUpperCase(java.util.Locale locale)
|
java.lang.String |
trim()
|
| Methods inherited from class rita.support.Featured |
|---|
addFeature, addFeature, appendFeature, asFeature, asFeature, asFeature, asFeature, asFeature, clearFeatures, getAvailableFeatures, getFeature, getFeatures, getFeatures, getId, hasFeature, removeFeature, setFeatures, toStrings |
| Methods inherited from class java.lang.Object |
|---|
getClass, notify, notifyAll, wait, wait, wait |
| Methods inherited from interface rita.support.FeaturedIF |
|---|
addFeature, clearFeatures, getAvailableFeatures, getFeature, getFeatures, hasFeature, removeFeature, setFeatures |
| Constructor Detail |
|---|
public RiString(processing.core.PApplet p,
java.lang.CharSequence s)
public RiString(java.lang.CharSequence s)
| Method Detail |
|---|
public static void delete(RiString text)
public void setText(java.lang.String _text)
public int firstIndexOf(java.lang.String word)
Returns the index of the first token matching word
or -1 if not found
public int getWordCount()
getWords()
public java.lang.String[] getWords()
RiTa.tokenize(String)
public boolean insertWordAt(java.lang.String newWord,
int wordIdx)
Inserts newWord at wordIdx
and shifts each subsequent word accordingly. Returns true
if the insertion was successful, or false if the index does not exist.
public boolean replaceWordAt(java.lang.String newWord,
int wordIdx)
Replaces the word at wordIdx
with newWord. Returns true
if the replace was successful, or false
if the index does not exist.
public static java.lang.String regexReplace(java.lang.String patternStr,
java.lang.String fullStr,
java.lang.String replaceStr)
patternStr - regex
fullStr - String to check
replaceStr - String to insert
Pattern
public static boolean regexMatch(java.lang.String patternStr,
java.lang.String fullStr)
patternStr - regex String
fullStr - String to check
Pattern
public java.lang.String replaceByPos(java.lang.String newWord,
java.lang.String pos)
Randomly chooses from all words matching pos
and replaces a random one with newWord.
Returns the replaced word, or null if no substitution
could be made.
public java.lang.String getWordAt(int wordIdx)
Returns the word at wordIdx using the default WordTokenizer.
public java.lang.String getPosAt(int wordIdx)
Returns the part-of-speech at wordIdx using the default
WordTokenizer & PosParser...
public java.lang.String getPosAt(int wordIdx,
boolean useWordNetTags)
Returns the part-of-speech at wordIdx using the default
WordTokenizer & PosParser...
public java.lang.String[] getPosArr(boolean useWordNetTags)
public java.lang.String getPos(java.lang.String delim,
boolean useWordNetTags)
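Returns a String of part-of-speech tags, 1 per word, using the default WordTokenizer & PosParser, delimited by delim.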
public java.lang.String getPos(java.lang.String delim)
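Returns a String of part-of-speech tags, 1 per word, using the default WordTokenizer & PosParser, delimited by delim.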
public java.lang.String getPos()
public java.lang.String getPos(boolean useWordNetTags)
public void replace(java.lang.String oldText,
java.lang.String newText)
Replaces all instances of oldText with
newText in the object.
public RiString[] split()
Splits the RiString as per String.split(), then checks for
any features with the same number of elements as the resulting String[] and adds
the appropriate feature to each newly created RiString in the array.
RiConstants.WORD_BOUNDARY
public RiString[] split(java.lang.String regex)
Splits the RiString as per String.split(regex), then checks for
any features with the same number of elements as the resulting String[] and adds
the appropriate feature to each individual RiString.
RiConstants.WORD_BOUNDARY
public void setString(java.lang.String newWord)
public void setString(java.lang.CharSequence[] words)
public FeaturedIF join(RiString[] fstrs,
java.lang.String regex)
public void dump()
public static RiString copy(RiString riString)
Creates and returns a copy of riString
public RiString copy()
public static RiString[] fromStrings(java.lang.String[] s)
public static RiString[] fromCollection(java.util.Collection c)
public char charAt(int index)
charAt in interface java.lang.CharSequence
public int compareTo(java.lang.Object arg0)
public int compareTo(java.lang.String anotherString)
public int compareToIgnoreCase(java.lang.String str)
public java.lang.String concat(java.lang.String str)
public boolean contains(java.lang.CharSequence s)
public boolean contentEquals(java.lang.StringBuilder sb)
public boolean endsWith(java.lang.String suffix)
public boolean equals(java.lang.Object anObject)
equals in class java.lang.Object
public boolean equalsIgnoreCase(java.lang.String anotherString)
public byte[] getBytes()
public byte[] getBytes(java.lang.String charsetName)
throws java.io.UnsupportedEncodingException
java.io.UnsupportedEncodingException
public void getChars(int srcBegin,
int srcEnd,
char[] dst,
int dstBegin)
public int hashCode()
hashCode in class java.lang.Object
public int indexOf(int ch,
int fromIndex)
public int indexOf(int ch)
public int indexOf(java.lang.String str,
int fromIndex)
public int indexOf(java.lang.String str)
public java.lang.String intern()
public int lastIndexOf(int ch,
int fromIndex)
public int lastIndexOf(int ch)
public int lastIndexOf(java.lang.String str,
int fromIndex)
public int lastIndexOf(java.lang.String str)
public int length()
length in interface java.lang.CharSequence
public boolean matches(java.lang.String regex)
public boolean regionMatches(boolean ignoreCase,
int toffset,
java.lang.String other,
int ooffset,
int len)
public boolean regionMatches(int toffset,
java.lang.String other,
int ooffset,
int len)
public java.lang.String replace(char oldChar,
char newChar)
public java.lang.String replace(java.lang.CharSequence target,
java.lang.CharSequence replacement)
public java.lang.String replaceAll(java.lang.String regex,
java.lang.String replacement)
public java.lang.String replaceFirst(java.lang.String regex,
java.lang.String replacement)
public boolean replaceCharAt(int idx,
java.lang.String replaceWith)
public boolean startsWith(java.lang.String prefix,
int toffset)
public boolean startsWith(java.lang.String prefix)
public java.lang.CharSequence subSequence(int beginIndex,
int endIndex)
subSequence in interface java.lang.CharSequence
public java.lang.String substring(int beginIndex,
int endIndex)
public java.lang.String substring(int beginIndex)
public char[] toCharArray()
public java.lang.String toLowerCase()
public java.lang.String toLowerCase(java.util.Locale locale)
public java.lang.String toString()
toString in interface java.lang.CharSequence
toString in class Featured
public java.lang.String getText()
getText in interface FeaturedIF
getText in class Featured
public java.lang.String toUpperCase()
public java.lang.String toUpperCase(java.util.Locale locale)
public java.lang.String trim()
public static void main(java.lang.String[] args)
|
|||||||||
| PREV CLASS NEXT CLASS | FRAMES NO FRAMES | ||||||||
| SUMMARY: NESTED | FIELD | CONSTR | METHOD | DETAIL: FIELD | CONSTR | METHOD | ||||||||