Skip to content

Commit

Permalink
better naming of basicface components
Browse files Browse the repository at this point in the history
  • Loading branch information
brendano committed Oct 22, 2012
1 parent f281da3 commit 51cfae9
Showing 1 changed file with 4 additions and 3 deletions.
7 changes: 4 additions & 3 deletions src/cmu/arktweetnlp/Twokenize.java
Original file line number Diff line number Diff line change
Expand Up @@ -98,11 +98,12 @@ public static String OR(String... parts) {
// @aliciakeys Put it in a love song :-))
// @hellocalyclops =))=))=)) Oh well

// Regex fragments for "basic face" emoticons such as the examples in the comments above.
// NOTE: this span is a rendered diff (4 additions, 3 deletions) without +/- markers, so the
// pre-rename declarations (s1, s2, first basicface) appear next to their replacements
// (bfLeft, bfCenter, bfRight, second basicface). Only one set belongs in a compilable file.

// Pre-rename: one capturing group that matches a single "left side" character of the face.
static String s1 = "(♥|0|o|°|v|\\$|t|x|\\.|;|\\u0CA0|@|ʘ|•|・|◕|\\^|¬|\\*)";
// Pre-rename: the middle (a single '.' or a run of '_' / '-') followed by the backreference \2.
static String s2 = "(?:[\\.]|[_-]+)\\2";
// Post-rename: same string as s1 -- the capturing group for the left side of the face.
static String bfLeft = "(♥|0|o|°|v|\\$|t|x|\\.|;|\\u0CA0|@|ʘ|•|・|◕|\\^|¬|\\*)";
// Post-rename: the middle of the face, a single '.' or one or more '_' / '-' characters.
static String bfCenter = "(?:[\\.]|[_-]+)";
// Post-rename: backreference to capturing group 2 of whatever pattern this is compiled into.
// bfCenter + bfRight is string-identical to s2.
// NOTE(review): bfLeft is the only capturing group visible here, so whether \2 resolves to it
// depends on groups that precede basicface in the enclosing pattern -- confirm at the use site.
static String bfRight = "\\2";
// Matches "--" followed by a single or double quote character.
static String s3 = "(?:--['\"])";
// Matches an angle bracket (literal or HTML-escaped as &lt; / &gt;), then one or more of
// '.', '_' or '-', then another angle bracket.
static String s4 = "(?:<|&lt;|>|&gt;)[\\._-]+(?:<|&lt;|>|&gt;)";
// Pre-rename: three-way alternation; the inline (?i) flag sits inside the first non-capturing
// group, so case-insensitivity applies to the s1+s2 alternative only.
static String basicface = "(?:(?i)" +s1+s2+ ")|" +s3+ "|" + s4;
// Post-rename: builds the same string as the line above from the renamed components.
// The alternation is not wrapped in a group of its own, so callers that concatenate it with
// other fragments need their own grouping.
static String basicface = "(?:(?i)" +bfLeft+bfCenter+bfRight+ ")|" +s3+ "|" + s4;

static String eeLeft = "[\\\\\ƪԄ\\((<>;ヽ\\-=~\\*]+";
static String eeRight= "[\\-=\\);'\\u0022<>ʃ)//ノノ丿╯σっµ~\\*]+";
Expand Down

0 comments on commit 51cfae9

Please sign in to comment.