예제 #1
1
 /**
  * Given a string, return an array of tokens. The separator can be escaped with the '\' character.
  * The '\' character may also be escaped by the '\' character.
  *
  * @param s the string to tokenize.
  * @param separator the separator char.
  * @param maxTokens the maxmimum number of tokens returned. If the max is reached, the remaining
  *     part of s is appended to the end of the last token.
  * @return an array of tokens.
  */
 public static String[] tokenize(String s, char separator, int maxTokens) {
   List tokens = new ArrayList();
   StringBuilder token = new StringBuilder();
   boolean prevIsEscapeChar = false;
   for (int i = 0; i < s.length(); i += Character.charCount(i)) {
     int currentChar = s.codePointAt(i);
     if (prevIsEscapeChar) {
       // Case 1:  escaped character
       token.appendCodePoint(currentChar);
       prevIsEscapeChar = false;
     } else if (currentChar == separator && tokens.size() < maxTokens - 1) {
       // Case 2:  separator
       tokens.add(token.toString());
       token = new StringBuilder();
     } else if (currentChar == '\\') {
       // Case 3:  escape character
       prevIsEscapeChar = true;
     } else {
       // Case 4:  regular character
       token.appendCodePoint(currentChar);
     }
   }
   if (token.length() > 0) {
     tokens.add(token.toString());
   }
   return (String[]) tokens.toArray(new String[] {});
 }
 protected String makeSpace(int len) {
   if (len <= 0) {
     return "";
   }
   StringBuilder sb = new StringBuilder(len);
   for (int i = 0; i < len; i++) {
     sb.append(' ');
   }
   return sb.toString();
 }
예제 #3
0
 /**
  * Convert the name to a valid HTML name.
  *
  * @param name the name that needs to be converted to valid HTML name.
  * @return a valid HTML name string.
  */
 public String getName(String name) {
   StringBuilder sb = new StringBuilder();
   char ch;
   /* The HTML 4 spec at http://www.w3.org/TR/html4/types.html#h-6.2 mentions
    * that the name/id should begin with a letter followed by other valid characters.
    * The HTML 5 spec (draft) is more permissive on names/ids where the only restriction
    * is that it should be at least one character long and should not contain spaces.
    * The spec draft is @ http://www.w3.org/html/wg/drafts/html/master/dom.html#the-id-attribute.
    *
    * For HTML 4, we need to check for non-characters at the beginning of the name and
    * substitute it accordingly, "_" and "$" can appear at the beginning of a member name.
    * The method substitutes "$" with "Z:Z:D" and will prefix "_" with "Z:Z".
    */
   for (int i = 0; i < name.length(); i++) {
     ch = name.charAt(i);
     switch (ch) {
       case '(':
       case ')':
       case '<':
       case '>':
       case ',':
         sb.append('-');
         break;
       case ' ':
       case '[':
         break;
       case ']':
         sb.append(":A");
         break;
         // Any appearance of $ needs to be substituted with ":D" and not with hyphen
         // since a field name "P$$ and a method P(), both valid member names, can end
         // up as "P--". A member name beginning with $ needs to be substituted with
         // "Z:Z:D".
       case '$':
         if (i == 0) sb.append("Z:Z");
         sb.append(":D");
         break;
         // A member name beginning with _ needs to be prefixed with "Z:Z" since valid anchor
         // names can only begin with a letter.
       case '_':
         if (i == 0) sb.append("Z:Z");
         sb.append(ch);
         break;
       default:
         sb.append(ch);
     }
   }
   return sb.toString();
 }