天天看点

将HTML数字字符引用（形如 &#12525; 的十进制编码）转换为Java字符串的函数

  1. import java.util.regex.*;
  /**
   * Decodes decimal HTML numeric character references (for example
   * {@code &#12525;}) embedded in a string into the characters they denote.
   *
   * <p>Only the decimal form {@code &#NNNN;} is recognized; hexadecimal
   * references ({@code &#xNNNN;}) and named entities ({@code &amp;}) are left
   * untouched.
   */
  public class UnicodeCeToJavaString {

    /**
     * Regex source for one decimal numeric character reference, e.g.
     * {@code &#12525;}. Group 1 captures the digits. The digit class must be
     * written {@code \\d} in Java source; forward slashes would match a literal
     * "//" and never match a real reference.
     */
    static final String mbs = "&#(\\d+);";

    /** Compiled once: {@link Pattern} is immutable and safe to share. */
    private static final Pattern ENTITY_PATTERN = Pattern.compile(mbs);

    /**
     * Replaces every decimal numeric character reference in {@code paramStr}
     * with the character it encodes.
     *
     * <p>References whose number is not a valid Unicode code point (including
     * values too large for an {@code int}) are copied to the output unchanged.
     *
     * @param paramStr text that may contain {@code &#NNNN;} references; must not
     *     be {@code null}
     * @return {@code paramStr} with all decodable references replaced
     * @throws NullPointerException if {@code paramStr} is {@code null}
     */
    public static String EncodeCesToChars(String paramStr) {
      if (paramStr == null) {
        throw new NullPointerException("paramStr");
      }
      Matcher mat = ENTITY_PATTERN.matcher(paramStr);
      StringBuilder sb = new StringBuilder(paramStr.length());
      int copiedUpTo = 0;
      // Splice by index instead of Matcher.appendReplacement: that method gives
      // '$' and '\' special meaning in the replacement text, which breaks when
      // the decoded character is itself '$' (&#36;) or '\' (&#92;).
      while (mat.find()) {
        sb.append(paramStr, copiedUpTo, mat.start());
        sb.append(getMbCharStr(mat.group(1)));
        copiedUpTo = mat.end();
      }
      sb.append(paramStr, copiedUpTo, paramStr.length());
      return sb.toString();
    }

    /**
     * Converts the digit part of a numeric character reference (the
     * {@code "12525"} in {@code &#12525;}) into the string for that code point.
     *
     * @param digits decimal Unicode code point value as text
     * @return a one-character string for BMP code points, a two-character
     *     surrogate pair for supplementary code points, or the reference text
     *     {@code "&#" + digits + ";"} when {@code digits} is not a valid code point
     */
    static String getMbCharStr(String digits) {
      try {
        int codePoint = Integer.parseInt(digits);
        if (Character.isValidCodePoint(codePoint)) {
          // toChars yields a surrogate pair above U+FFFF; a plain (char) cast
          // would silently truncate the value to 16 bits.
          return new String(Character.toChars(codePoint));
        }
      } catch (NumberFormatException ignored) {
        // Not a number that fits in an int: fall through and keep the
        // reference verbatim rather than emitting a NUL character.
      }
      return "&#" + digits + ";";
    }
  }