CharsetUtils.java
/* * Copyright (c) 2013. * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package com.example.kjdemo.utils; import org.apache.http.protocol.HTTP; import java.util.ArrayList; import java.util.List; /** * Created by wyouflf on 13-8-30. */ public class CharsetUtils { private CharsetUtils() { } public static String toCharset(final String str, final String charset, int judgeCharsetLength) { try { String oldCharset = getEncoding(str, judgeCharsetLength); return new String(str.getBytes(oldCharset), charset); } catch (Throwable ex) { LogUtils.w(ex); return str; } } public static String getEncoding(final String str, int judgeCharsetLength) { String encode = CharsetUtils.DEFAULT_ENCODING_CHARSET; for (String charset : SUPPORT_CHARSET) { if (isCharset(str, charset, judgeCharsetLength)) { encode = charset; break; } } return encode; } public static boolean isCharset(final String str, final String charset, int judgeCharsetLength) { try { String temp = str.length() > judgeCharsetLength ? str.substring(0, judgeCharsetLength) : str; return temp.equals(new String(temp.getBytes(charset), charset)); } catch (Throwable e) { return false; } } public static final String DEFAULT_ENCODING_CHARSET = HTTP.DEFAULT_CONTENT_CHARSET; public static final List<String> SUPPORT_CHARSET = new ArrayList<String>(); static { SUPPORT_CHARSET.add("ISO-8859-1"); SUPPORT_CHARSET.add("GB2312"); SUPPORT_CHARSET.add("GBK"); SUPPORT_CHARSET.add("GB18030"); SUPPORT_CHARSET.add("US-ASCII"); SUPPORT_CHARSET.add("ASCII"); SUPPORT_CHARSET.add("ISO-2022-KR"); SUPPORT_CHARSET.add("ISO-8859-2"); SUPPORT_CHARSET.add("ISO-2022-JP"); SUPPORT_CHARSET.add("ISO-2022-JP-2"); SUPPORT_CHARSET.add("UTF-8"); } }