1ï¼ç®åå¤ææ¯UTF-8æä¸æ¯UTF-8ï¼å 为ä¸è¬é¤äºUTF-8ä¹å¤å°±æ¯GBKï¼æ以就设置é»è®¤ä¸ºGBKã
æç
§ç»å®çå符éåå¨æ件æ¶ï¼å¨æ件çæå¼å¤´çä¸ä¸ªåèä¸å°±æå¯è½åå¨çç¼ç ä¿¡æ¯ï¼æ以ï¼åºæ¬çåçå°±æ¯åªè¦è¯»åºæ件åä¸ä¸ªåèï¼å¤å®è¿äºåèçå¼ï¼å°±å¯ä»¥å¾ç¥å
¶ç¼ç çæ ¼å¼ãå
¶å®ï¼å¦æ项ç®è¿è¡çå¹³å°å°±æ¯ä¸ææä½ç³»ç»ï¼å¦æè¿äºææ¬æ件å¨é¡¹ç®å
产çï¼å³å¼å人åå¯ä»¥æ§å¶ææ¬çç¼ç æ ¼å¼ï¼åªè¦å¤å®ä¸¤ç§å¸¸è§çç¼ç å°±å¯ä»¥äºï¼GBKåUTF-8ãç±äºä¸æWindowsé»è®¤çç¼ç æ¯GBKï¼æ以ä¸è¬åªè¦å¤å®UTF-8ç¼ç æ ¼å¼ã
对äºUTF-8ç¼ç æ ¼å¼çææ¬æ件ï¼å
¶å3个åèçå¼å°±æ¯-17ã-69ã-65ï¼æ以ï¼å¤å®æ¯å¦æ¯UTF-8ç¼ç æ ¼å¼ç代ç ç段å¦ä¸ï¼
[java] view plaincopy
File file = new File(path);
InputStream in= new java.io.FileInputStream(file);
byte[] b = new byte[3];
in.read(b);
in.close();
if (b[0] == -17 && b[1] == -69 && b[2] == -65)
System.out.println(file.getName() + "ï¼ç¼ç 为UTF-8");
else
System.out.println(file.getName() + "ï¼å¯è½æ¯GBKï¼ä¹å¯è½æ¯å
¶ä»ç¼ç ");
2ï¼è¥æ³å®ç°æ´å¤æçæ件ç¼ç æ£æµï¼å¯ä»¥ä½¿ç¨ä¸ä¸ªå¼æºé¡¹ç®cpdetectorï¼å®æå¨çç½åæ¯ï¼
http://cpdetector.sourceforge.net/ãå®çç±»åºå¾å°ï¼åªæ500Kå·¦å³ï¼cpDetectoræ¯åºäºç»è®¡å¦åççï¼ä¸ä¿è¯å®å
¨æ£ç¡®ï¼å©ç¨è¯¥ç±»åºå¤å®ææ¬æ件ç代ç å¦ä¸ï¼
读å¤é¨æ件(å
å©ç¨cpdetectoræ£æµæ件çç¼ç æ ¼å¼ï¼ç¶åç¨æ£æµå°çç¼ç æ¹å¼å»è¯»æ件):
[java] view plaincopy
/**
* å©ç¨ç¬¬ä¸æ¹å¼æºå
cpdetectorè·åæ件ç¼ç æ ¼å¼
*
* @param path
* è¦å¤ææ件ç¼ç æ ¼å¼çæºæ件çè·¯å¾
* @author huanglei
* @version 2012-7-12 14:05
*/
public static String getFileEncode(String path) {
/*
* detectoræ¯æ¢æµå¨ï¼å®ææ¢æµä»»å¡äº¤ç»å
·ä½çæ¢æµå®ç°ç±»çå®ä¾å®æã
* cpDetectorå
ç½®äºä¸äºå¸¸ç¨çæ¢æµå®ç°ç±»ï¼è¿äºæ¢æµå®ç°ç±»çå®ä¾å¯ä»¥éè¿addæ¹æ³ å è¿æ¥ï¼å¦ParsingDetectorã
* JChardetFacadeãASCIIDetectorãUnicodeDetectorã
* detectoræç
§âè°æå
è¿åé空çæ¢æµç»æï¼å°±ä»¥è¯¥ç»æ为åâçååè¿åæ¢æµå°ç
* å符éç¼ç ã使ç¨éè¦ç¨å°ä¸ä¸ªç¬¬ä¸æ¹JARå
ï¼antlr.jarãchardet.jaråcpdetector.jar
* cpDetectoræ¯åºäºç»è®¡å¦åççï¼ä¸ä¿è¯å®å
¨æ£ç¡®ã
*/
CodepageDetectorProxy detector = CodepageDetectorProxy.getInstance();
/*
* ParsingDetectorå¯ç¨äºæ£æ¥HTMLãXMLçæ件æå符æµçç¼ç ,æé æ¹æ³ä¸çåæ°ç¨äº
* æ示æ¯å¦æ¾ç¤ºæ¢æµè¿ç¨ç详ç»ä¿¡æ¯ï¼ä¸ºfalseä¸æ¾ç¤ºã
*/
detector.add(new ParsingDetector(false));
/*
* JChardetFacadeå°è£
äºç±Mozillaç»ç»æä¾çJChardetï¼å®å¯ä»¥å®æ大å¤æ°æ件çç¼ç
* æµå®ãæ以ï¼ä¸è¬æäºè¿ä¸ªæ¢æµå¨å°±å¯æ»¡è¶³å¤§å¤æ°é¡¹ç®çè¦æ±ï¼å¦æä½ è¿ä¸æ¾å¿ï¼å¯ä»¥
* åå¤å å 个æ¢æµå¨ï¼æ¯å¦ä¸é¢çASCIIDetectorãUnicodeDetectorçã
*/
detector.add(JChardetFacade.getInstance());// ç¨å°antlr.jarãchardet.jar
// ASCIIDetectorç¨äºASCIIç¼ç æµå®
detector.add(ASCIIDetector.getInstance());
// UnicodeDetectorç¨äºUnicode家æç¼ç çæµå®
detector.add(UnicodeDetector.getInstance());
java.nio.charset.Charset charset = null;
File f = new File(path);
try {
charset = detector.detectCodepage(f.toURI().toURL());
} catch (Exception ex) {
ex.printStackTrace();
}
if (charset != null)
return charset.name();
else
return null;
}
[java] view plaincopy
String charsetName = getFileEncode(configFilePath);
System.out.println(charsetName);
inputStream = new FileInputStream(configFile);
BufferedReader in = new BufferedReader(new InputStreamReader(inputStream, charsetName));
读jarå
å
é¨èµæºæ件(å
å©ç¨cpdetectoræ£æµjarå
é¨çèµæºæ件çç¼ç æ ¼å¼ï¼ç¶å以æ£æµå°çç¼ç æ¹å¼å»è¯»æ件)ï¼
[java] view plaincopy
/**
* å©ç¨ç¬¬ä¸æ¹å¼æºå
cpdetectorè·åURL对åºçæ件ç¼ç
*
* @param path
* è¦å¤ææ件ç¼ç æ ¼å¼çæºæ件çURL
* @author huanglei
* @version 2012-7-12 14:05
*/
public static String getFileEncode(URL url) {
/*
* detectoræ¯æ¢æµå¨ï¼å®ææ¢æµä»»å¡äº¤ç»å
·ä½çæ¢æµå®ç°ç±»çå®ä¾å®æã
* cpDetectorå
ç½®äºä¸äºå¸¸ç¨çæ¢æµå®ç°ç±»ï¼è¿äºæ¢æµå®ç°ç±»çå®ä¾å¯ä»¥éè¿addæ¹æ³ å è¿æ¥ï¼å¦ParsingDetectorã
* JChardetFacadeãASCIIDetectorãUnicodeDetectorã
* detectoræç
§âè°æå
è¿åé空çæ¢æµç»æï¼å°±ä»¥è¯¥ç»æ为åâçååè¿åæ¢æµå°ç
* å符éç¼ç ã使ç¨éè¦ç¨å°ä¸ä¸ªç¬¬ä¸æ¹JARå
ï¼antlr.jarãchardet.jaråcpdetector.jar
* cpDetectoræ¯åºäºç»è®¡å¦åççï¼ä¸ä¿è¯å®å
¨æ£ç¡®ã
*/
CodepageDetectorProxy detector = CodepageDetectorProxy.getInstance();
/*
* ParsingDetectorå¯ç¨äºæ£æ¥HTMLãXMLçæ件æå符æµçç¼ç ,æé æ¹æ³ä¸çåæ°ç¨äº
* æ示æ¯å¦æ¾ç¤ºæ¢æµè¿ç¨ç详ç»ä¿¡æ¯ï¼ä¸ºfalseä¸æ¾ç¤ºã
*/
detector.add(new ParsingDetector(false));
/*
* JChardetFacadeå°è£
äºç±Mozillaç»ç»æä¾çJChardetï¼å®å¯ä»¥å®æ大å¤æ°æ件çç¼ç
* æµå®ãæ以ï¼ä¸è¬æäºè¿ä¸ªæ¢æµå¨å°±å¯æ»¡è¶³å¤§å¤æ°é¡¹ç®çè¦æ±ï¼å¦æä½ è¿ä¸æ¾å¿ï¼å¯ä»¥
* åå¤å å 个æ¢æµå¨ï¼æ¯å¦ä¸é¢çASCIIDetectorãUnicodeDetectorçã
*/
detector.add(JChardetFacade.getInstance());// ç¨å°antlr.jarãchardet.jar
// ASCIIDetectorç¨äºASCIIç¼ç æµå®
detector.add(ASCIIDetector.getInstance());
// UnicodeDetectorç¨äºUnicode家æç¼ç çæµå®
detector.add(UnicodeDetector.getInstance());
java.nio.charset.Charset charset = null;
try {
charset = detector.detectCodepage(url);
} catch (Exception ex) {
ex.printStackTrace();
}
if (charset != null)
return charset.name();
else
return null;
}
[java] view plaincopy
URL url = CreateStationTreeModel.class.getResource("/resource/" + "é
ç½®æ件");
URLConnection urlConnection = url.openConnection();
inputStream=urlConnection.getInputStream();
String charsetName = getFileEncode(url);
System.out.println(charsetName);
BufferedReader in = new BufferedReader(new InputStreamReader(inputStream, charsetName));
3ï¼æ¢æµä»»æè¾å
¥çææ¬æµçç¼ç ï¼æ¹æ³æ¯è°ç¨å
¶é载形å¼ï¼
[java] view plaincopy
charset=detector.detectCodepage(å¾
æµçææ¬è¾å
¥æµ,æµé该æµæéç读å
¥åèæ°);
ä¸é¢çåèæ°ç±ç¨åºåæå®ï¼åèæ°è¶å¤ï¼å¤å®è¶åç¡®ï¼å½ç¶æ¶é´ä¹è±å¾è¶é¿ãè¦æ³¨æï¼åèæ°çæå®ä¸è½è¶
è¿ææ¬æµçæ大é¿åº¦ã
4ï¼å¤å®æ件ç¼ç çå
·ä½åºç¨ä¸¾ä¾ï¼
å±æ§æ件(.properties)æ¯Javaç¨åºä¸ç常ç¨ææ¬åå¨æ¹å¼ï¼è±¡STRUTSæ¡æ¶å°±æ¯å©ç¨å±æ§æ件åå¨ç¨åºä¸çå符串èµæºãå®çå
容å¦ä¸æ示ï¼
#注éè¯å¥
å±æ§å=å±æ§å¼
读å
¥å±æ§æ件çä¸è¬æ¹æ³æ¯ï¼
[java] view plaincopy
FileInputStream ios=new FileInputStream(âå±æ§æ件åâ);
Properties prop=new Properties();
prop.load(ios);
String value=prop.getProperty(âå±æ§åâ);
ios.close();
å©ç¨java.io.Propertiesçloadæ¹æ³è¯»å
¥å±æ§æ件è½ç¶æ¹ä¾¿ï¼ä½å¦æå±æ§æ件ä¸æä¸æï¼å¨è¯»å
¥ä¹åå°±ä¼åç°åºç°ä¹±ç ç°è±¡ãåçè¿ä¸ªåå æ¯loadæ¹æ³ä½¿ç¨åèæµè¯»å
¥ææ¬ï¼å¨è¯»å
¥åéè¦å°åèæµç¼ç æ为å符串ï¼èå®ä½¿ç¨çç¼ç æ¯âiso-8859-1â,è¿ä¸ªå符éæ¯ASCIIç å符éï¼ä¸æ¯æä¸æç¼ç ï¼
æ¹æ³ä¸ï¼ä½¿ç¨æ¾å¼ç转ç ï¼
[java] view plaincopy
String value=prop.getProperty(âå±æ§åâ);
String encValue=new String(value.getBytes(âiso-8859-1â³),âå±æ§æ件çå®é
ç¼ç â);
æ¹æ³äºï¼è±¡è¿ç§å±æ§æ件æ¯é¡¹ç®å
é¨çï¼æ们å¯ä»¥æ§å¶å±æ§æ件çç¼ç æ ¼å¼ï¼æ¯å¦çº¦å®éç¨Windowså
å®çGBKï¼å°±ç´æ¥å©ç¨âgbkâæ¥è½¬ç ï¼ å¦æ约å®éç¨UTF-8ï¼å°±ä½¿ç¨âUTF-8â³ç´æ¥è½¬ç ã
æ¹æ³ä¸ï¼å¦ææ³çµæ´»ä¸äºï¼åå°èªå¨æ¢æµç¼ç ï¼å°±å¯å©ç¨ä¸é¢ä»ç»çæ¹æ³æµå®å±æ§æ件çç¼ç ï¼ä»èæ¹ä¾¿å¼å人åçå·¥ä½
è¡¥å
ï¼å¯ä»¥ç¨ä¸é¢ä»£ç è·å¾Javaæ¯æç¼ç éåï¼
Charset.availableCharsets().keySet();
å¯ä»¥ç¨ä¸é¢ç代ç è·å¾ç³»ç»é»è®¤ç¼ç ï¼
Charset.defaultCharset();