/*
 * Copyright 2004-2011 H2 Group. Multiple-Licensed under the H2 License,
 * Version 1.0, and under the Eclipse Public License, Version 1.0
 * (http://h2database.com/html/license.html).
 * Initial Developer: H2 Group
 */
package org.h2.build.doc;

import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.Locale;
import org.h2.build.indexer.HtmlConverter;
import org.h2.store.fs.FileUtils;
import org.h2.util.IOUtils;
import org.h2.util.StringUtils;

/**
 * Converts a HTML or Unicode encoded file to UTF-8.
 * <p>
 * The input file is read as UTF-8 text, passed through
 * {@link HtmlConverter#convertHtmlToString(String)} and then through
 * {@link StringUtils#javaDecode(String)}, and the result is written to the
 * output file as UTF-8.
 */
public class FileConverter {

    /** The file to read; may be overridden with the <code>-in</code> option. */
    private String inFile = "~/temp/in.txt";

    /** The file to write; may be overridden with the <code>-out</code> option. */
    private String outFile = "~/temp/out.txt";

    /**
     * This method is called when executing this application from the command
     * line.
     *
     * @param args the command line parameters
     */
    public static void main(String... args) throws Exception {
        new FileConverter().run(args);
    }

    /**
     * Parses the command line options, prints the display name of the Korean
     * language (plain and Java-encoded), and then converts the file.
     * <p>
     * Recognized options are <code>-in &lt;file&gt;</code> and
     * <code>-out &lt;file&gt;</code>; any other argument is ignored.
     *
     * @param args the command line parameters
     * @throws IllegalArgumentException if an option is not followed by a value
     */
    private void run(String... args) throws Exception {
        for (int i = 0; i < args.length; i++) {
            if (args[i].equals("-in")) {
                inFile = optionValue(args, ++i);
            } else if (args[i].equals("-out")) {
                outFile = optionValue(args, ++i);
            }
        }
        String languageCode = Locale.KOREA.getLanguage();
        // the language name is displayed in its own locale
        Locale locale = new Locale(languageCode);
        String language = locale.getDisplayLanguage(locale);
        System.out.println(language);
        System.out.println(StringUtils.javaEncode(language));
        convert();
    }

    /**
     * Returns the value that follows an option on the command line.
     *
     * @param args the command line parameters
     * @param index the index at which the value is expected
     * @return the value at the given index
     * @throws IllegalArgumentException if there is no argument at that index
     */
    private static String optionValue(String[] args, int index) {
        if (index >= args.length) {
            // index - 1 is the option itself, which was the last argument
            throw new IllegalArgumentException(
                    "Missing value for option " + args[index - 1]);
        }
        return args[index];
    }

    /**
     * Reads the input file, decodes it, and writes the result to the output
     * file.
     *
     * @throws IOException if reading or writing fails
     */
    private void convert() throws IOException {
        InputStream in = FileUtils.newInputStream(inFile);
        byte[] bytes = IOUtils.readBytesAndClose(in, -1);
        String s = new String(bytes, "UTF-8");
        String s2 = HtmlConverter.convertHtmlToString(s);
        String s3 = StringUtils.javaDecode(s2);
        byte[] result = s3.getBytes("UTF-8");
        OutputStream out = FileUtils.newOutputStream(outFile, false);
        try {
            out.write(result);
        } finally {
            // close the stream even if the write fails, so the handle is not leaked
            out.close();
        }
    }

}