/*! ****************************************************************************** * * Pentaho Data Integration * * Copyright (C) 2002-2016 by Pentaho : http://www.pentaho.com * ******************************************************************************* * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ******************************************************************************/ package org.pentaho.di.trans.steps.changefileencoding; import java.io.BufferedReader; import java.io.BufferedWriter; import java.io.FileInputStream; import java.io.FileOutputStream; import java.io.InputStreamReader; import java.io.OutputStreamWriter; import org.apache.commons.vfs2.FileType; import org.pentaho.di.core.ResultFile; import org.pentaho.di.core.exception.KettleException; import org.pentaho.di.core.util.Utils; import org.pentaho.di.core.vfs.KettleVFS; import org.pentaho.di.i18n.BaseMessages; import org.pentaho.di.trans.Trans; import org.pentaho.di.trans.TransMeta; import org.pentaho.di.trans.step.BaseStep; import org.pentaho.di.trans.step.StepDataInterface; import org.pentaho.di.trans.step.StepInterface; import org.pentaho.di.trans.step.StepMeta; import org.pentaho.di.trans.step.StepMetaInterface; /** * Change file encoding * * * @author Samatar * @since 03-Juin-2008 * */ public class ChangeFileEncoding extends BaseStep implements StepInterface { private static Class<?> PKG = ChangeFileEncoding.class; // for i18n purposes, needed by Translator2!! private ChangeFileEncodingMeta meta; private ChangeFileEncodingData data; public ChangeFileEncoding( StepMeta stepMeta, StepDataInterface stepDataInterface, int copyNr, TransMeta transMeta, Trans trans ) { super( stepMeta, stepDataInterface, copyNr, transMeta, trans ); } public boolean processRow( StepMetaInterface smi, StepDataInterface sdi ) throws KettleException { meta = (ChangeFileEncodingMeta) smi; data = (ChangeFileEncodingData) sdi; Object[] outputRow = getRow(); // Get row from input rowset & set row busy! if ( outputRow == null ) { // no more input to be expected... setOutputDone(); return false; } if ( first ) { first = false; // get the RowMeta data.inputRowMeta = getInputRowMeta().clone(); // Check is source filename field is provided if ( Utils.isEmpty( meta.getDynamicFilenameField() ) ) { logError( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.FilenameFieldMissing" ) ); throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.FilenameFieldMissing" ) ); } // Check is target filename field is provided if ( Utils.isEmpty( meta.getTargetFilenameField() ) ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.TargetFilenameFieldMissing" ) ); } // cache the position of the field data.indexOfFileename = data.inputRowMeta.indexOfValue( meta.getDynamicFilenameField() ); if ( data.indexOfFileename < 0 ) { // The field is unreachable ! logError( BaseMessages.getString( PKG, "ChangeFileEncoding.Exception.CouldnotFindField" ) + "[" + meta.getDynamicFilenameField() + "]" ); throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Exception.CouldnotFindField", meta.getDynamicFilenameField() ) ); } // cache the position of the field data.indexOfTargetFileename = data.inputRowMeta.indexOfValue( meta.getTargetFilenameField() ); if ( data.indexOfTargetFileename < 0 ) { // The field is unreachable ! logError( BaseMessages.getString( PKG, "ChangeFileEncoding.Exception.CouldnotFindField" ) + "[" + meta.getTargetFilenameField() + "]" ); throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Exception.CouldnotFindField", meta.getTargetFilenameField() ) ); } // Check source encoding data.sourceEncoding = environmentSubstitute( meta.getSourceEncoding() ); // if(Utils.isEmpty(data.sourceEncoding)) { // throw new KettleException(BaseMessages.getString(PKG, "ChangeFileEncoding.Exception.SourceEncodingEmpty")); // } // Check target encoding data.targetEncoding = environmentSubstitute( meta.getTargetEncoding() ); if ( Utils.isEmpty( data.targetEncoding ) ) { throw new KettleException( BaseMessages .getString( PKG, "ChangeFileEncoding.Exception.TargetEncodingEmpty" ) ); } // End If first } try { // get source filename String sourceFilename = data.inputRowMeta.getString( outputRow, data.indexOfFileename ); if ( Utils.isEmpty( sourceFilename ) ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.SourceFileIsEmpty", meta .getDynamicFilenameField() ) ); } // get target filename String targetFilename = data.inputRowMeta.getString( outputRow, data.indexOfTargetFileename ); if ( Utils.isEmpty( targetFilename ) ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.TargetFileIsEmpty", meta .getTargetFilenameField() ) ); } data.sourceFile = KettleVFS.getFileObject( sourceFilename ); // Check if source file exists if ( !data.sourceFile.exists() ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.SourceFileNotExists", sourceFilename ) ); } // Check if source file is a file if ( data.sourceFile.getType() != FileType.FILE ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.SourceFileNotAFile", sourceFilename ) ); } // create directory only if not exists if ( !data.sourceFile.getParent().exists() ) { if ( meta.isCreateParentFolder() ) { data.sourceFile.getParent().createFolder(); } else { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.ParentFolderNotExist", data.sourceFile.getParent().toString() ) ); } } // Change file encoding changeEncoding( sourceFilename, targetFilename ); putRow( data.inputRowMeta, outputRow ); // copy row to output rowset(s); if ( isDetailed() ) { logDetailed( BaseMessages.getString( PKG, "ChangeFileEncoding.LineNumber", getLinesRead() + " : " + getInputRowMeta().getString( outputRow ) ) ); } } catch ( Exception e ) { boolean sendToErrorRow = false; String errorMessage = null; if ( getStepMeta().isDoingErrorHandling() ) { sendToErrorRow = true; errorMessage = e.toString(); } else { logError( BaseMessages.getString( PKG, "ChangeFileEncoding.ErrorInStepRunning" ) + e.getMessage() ); setErrors( 1 ); stopAll(); setOutputDone(); // signal end to receiver(s) return false; } if ( sendToErrorRow ) { // Simply add this row to the error row putError( getInputRowMeta(), outputRow, 1, errorMessage, meta.getDynamicFilenameField(), "ChangeFileEncoding001" ); } } return true; } private void changeEncoding( String sourceFilename, String targetFilename ) throws KettleException { BufferedWriter buffWriter = null; BufferedReader buffReader = null; try { buffWriter = new BufferedWriter( new OutputStreamWriter( new FileOutputStream( targetFilename, false ), data.targetEncoding ) ); if ( Utils.isEmpty( data.sourceEncoding ) ) { buffReader = new BufferedReader( new InputStreamReader( new FileInputStream( sourceFilename ) ) ); } else { buffReader = new BufferedReader( new InputStreamReader( new FileInputStream( sourceFilename ), data.sourceEncoding ) ); } char[] cBuf = new char[8192]; int readSize = 0; while ( ( readSize = buffReader.read( cBuf ) ) != -1 ) { buffWriter.write( cBuf, 0, readSize ); } // add filename to result filenames? if ( meta.addSourceResultFilenames() ) { // Add this to the result file names... ResultFile resultFile = new ResultFile( ResultFile.FILE_TYPE_GENERAL, data.sourceFile, getTransMeta().getName(), getStepname() ); resultFile.setComment( BaseMessages.getString( PKG, "ChangeFileEncoding.Log.FileAddedResult" ) ); addResultFile( resultFile ); if ( isDetailed() ) { logDetailed( BaseMessages.getString( PKG, "ChangeFileEncoding.Log.FilenameAddResult", data.sourceFile .toString() ) ); } } // add filename to result filenames? if ( meta.addTargetResultFilenames() ) { // Add this to the result file names... ResultFile resultFile = new ResultFile( ResultFile.FILE_TYPE_GENERAL, KettleVFS.getFileObject( targetFilename ), getTransMeta().getName(), getStepname() ); resultFile.setComment( BaseMessages.getString( PKG, "ChangeFileEncoding.Log.FileAddedResult" ) ); addResultFile( resultFile ); if ( isDetailed() ) { logDetailed( BaseMessages.getString( PKG, "ChangeFileEncoding.Log.FilenameAddResult", targetFilename ) ); } } } catch ( Exception e ) { throw new KettleException( BaseMessages.getString( PKG, "ChangeFileEncoding.Error.CreatingFile" ), e ); } finally { try { if ( buffWriter != null ) { buffWriter.flush(); buffWriter.close(); } if ( buffReader != null ) { buffReader.close(); } } catch ( Exception e ) { // Ignore } } } public boolean init( StepMetaInterface smi, StepDataInterface sdi ) { meta = (ChangeFileEncodingMeta) smi; data = (ChangeFileEncodingData) sdi; if ( super.init( smi, sdi ) ) { return true; } return false; } public void dispose( StepMetaInterface smi, StepDataInterface sdi ) { meta = (ChangeFileEncodingMeta) smi; data = (ChangeFileEncodingData) sdi; if ( data.sourceFile != null ) { try { data.sourceFile.close(); } catch ( Exception e ) { // ignore } } super.dispose( smi, sdi ); } }