/*! ****************************************************************************** * * Pentaho Data Integration * * Copyright (C) 2002-2016 by Pentaho : http://www.pentaho.com * ******************************************************************************* * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ******************************************************************************/ package org.pentaho.di.trans.steps.rssinput; import java.util.List; import org.pentaho.di.core.CheckResult; import org.pentaho.di.core.CheckResultInterface; import org.pentaho.di.core.Const; import org.pentaho.di.core.util.Utils; import org.pentaho.di.core.database.DatabaseMeta; import org.pentaho.di.core.exception.KettleException; import org.pentaho.di.core.exception.KettleStepException; import org.pentaho.di.core.exception.KettleXMLException; import org.pentaho.di.core.row.RowMetaInterface; import org.pentaho.di.core.row.ValueMetaInterface; import org.pentaho.di.core.row.value.ValueMetaFactory; import org.pentaho.di.core.row.value.ValueMetaInteger; import org.pentaho.di.core.row.value.ValueMetaString; import org.pentaho.di.core.variables.VariableSpace; import org.pentaho.di.core.xml.XMLHandler; import org.pentaho.di.i18n.BaseMessages; import org.pentaho.di.repository.ObjectId; import org.pentaho.di.repository.Repository; import org.pentaho.di.trans.Trans; import org.pentaho.di.trans.TransMeta; import org.pentaho.di.trans.step.BaseStepMeta; import org.pentaho.di.trans.step.StepDataInterface; import org.pentaho.di.trans.step.StepInterface; import org.pentaho.di.trans.step.StepMeta; import org.pentaho.di.trans.step.StepMetaInterface; import org.pentaho.metastore.api.IMetaStore; import org.w3c.dom.Node; public class RssInputMeta extends BaseStepMeta implements StepMetaInterface { private static Class<?> PKG = RssInput.class; // for i18n purposes, needed by Translator2!! /** Flag indicating that a row number field should be included in the output */ private boolean includeRowNumber; /** The name of the field in the output containing the row number */ private String rowNumberField; /** Flag indicating that url field should be included in the output */ private boolean includeUrl; /** The name of the field in the output containing the url */ private String urlField; /** The maximum number or lines to read */ private long rowLimit; /** The fields to import... */ private RssInputField[] inputFields; /** The url **/ private String[] url; /** read rss from */ private String readfrom; /** if URL defined in a field? */ private boolean urlInField; /** URL field name */ private String urlFieldname; public RssInputMeta() { super(); // allocate BaseStepMeta } /** * @return Returns the input fields. */ public RssInputField[] getInputFields() { return inputFields; } /** * @param inputFields * The input fields to set. */ public void setInputFields( RssInputField[] inputFields ) { this.inputFields = inputFields; } /** * @return Returns the urlInField. */ public boolean urlInField() { return urlInField; } /** * @param inputFields * The urlInField to set. */ public void seturlInField( boolean urlInFieldin ) { this.urlInField = urlInFieldin; } /** * @return Returns the includeRowNumber. */ public boolean includeRowNumber() { return includeRowNumber; } public void setReadFrom( String readfrom ) { this.readfrom = readfrom; } public String getReadFrom() { return readfrom; } public String getRealReadFrom() { return getReadFrom(); } /** * @return Returns the includeUrl. */ public boolean includeUrl() { return includeUrl; } /** * @param includeRowNumber * The includeRowNumber to set. */ public void setIncludeRowNumber( boolean includeRowNumber ) { this.includeRowNumber = includeRowNumber; } /** * @param includeUrl * The includeUrl to set. */ public void setIncludeUrl( boolean includeUrl ) { this.includeUrl = includeUrl; } /** * @return Returns the rowLimit. */ public long getRowLimit() { return rowLimit; } /** * @param rowLimit * The rowLimit to set. */ public void setRowLimit( long rowLimit ) { this.rowLimit = rowLimit; } /** * @return Returns the rowNumberField. */ public String getRowNumberField() { return rowNumberField; } /** * @return Returns the urlField. */ public String geturlField() { return urlField; } /** * @param urlField * The urlField to set. */ public void seturlField( String urlField ) { this.urlField = urlField; } /** * @param urlFieldname * The urlFieldname to set. */ public void setUrlFieldname( String urlFieldname ) { this.urlFieldname = urlFieldname; } /** * @return Returns the urlFieldname. */ public String getUrlFieldname() { return urlFieldname; } /** * @param url * The url to set. */ public void setUrl( String[] url ) { this.url = url; } public String[] getUrl() { return url; } /** * @param rowNumberField * The rowNumberField to set. */ public void setRowNumberField( String rowNumberField ) { this.rowNumberField = rowNumberField; } public void loadXML( Node stepnode, List<DatabaseMeta> databases, IMetaStore metaStore ) throws KettleXMLException { readData( stepnode ); } public Object clone() { RssInputMeta retval = (RssInputMeta) super.clone(); int nrFields = inputFields.length; int nrUrl = url.length; retval.allocate( nrUrl, nrFields ); System.arraycopy( url, 0, retval.url, 0, nrUrl ); for ( int i = 0; i < nrFields; i++ ) { if ( inputFields[i] != null ) { retval.inputFields[i] = (RssInputField) inputFields[i].clone(); } } return retval; } public String getXML() { StringBuilder retval = new StringBuilder(); retval.append( " " + XMLHandler.addTagValue( "url_in_field", urlInField ) ); retval.append( " " + XMLHandler.addTagValue( "url_field_name", urlFieldname ) ); retval.append( " " + XMLHandler.addTagValue( "rownum", includeRowNumber ) ); retval.append( " " + XMLHandler.addTagValue( "rownum_field", rowNumberField ) ); retval.append( " " + XMLHandler.addTagValue( "include_url", includeUrl ) ); retval.append( " " + XMLHandler.addTagValue( "url_Field", urlField ) ); retval.append( " " + XMLHandler.addTagValue( "read_from", readfrom ) ); retval.append( " <urls>" + Const.CR ); for ( int i = 0; i < url.length; i++ ) { retval.append( " " + XMLHandler.addTagValue( "url", url[i] ) ); } retval.append( " </urls>" + Const.CR ); retval.append( " <fields>" + Const.CR ); for ( int i = 0; i < inputFields.length; i++ ) { RssInputField field = inputFields[i]; retval.append( field.getXML() ); } retval.append( " </fields>" + Const.CR ); retval.append( " " + XMLHandler.addTagValue( "limit", rowLimit ) ); return retval.toString(); } private void readData( Node stepnode ) throws KettleXMLException { try { urlInField = "Y".equalsIgnoreCase( XMLHandler.getTagValue( stepnode, "url_in_field" ) ); urlFieldname = XMLHandler.getTagValue( stepnode, "url_field_name" ); includeRowNumber = "Y".equalsIgnoreCase( XMLHandler.getTagValue( stepnode, "rownum" ) ); rowNumberField = XMLHandler.getTagValue( stepnode, "rownum_field" ); includeUrl = "Y".equalsIgnoreCase( XMLHandler.getTagValue( stepnode, "include_url" ) ); urlField = XMLHandler.getTagValue( stepnode, "url_Field" ); readfrom = XMLHandler.getTagValue( stepnode, "read_from" ); Node fields = XMLHandler.getSubNode( stepnode, "fields" ); int nrFields = XMLHandler.countNodes( fields, "field" ); Node urlnode = XMLHandler.getSubNode( stepnode, "urls" ); int nrUrls = XMLHandler.countNodes( urlnode, "url" ); allocate( nrUrls, nrFields ); for ( int i = 0; i < nrUrls; i++ ) { Node urlnamenode = XMLHandler.getSubNodeByNr( urlnode, "url", i ); url[i] = XMLHandler.getNodeValue( urlnamenode ); } for ( int i = 0; i < nrFields; i++ ) { Node fnode = XMLHandler.getSubNodeByNr( fields, "field", i ); RssInputField field = new RssInputField( fnode ); inputFields[i] = field; } // Is there a limit on the number of rows we process? rowLimit = Const.toLong( XMLHandler.getTagValue( stepnode, "limit" ), 0L ); } catch ( Exception e ) { throw new KettleXMLException( "Unable to load step info from XML", e ); } } public void allocate( int nrUrl, int nrfields ) { inputFields = new RssInputField[nrfields]; url = new String[nrUrl]; } public void setDefault() { urlInField = false; urlFieldname = ""; includeRowNumber = false; rowNumberField = ""; includeUrl = false; urlField = ""; readfrom = ""; int nrFields = 0; int nrUrl = 0; allocate( nrUrl, nrFields ); for ( int i = 0; i < nrUrl; i++ ) { url[i] = ""; } for ( int i = 0; i < nrFields; i++ ) { inputFields[i] = new RssInputField( "field" + ( i + 1 ) ); } rowLimit = 0; } public void getFields( RowMetaInterface r, String name, RowMetaInterface[] info, StepMeta nextStep, VariableSpace space, Repository repository, IMetaStore metaStore ) throws KettleStepException { int i; for ( i = 0; i < inputFields.length; i++ ) { RssInputField field = inputFields[i]; int type = field.getType(); if ( type == ValueMetaInterface.TYPE_NONE ) { type = ValueMetaInterface.TYPE_STRING; } try { ValueMetaInterface v = ValueMetaFactory.createValueMeta( space.environmentSubstitute( field.getName() ), type ); v.setLength( field.getLength(), field.getPrecision() ); v.setOrigin( name ); r.addValueMeta( v ); } catch ( Exception e ) { throw new KettleStepException( e ); } } if ( includeUrl ) { ValueMetaInterface v = new ValueMetaString( space.environmentSubstitute( urlField ) ); v.setLength( 100, -1 ); v.setOrigin( name ); r.addValueMeta( v ); } if ( includeRowNumber ) { ValueMetaInterface v = new ValueMetaInteger( space.environmentSubstitute( rowNumberField ) ); v.setLength( ValueMetaInterface.DEFAULT_INTEGER_LENGTH, 0 ); v.setOrigin( name ); r.addValueMeta( v ); } } public void readRep( Repository rep, IMetaStore metaStore, ObjectId id_step, List<DatabaseMeta> databases ) throws KettleException { try { urlInField = rep.getStepAttributeBoolean( id_step, "url_in_field" ); urlFieldname = rep.getStepAttributeString( id_step, "url_field_name" ); includeRowNumber = rep.getStepAttributeBoolean( id_step, "rownum" ); rowNumberField = rep.getStepAttributeString( id_step, "rownum_field" ); includeUrl = rep.getStepAttributeBoolean( id_step, "include_url" ); urlField = rep.getStepAttributeString( id_step, "url_Field" ); readfrom = rep.getStepAttributeString( id_step, "read_from" ); rowLimit = rep.getStepAttributeInteger( id_step, "limit" ); int nrFields = rep.countNrStepAttributes( id_step, "field_name" ); int nrUrls = rep.countNrStepAttributes( id_step, "url_name" ); allocate( nrUrls, nrFields ); for ( int i = 0; i < nrUrls; i++ ) { url[i] = rep.getStepAttributeString( id_step, i, "url_name" ); } for ( int i = 0; i < nrFields; i++ ) { RssInputField field = new RssInputField(); field.setName( rep.getStepAttributeString( id_step, i, "field_name" ) ); field .setColumn( RssInputField.getColumnByCode( rep.getStepAttributeString( id_step, i, "field_column" ) ) ); field.setType( ValueMetaFactory.getIdForValueMeta( rep.getStepAttributeString( id_step, i, "field_type" ) ) ); field.setFormat( rep.getStepAttributeString( id_step, i, "field_format" ) ); field.setCurrencySymbol( rep.getStepAttributeString( id_step, i, "field_currency" ) ); field.setDecimalSymbol( rep.getStepAttributeString( id_step, i, "field_decimal" ) ); field.setGroupSymbol( rep.getStepAttributeString( id_step, i, "field_group" ) ); field.setLength( (int) rep.getStepAttributeInteger( id_step, i, "field_length" ) ); field.setPrecision( (int) rep.getStepAttributeInteger( id_step, i, "field_precision" ) ); field.setTrimType( RssInputField.getTrimTypeByCode( rep.getStepAttributeString( id_step, i, "field_trim_type" ) ) ); field.setRepeated( rep.getStepAttributeBoolean( id_step, i, "field_repeat" ) ); inputFields[i] = field; } } catch ( Exception e ) { throw new KettleException( BaseMessages.getString( PKG, "RssInputMeta.Exception.ErrorReadingRepository" ), e ); } } public void saveRep( Repository rep, IMetaStore metaStore, ObjectId id_transformation, ObjectId id_step ) throws KettleException { try { rep.saveStepAttribute( id_transformation, id_step, "url_in_field", urlInField ); rep.saveStepAttribute( id_transformation, id_step, "url_field_name", urlFieldname ); rep.saveStepAttribute( id_transformation, id_step, "rownum", includeRowNumber ); rep.saveStepAttribute( id_transformation, id_step, "rownum_field", rowNumberField ); rep.saveStepAttribute( id_transformation, id_step, "include_url", includeUrl ); rep.saveStepAttribute( id_transformation, id_step, "url_Field", urlField ); rep.saveStepAttribute( id_transformation, id_step, "read_from", readfrom ); rep.saveStepAttribute( id_transformation, id_step, "limit", rowLimit ); for ( int i = 0; i < url.length; i++ ) { rep.saveStepAttribute( id_transformation, id_step, i, "url_name", url[i] ); } for ( int i = 0; i < inputFields.length; i++ ) { RssInputField field = inputFields[i]; rep.saveStepAttribute( id_transformation, id_step, i, "field_name", field.getName() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_column", field.getColumnCode() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_type", field.getTypeDesc() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_format", field.getFormat() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_currency", field.getCurrencySymbol() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_decimal", field.getDecimalSymbol() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_group", field.getGroupSymbol() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_length", field.getLength() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_precision", field.getPrecision() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_trim_type", field.getTrimTypeCode() ); rep.saveStepAttribute( id_transformation, id_step, i, "field_repeat", field.isRepeated() ); } } catch ( Exception e ) { throw new KettleException( BaseMessages.getString( PKG, "RssInputMeta.Exception.ErrorSavingToRepository", "" + id_step ), e ); } } public StepDataInterface getStepData() { return new RssInputData(); } public boolean supportsErrorHandling() { return true; } public void check( List<CheckResultInterface> remarks, TransMeta transMeta, StepMeta stepMeta, RowMetaInterface prev, String[] input, String[] output, RowMetaInterface info, VariableSpace space, Repository repository, IMetaStore metaStore ) { CheckResult cr; if ( urlInField ) { if ( Utils.isEmpty( getUrlFieldname() ) ) { cr = new CheckResult( CheckResult.TYPE_RESULT_ERROR, BaseMessages.getString( PKG, "RssInputMeta.CheckResult.NoField" ), stepMeta ); remarks.add( cr ); } else { cr = new CheckResult( CheckResult.TYPE_RESULT_OK, BaseMessages.getString( PKG, "RssInputMeta.CheckResult.FieldOk" ), stepMeta ); remarks.add( cr ); } } else { if ( getUrl() == null || getUrl().length == 0 ) { cr = new CheckResult( CheckResult.TYPE_RESULT_ERROR, BaseMessages.getString( PKG, "RssInputMeta.CheckResult.NoUrl" ), stepMeta ); remarks.add( cr ); } else { cr = new CheckResult( CheckResult.TYPE_RESULT_OK, BaseMessages.getString( PKG, "RssInputMeta.CheckResult.UrlOk", "" + getUrl().length ), stepMeta ); remarks.add( cr ); } } } public StepInterface getStep( StepMeta stepMeta, StepDataInterface stepDataInterface, int cnr, TransMeta tr, Trans trans ) { return new RssInput( stepMeta, stepDataInterface, cnr, tr, trans ); } }