/*******************************************************************************
* Copyright 2014 University of Southern California
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* This code was developed by the Information Integration Group as part
* of the Karma project at the Information Sciences Institute of the
* University of Southern California. For more information, publications,
* and related projects, please see: http://www.isi.edu/integration
******************************************************************************/
package edu.isi.karma.kr2rml.mapping;
import java.util.HashMap;
import java.util.Map;
import org.json.JSONArray;
import org.json.JSONException;
import org.json.JSONObject;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import edu.isi.karma.kr2rml.exception.HNodeNotFoundKarmaException;
import edu.isi.karma.rep.HNode;
import edu.isi.karma.rep.HTable;
import edu.isi.karma.rep.RepFactory;
import edu.isi.karma.rep.Worksheet;
public class KR2RMLMappingColumnNameHNodeTranslator {
private static Logger logger = LoggerFactory.getLogger(KR2RMLMappingColumnNameHNodeTranslator.class);
private RepFactory factory;
private Worksheet worksheet;
private Map<String, String> hNodeIdToColumnName = new HashMap<>();
private Map<String, String> columnNameToHNodeId = new HashMap<>();
public KR2RMLMappingColumnNameHNodeTranslator(RepFactory factory, Worksheet worksheet)
{
this.factory = factory;
this.worksheet = worksheet;
this.populateHNodeIdAndColumnNameMaps();
}
public String getColumnNameForHNodeId(String hNodeId)
{
if(!this.hNodeIdToColumnName.containsKey(hNodeId))
{
String columnName = translateHNodeIdToColumnName(hNodeId);
if(null != columnName)
{
hNodeIdToColumnName.put(hNodeId, columnName);
columnNameToHNodeId.put(columnName, hNodeId);
}
}
return hNodeIdToColumnName.get(hNodeId);
}
public String translateHNodeIdToColumnName(String hNodeId)
{
HNode hNode = factory.getHNode(hNodeId);
String colNameStr = "";
try {
JSONArray colNameArr = hNode.getJSONArrayRepresentation(factory);
if (colNameArr.length() == 1) {
colNameStr = (String)
(((JSONObject)colNameArr.get(0)).get("columnName"));
} else {
JSONArray colNames = new JSONArray();
for (int i=0; i<colNameArr.length();i++) {
colNames.put((String)
(((JSONObject)colNameArr.get(i)).get("columnName")));
}
colNameStr = colNames.toString();
}
return colNameStr;
} catch (JSONException e) {
logger.debug("unable to find hnodeid to column name mapping for hnode: " + hNode.getId() + " " + hNode.getColumnName(), e);
}
return null;
}
public void populateHNodeIdAndColumnNameMaps()
{
HTable hTable = worksheet.getHeaders();
populateHNodeIdAndColumnNameMapsForHTable(hTable);
}
private void populateHNodeIdAndColumnNameMapsForHTable(HTable hTable) {
for(HNode hNode : hTable.getHNodes())
{
if(hNode.hasNestedTable())
{
populateHNodeIdAndColumnNameMapsForHTable(hNode.getNestedTable());
}
else
{
String hNodeId = hNode.getId();
String columnName = translateHNodeIdToColumnName(hNodeId);
columnNameToHNodeId.put(columnName, hNodeId);
hNodeIdToColumnName.put(hNodeId, columnName);
}
}
}
public String getHNodeIdForColumnName(String templateTermValue) throws HNodeNotFoundKarmaException {
if(!this.columnNameToHNodeId.containsKey(templateTermValue))
{
try {
String hNodeId = translateColumnNameToHNodeId(templateTermValue);
columnNameToHNodeId.put(templateTermValue, hNodeId);
hNodeIdToColumnName.put(hNodeId, templateTermValue);
} catch (JSONException e) {
throw new HNodeNotFoundKarmaException("Unable to find HNodeId for column name", templateTermValue);
}
}
return this.columnNameToHNodeId.get(templateTermValue);
}
private String translateColumnNameToHNodeId(String colTermVal) throws JSONException
{
HTable hTable = worksheet.getHeaders();
// If hierarchical columns
if (colTermVal.startsWith("[") && colTermVal.endsWith("]") && colTermVal.contains(",")) {
JSONArray strArr = new JSONArray(colTermVal);
for (int i=0; i<strArr.length(); i++) {
String cName = (String) strArr.get(i);
logger.debug("Column being normalized: "+ cName);
if(hTable == null) {
logger.error("Error retrieving column: " + cName);
return null;
}
HNode hNode = hTable.getHNodeFromColumnName(cName);
if(hNode == null) {
logger.error("Error retrieving column: " + cName);
return null;
}
if (i == strArr.length()-1) { // Found!
return hNode.getId();
} else {
hTable = hNode.getNestedTable();
}
}
} else {
HNode hNode = hTable.getHNodeFromColumnName(colTermVal);
if(hNode == null) {
logger.error("Error retrieving column: " + colTermVal);
return null;
}
logger.debug("Column" +colTermVal);
return hNode.getId();
}
return null;
}
}