/* Copyright (C) 2003-2011 JabRef contributors. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. This program is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details. You should have received a copy of the GNU General Public License along with this program; if not, write to the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA. */ package net.sf.jabref.external; import java.net.URL; import java.net.MalformedURLException; import java.io.*; /** * FullTextFinder implementation that attempts to find PDF url from a Sciencedirect article page. */ public class SpringerLinkPdfDownload implements FullTextFinder { private static final String BASE_URL = "http://www.springerlink.com"; private static final String CONTENT_BASE_URL = "http://www.springerlink.com/content/"; public SpringerLinkPdfDownload() { } public boolean supportsSite(URL url) { return url.getHost().toLowerCase().indexOf("www.springerlink.com") != -1; } public URL findFullTextURL(URL url) throws IOException { // If the url contains a 'id=' component, we will try to int idIndex = url.toString().indexOf("id="); if (idIndex > -1) { url = new URL(CONTENT_BASE_URL+url.toString().substring(idIndex+3)); } //System.out.println("URL NOW: "+url); String pageSource = FindFullText.loadPage(url); FindFullText.dumpToFile(pageSource, new File("page.html")); int index = pageSource.indexOf("PDF ("); if (index > -1) { String leading = pageSource.substring(0, index); String marker = "href="; index = leading.toLowerCase().lastIndexOf(marker); if ((index > -1) && (index+marker.length()+1 < leading.length())) { int endIndex = leading.indexOf("\"", index+marker.length()+1); try { URL pdfUrl = new URL(BASE_URL+leading.substring(index+marker.length()+1, endIndex)); System.out.println(pdfUrl.toString()); return pdfUrl; } catch (MalformedURLException e) { return null; } } return null; } else return null; } }