Coverage Report

Coverage Report - net.sf.jabref.imports.ScienceDirectFetcher

Classes in this File

Line Coverage

Branch Coverage

Complexity

ScienceDirectFetcher

0/57

0/18

2.889

 package net.sf.jabref.imports;
 
 import net.sf.jabref.BibtexEntry;
 import net.sf.jabref.GUIGlobals;
 import net.sf.jabref.Globals;
 import net.sf.jabref.OutputPrinter;
 import net.sf.jabref.net.URLDownload;
 
 import javax.swing.*;
 import java.io.IOException;
 import java.io.UnsupportedEncodingException;
 import java.net.URL;
 import java.net.URLEncoder;
 import java.util.ArrayList;
 import java.util.List;
 import java.util.regex.Matcher;
 import java.util.regex.Pattern;
 
 
 public class ScienceDirectFetcher implements EntryFetcher {
 
     protected static int MAX_PAGES_TO_LOAD = 8;
     protected static final String WEBSITE_URL = "http://www.sciencedirect.com";
     protected static final String SEARCH_URL = WEBSITE_URL +"/science/quicksearch?query=";
 
     protected static final String linkPrefix = "http://www.sciencedirect.com/science?_ob=ArticleURL&" ;
     protected static final Pattern linkPattern = Pattern.compile(
             "<a href=\""+
             linkPrefix.replaceAll("\\?", "\\\\?")+
             "([^\"]+)\"\"");
 
     protected static final Pattern nextPagePattern = Pattern.compile(
             "<a href=\"(.*)\">Next &gt;");
 
 
     protected boolean stopFetching = false;
     protected boolean noAccessFound = false;
 
     public String getHelpPage() {
         return "ScienceDirect.html";
     }
 
     public URL getIcon() {
         return GUIGlobals.getIconUrl("www");
     }
 
     public String getKeyName() {
         return "Search ScienceDirect";
     }
 
     public JPanel getOptionsPanel() {
         // No Options panel
         return null;
     }
 
     public String getTitle() {
         return Globals.menuTitle("Search ScienceDirect");
     }
 
     public void stopFetching() {
         stopFetching = true;
         noAccessFound = false;
     }
 
     public boolean processQuery(String query, ImportInspector dialog, OutputPrinter status) {
         stopFetching = false;
         try {
             List<String> citations = getCitations(query);
             if (citations == null)
                 return false;
             if (citations.size() == 0){
                 status.showMessage(Globals.lang("No entries found for the search string '%0'",
                     query),
                     Globals.lang("Search ScienceDirect"), JOptionPane.INFORMATION_MESSAGE);
                 return false;
             }
 
             int i=0;
             for (String cit : citations) {
                 if (stopFetching)
                     break;
                 BibtexEntry entry = BibsonomyScraper.getEntry(cit);
                 if (entry != null)
                     dialog.addEntry(entry);
                 dialog.setProgress(++i, citations.size());
             }
 
             return true;
 
         } catch (IOException e) {
             e.printStackTrace();
             status.showMessage(Globals.lang("Error while fetching from ScienceDirect") + ": " + e.getMessage());
         }
         return false;
     }
 
     /**
      *
      * @param query
      *            The search term to query JStor for.
      * @return a list of IDs
      * @throws java.io.IOException
      */
     protected List<String> getCitations(String query) throws IOException {
         String urlQuery;
         ArrayList<String> ids = new ArrayList<String>();
         try {
             urlQuery = SEARCH_URL + URLEncoder.encode(query, "UTF-8");
             int count = 1;
             String nextPage = null;
             while (((nextPage = getCitationsFromUrl(urlQuery, ids)) != null)
                     && (count < MAX_PAGES_TO_LOAD)) {
                 urlQuery = nextPage;
                 count++;
             }
             return ids;
         } catch (UnsupportedEncodingException e) {
             throw new RuntimeException(e);
         }
     }
 
     protected String getCitationsFromUrl(String urlQuery, List<String> ids) throws IOException {
         URL url = new URL(urlQuery);
         URLDownload ud = new URLDownload(url);
         ud.download();
 
         String cont = ud.getStringContent();
         //String entirePage = cont;
         Matcher m = linkPattern.matcher(cont);
         if (m.find()) {
             while (m.find()) {
                 ids.add(linkPrefix+m.group(1));
                 cont = cont.substring(m.end());
                 m = linkPattern.matcher(cont);
             }
         }
 
         else {
             return null;
         }
         /*m = nextPagePattern.matcher(entirePage);
         if (m.find()) {
             String newQuery = WEBSITE_URL +m.group(1);
             return newQuery;
         }
         else*/
             return null;
     }
 
 
 }

1		package net.sf.jabref.imports;
2
3		import net.sf.jabref.BibtexEntry;
4		import net.sf.jabref.GUIGlobals;
5		import net.sf.jabref.Globals;
6		import net.sf.jabref.OutputPrinter;
7		import net.sf.jabref.net.URLDownload;
8
9		import javax.swing.*;
10		import java.io.IOException;
11		import java.io.UnsupportedEncodingException;
12		import java.net.URL;
13		import java.net.URLEncoder;
14		import java.util.ArrayList;
15		import java.util.List;
16		import java.util.regex.Matcher;
17		import java.util.regex.Pattern;
18
19
20	0	public class ScienceDirectFetcher implements EntryFetcher {
21
22	0	protected static int MAX_PAGES_TO_LOAD = 8;
23		protected static final String WEBSITE_URL = "http://www.sciencedirect.com";
24		protected static final String SEARCH_URL = WEBSITE_URL +"/science/quicksearch?query=";
25
26		protected static final String linkPrefix = "http://www.sciencedirect.com/science?_ob=ArticleURL&" ;
27	0	protected static final Pattern linkPattern = Pattern.compile(
28		"<a href=\""+
29		linkPrefix.replaceAll("\\?", "\\\\?")+
30		"([^\"]+)\"\"");
31
32	0	protected static final Pattern nextPagePattern = Pattern.compile(
33		"<a href=\"(.*)\">Next >");
34
35
36	0	protected boolean stopFetching = false;
37	0	protected boolean noAccessFound = false;
38
39		public String getHelpPage() {
40	0	return "ScienceDirect.html";
41		}
42
43		public URL getIcon() {
44	0	return GUIGlobals.getIconUrl("www");
45		}
46
47		public String getKeyName() {
48	0	return "Search ScienceDirect";
49		}
50
51		public JPanel getOptionsPanel() {
52		// No Options panel
53	0	return null;
54		}
55
56		public String getTitle() {
57	0	return Globals.menuTitle("Search ScienceDirect");
58		}
59
60		public void stopFetching() {
61	0	stopFetching = true;
62	0	noAccessFound = false;
63	0	}
64
65		public boolean processQuery(String query, ImportInspector dialog, OutputPrinter status) {
66	0	stopFetching = false;
67		try {
68	0	List<String> citations = getCitations(query);
69	0	if (citations == null)
70	0	return false;
71	0	if (citations.size() == 0){
72	0	status.showMessage(Globals.lang("No entries found for the search string '%0'",
73		query),
74		Globals.lang("Search ScienceDirect"), JOptionPane.INFORMATION_MESSAGE);
75	0	return false;
76		}
77
78	0	int i=0;
79	0	for (String cit : citations) {
80	0	if (stopFetching)
81	0	break;
82	0	BibtexEntry entry = BibsonomyScraper.getEntry(cit);
83	0	if (entry != null)
84	0	dialog.addEntry(entry);
85	0	dialog.setProgress(++i, citations.size());
86	0	}
87
88	0	return true;
89
90	0	} catch (IOException e) {
91	0	e.printStackTrace();
92	0	status.showMessage(Globals.lang("Error while fetching from ScienceDirect") + ": " + e.getMessage());
93		}
94	0	return false;
95		}
96
97		/**
98		*
99		* @param query
100		* The search term to query JStor for.
101		* @return a list of IDs
102		* @throws java.io.IOException
103		*/
104		protected List<String> getCitations(String query) throws IOException {
105		String urlQuery;
106	0	ArrayList<String> ids = new ArrayList<String>();
107		try {
108	0	urlQuery = SEARCH_URL + URLEncoder.encode(query, "UTF-8");
109	0	int count = 1;
110	0	String nextPage = null;
111		while (((nextPage = getCitationsFromUrl(urlQuery, ids)) != null)
112	0	&& (count < MAX_PAGES_TO_LOAD)) {
113	0	urlQuery = nextPage;
114	0	count++;
115		}
116	0	return ids;
117	0	} catch (UnsupportedEncodingException e) {
118	0	throw new RuntimeException(e);
119		}
120		}
121
122		protected String getCitationsFromUrl(String urlQuery, List<String> ids) throws IOException {
123	0	URL url = new URL(urlQuery);
124	0	URLDownload ud = new URLDownload(url);
125	0	ud.download();
126
127	0	String cont = ud.getStringContent();
128		//String entirePage = cont;
129	0	Matcher m = linkPattern.matcher(cont);
130	0	if (m.find()) {
131	0	while (m.find()) {
132	0	ids.add(linkPrefix+m.group(1));
133	0	cont = cont.substring(m.end());
134	0	m = linkPattern.matcher(cont);
135		}
136		}
137
138		else {
139	0	return null;
140		}
141		/*m = nextPagePattern.matcher(entirePage);
142		if (m.find()) {
143		String newQuery = WEBSITE_URL +m.group(1);
144		return newQuery;
145		}
146		else*/
147	0	return null;
148		}
149
150
151		}