* adapt tv.com scraper to site changes

2009-07-25 13:36:29 +00:00 · 2009-07-25 13:36:29 +00:00 · 57df9b1fbc
parent afbc49369a
commit 57df9b1fbc
2 changed files with 5 additions and 7 deletions
--- a/source/net/sourceforge/filebot/web/TVDotComClient.java
+++ b/source/net/sourceforge/filebot/web/TVDotComClient.java
@@ -62,16 +62,14 @@ public class TVDotComClient implements EpisodeListProvider {
 		
 		Document dom = getHtmlDocument(searchUrl);
 		
-		List<Node> nodes = selectNodes("//*[@class='title']//descendant-or-self::A", dom);
+		List<SearchResult> searchResults = new ArrayList<SearchResult>();
 		
-		List<SearchResult> searchResults = new ArrayList<SearchResult>(nodes.size());
-		
-		for (Node node : nodes) {
+		for (Node node : selectNodes("//H2/A", dom)) {
 			String title = getTextContent(node);
 			String href = getAttribute("href", node);
 			
 			try {
-				URL episodeGuideLocation = new URL(href.replaceAll("summary\\.html\\?.*", "episode.html"));
+				URL episodeGuideLocation = new URL(href.replaceAll("summary[.]html[?].*", "episode.html"));
 				searchResults.add(new HyperLink(title, episodeGuideLocation));
 			} catch (MalformedURLException e) {
 				Logger.getLogger(getClass().getName()).log(Level.WARNING, "Invalid href: " + href, e);
--- a/test/net/sourceforge/filebot/web/TVDotComClientTest.java
+++ b/test/net/sourceforge/filebot/web/TVDotComClientTest.java
@@ -26,10 +26,10 @@ public class TVDotComClientTest {

 	@Test
 	public void search() throws Exception {
-		List<SearchResult> results = tvdotcom.search("Buffy");
+		List<SearchResult> results = tvdotcom.search("buffy the vampire slayer");
 		
 		// if this fails, there is probably a problem with the xpath query
-		assertEquals(10, results.size());
+		assertEquals(4, results.size());
 		
 		HyperLink result = (HyperLink) results.get(0);