--- android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java 2010/07/13 20:14:59 991 +++ android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java 2010/07/14 08:05:31 992 @@ -1,16 +1,14 @@ package dk.thoerup.traininfoservice.banedk; +import java.net.URL; import java.util.Collections; -import java.util.List; import java.util.Map; import java.util.logging.Logger; -import com.gargoylesoftware.htmlunit.BrowserVersion; -import com.gargoylesoftware.htmlunit.WebClient; -import com.gargoylesoftware.htmlunit.html.DomNodeList; -import com.gargoylesoftware.htmlunit.html.HtmlElement; -import com.gargoylesoftware.htmlunit.html.HtmlPage; +import org.jsoup.nodes.Document; +import org.jsoup.nodes.Element; +import org.jsoup.select.Elements; import dk.thoerup.circuitbreaker.CircuitBreaker; import dk.thoerup.circuitbreaker.CircuitBreakerManager; @@ -106,11 +104,7 @@ public DepartureBean lookupDeparturesNormalSite(String stationcode, TrainType type, boolean arrival) throws Exception { DepartureBean departureBean = new DepartureBean(); - - final WebClient webClient = new WebClient( BrowserVersion.FIREFOX_3 ); - webClient.setTimeout(2500); - webClient.setJavaScriptEnabled(false); - + String typeString = getTypeString(type); String arrivalDeparture = (arrival==false) ? "Afgang" : "Ankomst"; @@ -118,26 +112,26 @@ //String uri = "http://www.bane.dk/visStation.asp?ArtikelID=4275&W=" + type + "&S=" + stationcode; String uri = "http://trafikinfo.bane.dk/Trafikinformation/AfgangAnkomst/" + arrivalDeparture + "/" + stationcode + "/" + typeString + "/UdvidetVisning"; - //logger.info("URI: " + uri); - HtmlunitInvocation wrapper = new HtmlunitInvocation(webClient, uri); + //logger.info("URI: " + uri); + JsoupInvocation wrapper = new JsoupInvocation( new URL(uri), 2500); CircuitBreaker breaker = CircuitBreakerManager.getManager().getCircuitBreaker("banedk"); - HtmlPage page = (HtmlPage) breaker.invoke(wrapper); + Document page = (Document) breaker.invoke(wrapper); String tableName = arrival == false ? "afgangtabel" : "ankomsttabel"; - HtmlElement table = page.getElementById(tableName); + Element table = page.getElementById(tableName); if (table != null) { - DomNodeList tableRows = table.getElementsByTagName("tr"); + Elements tableRows = table.getElementsByTag("tr"); - for (HtmlElement currentRow : tableRows) { - String rowClass = currentRow.getAttribute("class"); + for (Element currentRow : tableRows) { + String rowClass = currentRow.attr("class"); if (rowClass != null && rowClass.toLowerCase().contains("station") ) { - DomNodeList fields = currentRow.getElementsByTagName("td"); + Elements fields = currentRow.getElementsByTag("td"); DepartureEntry departure = new DepartureEntry(); - String time = fields.get(0).asText(); + String time = fields.get(0).text(); if (time.equals("")) time = "0:00"; //Bane.dk bug work-around departure.setTime(time); @@ -145,21 +139,21 @@ int updated = extractUpdated( fields.get(1) ); departure.setUpdated(updated); - String trainNumber = fields.get(2).asText(); + String trainNumber = fields.get(2).text(); if (type == TrainType.STOG) //If it is S-train we need to extract the trainNumber trainNumber = trainNumber + " " + extractTrainNumber(fields.get(2)); departure.setTrainNumber(trainNumber); - String destination = fields.get(3).asText(); + String destination = fields.get(3).text(); departure.setDestination(destination); - String origin = fields.get(4).asText(); + String origin = fields.get(4).text(); departure.setOrigin(origin); - String location = fields.get(5).asText(); + String location = fields.get(5).text(); departure.setLocation(location); - String status = fields.get(6).asText().trim(); + String status = fields.get(6).text().trim(); departure.setStatus(status); String note = extractNote( fields.get(7) ); @@ -174,23 +168,21 @@ logger.warning("No departures found for station=" + stationcode + ", type=" + type); } - HtmlElement notifDiv = page.getElementById("station_planlagte_text"); + Element notifDiv = page.getElementById("station_planlagte_text"); if (notifDiv != null) { - DomNodeList tables = notifDiv.getElementsByTagName("table"); - for (HtmlElement tab : tables) { + Elements tables = notifDiv.getElementsByTag("table"); + for (Element tab : tables) { - DomNodeList anchors = tab.getElementsByTagName("a"); + Elements anchors = tab.getElementsByTag("a"); if (anchors.size() == 2) { - departureBean.notifications.add( anchors.get(1).getTextContent() ); + departureBean.notifications.add( anchors.get(1).text() ); } } } - webClient.closeAllWindows(); - return departureBean; } @@ -263,11 +255,11 @@ }*/ - private int extractUpdated(HtmlElement updatedTd) { //extract the digit (in this case: 4) from "media/trafikinfo/opdater4.gif" + private int extractUpdated(Element updatedTd) { //extract the digit (in this case: 4) from "media/trafikinfo/opdater4.gif" int updated = -1; - DomNodeList updatedImgs = updatedTd.getElementsByTagName("img"); - String updatedStr = updatedImgs.get(0).getAttribute("src"); + Elements updatedImgs = updatedTd.getElementsByTag("img"); + String updatedStr = updatedImgs.get(0).attr("src"); if (updatedStr != null) { for (int i=0; i elems = noteTd.getElementsByAttribute("span", "class", "bemtype"); + Elements elems = noteTd.getElementsByClass("bemtype"); if (elems.size() > 0 && note.charAt(note.length()-1) == 'i') note = note.substring(0,note.length() -1 ); return note; } - private String extractTrainNumber(HtmlElement trainTd) { - HtmlElement anchorElement = trainTd.getElementsByTagName("a").get(0); - String href = anchorElement.getAttribute("href"); + private String extractTrainNumber(Element trainTd) { + Element anchorElement = trainTd.getElementsByTag("a").get(0); + String href = anchorElement.attr("href"); int pos = href.lastIndexOf('/'); String number = href.substring(pos+1);