--- android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java 2009/09/10 18:13:52 308 +++ android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java 2010/09/14 05:33:30 1046 @@ -1,115 +1,325 @@ package dk.thoerup.traininfoservice.banedk; -import java.sql.Connection; -import java.sql.ResultSet; -import java.sql.Statement; -import java.util.ArrayList; + +import java.net.URL; +import java.net.URLEncoder; import java.util.Collections; -import java.util.List; +import java.util.Map; +import java.util.logging.Logger; -import com.gargoylesoftware.htmlunit.WebClient; -import com.gargoylesoftware.htmlunit.html.DomNodeList; -import com.gargoylesoftware.htmlunit.html.HtmlElement; -import com.gargoylesoftware.htmlunit.html.HtmlPage; +import org.jsoup.nodes.Document; +import org.jsoup.nodes.Element; +import org.jsoup.select.Elements; -import dk.thoerup.traininfoservice.DBConnection; +import dk.thoerup.circuitbreaker.CircuitBreaker; +import dk.thoerup.circuitbreaker.CircuitBreakerManager; +import dk.thoerup.traininfoservice.StationBean; +import dk.thoerup.traininfoservice.StationDAO; +import dk.thoerup.traininfoservice.Statistics; public class DepartureFetcher { + + enum TrainType{ + STOG, + REGIONAL + } + + Logger logger = Logger.getLogger(DepartureFetcher.class.getName()); + + Map cache; + + StationDAO stationDao = new StationDAO(); + + private boolean useAzureSite; + private int replyTimeout; + + public DepartureFetcher(boolean azureSite, int cacheTimeout, int replyTimeout) { + this.replyTimeout = replyTimeout; + useAzureSite = azureSite; + cache = new TimeoutMap(cacheTimeout); + } + + + + + public DepartureBean cachedLookupDepartures(int stationID, boolean arrival) throws Exception { + final String key = "" + stationID + ":" + arrival; + DepartureBean departureBean = cache.get(key); - public List lookupDepartures(int stationID) throws Exception { - List departureList = new ArrayList(); - Connection conn = null; - try - { - conn = DBConnection.getConnection(); - - String SQL = "SELECT stationcode_fjrn, stationcode_stog FROM trainstations WHERE id=" + stationID; - Statement stmt = conn.createStatement(); - ResultSet rs = stmt.executeQuery(SQL); - - if (rs.next()) { - String code = rs.getString( 1 ); - if (! rs.wasNull() ) { - List list = lookupDepartures(code, "FJRN"); - departureList.addAll(list); - } - - code = rs.getString(2); - if (! rs.wasNull() ) { - List list = lookupDepartures(code, "S2"); - departureList.addAll(list); - } - Collections.sort( departureList ); - - } - - } finally { - if (conn != null && !conn.isClosed() ) { - conn.close(); - } + if (departureBean == null) { + departureBean = lookupDepartures(stationID,arrival); + cache.put(key, departureBean); + } else { + Statistics.getInstance().incrementDepartureCacheHits(); + logger.info("Departure: Cache hit " + key); //remove before production + } + return departureBean; + } + + + public DepartureBean lookupDepartures(int stationID, boolean arrival) throws Exception { + + DepartureBean departureBean = new DepartureBean(); + + StationBean station = stationDao.getById(stationID); + + departureBean.stationName = station.getName(); + + if (station.getRegional() != null) { + DepartureBean tempBean = lookupDepartures(station.getRegional(), TrainType.REGIONAL, arrival); + departureBean.departureEntries.addAll( tempBean.departureEntries ); + departureBean.notifications.addAll(tempBean.notifications); + } + + if (station.getStrain() != null) { + DepartureBean tempBean = lookupDepartures(station.getStrain(), TrainType.STOG, arrival); + departureBean.departureEntries.addAll( tempBean.departureEntries ); + departureBean.notifications.addAll(tempBean.notifications); + } + + if (departureBean.departureEntries.size() == 0) { + logger.info("No departures found for station " + stationID); } - return departureList; + Collections.sort( departureBean.departureEntries ); + + + return departureBean; } - public List lookupDepartures(String stationcode, String type) throws Exception { - - List departureList = new ArrayList(); + public DepartureBean lookupDepartures(String stationcode, TrainType type, boolean arrival) throws Exception { + if (useAzureSite == true) { + return lookupDeparturesAzureSite(stationcode, type, arrival); + } else { + return lookupDeparturesWwwSite(stationcode, type, arrival); + } + } + + private String getTypeStringAzure(TrainType type) { + switch (type) { + case STOG: + return "S-Tog"; + case REGIONAL: + return "Fjerntog"; + default: + return ""; //Can not happen + } + } + + private String getTypeStringWww(TrainType type) { + switch (type) { + case STOG: + return "S2"; + case REGIONAL: + return "FJRN"; + default: + return ""; //Can not happen + } + } + + public DepartureBean lookupDeparturesAzureSite(String stationcode, TrainType type, boolean arrival) throws Exception { - final WebClient webClient = new WebClient(); - webClient.setTimeout(1000); - webClient.setJavaScriptEnabled(false); - - final HtmlPage page = webClient.getPage("http://www.bane.dk/visStation.asp?ArtikelID=4275&W=" + type + "&S=" + stationcode); - - HtmlElement table = page.getElementById("afgangtabel"); - DomNodeList tableRows = table.getElementsByTagName("tr"); - - for (HtmlElement currentRow : tableRows) { - String rowClass = currentRow.getAttribute("class"); - if (rowClass != null && rowClass.toLowerCase().contains("station") ) { - DomNodeList fields = currentRow.getElementsByTagName("td"); - - DepartureBean departure = new DepartureBean(); - - String time = fields.get(0).asText(); - departure.setTime(time); - - int updated = extractUpdated( fields.get(1) ); - departure.setUpdated(updated); - - String trainNumber = fields.get(2).asText(); - departure.setTrainNumber(trainNumber); - - String destination = fields.get(3).asText(); - departure.setDestination(destination); - - String origin = fields.get(4).asText(); - departure.setOrigin(origin); - - String location = fields.get(5).asText(); - departure.setLocation(location); - - String status = fields.get(6).asText(); - departure.setStatus(status); - - String note = fields.get(7).asText(); - departure.setNote(note); - - departureList.add(departure); + DepartureBean departureBean = new DepartureBean(); + + + String typeString = getTypeStringAzure(type); + String arrivalDeparture = (arrival==false) ? "Afgang" : "Ankomst"; + + stationcode = URLEncoder.encode(stationcode,"ISO-8859-1"); + + String uri = "http://trafikinfo.bane.dk/Trafikinformation/AfgangAnkomst/" + arrivalDeparture + "/" + stationcode + "/" + typeString + "/UdvidetVisning"; + + //logger.info("URI: " + uri); + JsoupInvocation wrapper = new JsoupInvocation( new URL(uri), replyTimeout); + CircuitBreaker breaker = CircuitBreakerManager.getManager().getCircuitBreaker("banedk"); + + Document page = (Document) breaker.invoke(wrapper); + + String tableName = arrival == false ? "afgangtabel" : "ankomsttabel"; + Element table = page.getElementById(tableName); + + if (table != null) { + Elements tableRows = table.getElementsByTag("tr"); + + boolean tidsstregExists = (table.getElementsByAttributeValue("class", "Tidsstreg").size() > 0); + boolean passedTidsstreg = false; + + for (Element currentRow : tableRows) { + String rowClass = currentRow.attr("class"); + + if (tidsstregExists == true && passedTidsstreg == false) { + if (currentRow.getElementsByAttributeValue("class", "Tidsstreg").size() > 0) { + passedTidsstreg = true; + } else { + continue; + } + } + + if (rowClass != null && rowClass.toLowerCase().contains("station") ) { + + Elements fields = currentRow.getElementsByTag("td"); + + DepartureEntry departure = new DepartureEntry(); + + String time = fields.get(0).text(); + if (time.equals("")) + time = "0:00"; //Bane.dk bug work-around + departure.setTime(time); + + int updated = extractUpdated( fields.get(1) ); + departure.setUpdated(updated); + + String trainNumber = fields.get(2).text(); + if (type == TrainType.STOG) //If it is S-train we need to extract the trainNumber + trainNumber = trainNumber + " " + extractTrainNumberAzure(fields.get(2)); + departure.setTrainNumber(trainNumber); + + String destination = fields.get(3).text(); + departure.setDestination(destination); + + String origin = fields.get(4).text(); + departure.setOrigin(origin); + + String location = fields.get(5).text(); + departure.setLocation(location); + + String status = fields.get(6).text().trim(); + departure.setStatus(status); + + String note = extractNote( fields.get(7) ); + departure.setNote(note); + + departure.setType(typeString); + + departureBean.departureEntries.add( departure ); + } + } + } else { + logger.warning("No departures found for station=" + stationcode + ", type=" + type); + } + + Element notifDiv = page.getElementById("station_planlagte_text"); + if (notifDiv != null) { + + Elements tables = notifDiv.getElementsByTag("table"); + for (Element tab : tables) { + + Elements anchors = tab.getElementsByTag("a"); + if (anchors.size() == 2) { + departureBean.notifications.add( anchors.get(1).text() ); + } } + + } + + + return departureBean; + } + + + + public static String cleanText(String input) { + //apparently JSoup translates   characters on www.bane.dk to 0xA0 + return input.replace((char) 0xA0, (char)0x20).trim(); + } + + public DepartureBean lookupDeparturesWwwSite(String stationcode, TrainType trainType, boolean arrival) throws Exception { + + DepartureBean departureBean = new DepartureBean(); + + String type = getTypeStringWww(trainType); + + stationcode = URLEncoder.encode(stationcode, "ISO-8859-1"); + + + String uri = "http://www.bane.dk/visStation.asp?ArtikelID=4275&W=" + type + "&S=" + stationcode; + logger.info("URI:" + uri); + JsoupInvocation wrapper = new JsoupInvocation( new URL(uri), replyTimeout); + CircuitBreaker breaker = CircuitBreakerManager.getManager().getCircuitBreaker("banedk"); + + Element page = (Element) breaker.invoke(wrapper); + + String tableName = arrival == false ? "afgangtabel" : "ankomsttabel"; + Element table = page.getElementById(tableName); + + + + if (table != null) { + Elements tableRows = table.getElementsByTag("tr"); + + boolean passedTidsstreg = false; + boolean tidsstregExists = (table.getElementsByAttributeValue("class", "Tidsstreg").size() > 0); + + for (Element currentRow : tableRows) { + String rowClass = currentRow.attr("class"); + + if (tidsstregExists == true && passedTidsstreg == false) { + if (currentRow.getElementsByAttributeValue("class", "Tidsstreg").size() > 0) { + passedTidsstreg = true; + } else { + continue; + } + } + + + if (rowClass != null && rowClass.toLowerCase().contains("station") ) { + Elements fields = currentRow.getElementsByTag("td"); + + DepartureEntry departure = new DepartureEntry(); + + + + String time = cleanText( fields.get(0).getAllElements().get(2).text() ); + if (time.equals("")) + time = "0:00"; //Bane.dk bug work-around + departure.setTime(time); + + int updated = extractUpdated( fields.get(1) ); + departure.setUpdated(updated); + + String trainNumber = cleanText( fields.get(2).text() ); + if (type.equalsIgnoreCase("S2")) //If it is S-train we need to extract the trainNumber + trainNumber = trainNumber + " " + extractTrainNumberWww(fields.get(2)); + departure.setTrainNumber(trainNumber); + + String destination = cleanText( fields.get(3).text() ); + departure.setDestination(destination); + + String origin = cleanText( fields.get(4).text() ); + departure.setOrigin(origin); + + String location = cleanText( fields.get(5).text() ); + departure.setLocation(location); + + String status = cleanText( fields.get(6).text() ); + departure.setStatus(status); + + String note = cleanText( extractNote( fields.get(7) ) ); + departure.setNote(note); + + departure.setType(type); + + departureBean.departureEntries.add(departure); + + + } + } + } else { + logger.warning("No departures found for station=" + stationcode + ", type=" + type); } - return departureList; + + return departureBean; } + - private int extractUpdated(HtmlElement updatedTd) { //extract the digit (in this case: 4) from "media/trafikinfo/opdater4.gif" + private int extractUpdated(Element updatedTd) { //extract the digit (in this case: 4) from "media/trafikinfo/opdater4.gif" int updated = -1; - DomNodeList updatedImgs = updatedTd.getElementsByTagName("img"); - String updatedStr = updatedImgs.get(0).getAttribute("src"); + Elements updatedImgs = updatedTd.getElementsByTag("img"); + String updatedStr = updatedImgs.get(0).attr("src"); if (updatedStr != null) { for (int i=0; i 0 && note.charAt(note.length()-1) == 'i') + note = note.substring(0,note.length() -1 ); + + return note.trim(); + } + + private String extractTrainNumberAzure(Element trainTd) { + Element anchorElement = trainTd.getElementsByTag("a").get(0); + String href = anchorElement.attr("href"); + + int pos = href.lastIndexOf('/'); + String number = href.substring(pos+1); + + return number; + } + + private String extractTrainNumberWww(Element trainTd) { + String number = ""; + Element anchorElement = trainTd.getElementsByTag("a").get(0); + String href = anchorElement.attr("href"); + String argstring = href.substring( href.indexOf('?') + 1); + + String args[] = argstring.split("&"); + for (String arg : args) { + String pair[] = arg.split("="); // Key=pair[0], Value=pair[1] + + if (pair[0].equalsIgnoreCase("TogNr")) + number = pair[1]; + } + + + return number; + } + + //test - public static void main(String args[]) throws Exception{ + /* + public static void main(String args[]) throws Exception { DepartureFetcher f = new DepartureFetcher(); List deps = f.lookupDepartures("AR", "FJRN"); for(DepartureBean d : deps) { @@ -133,5 +384,5 @@ } System.out.println("--------------------------"); - } + }*/ }