/[projects]/android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java
ViewVC logotype

Contents of /android/TrainInfoService/src/dk/thoerup/traininfoservice/banedk/DepartureFetcher.java

Parent Directory | Revision Log


Revision 1038 - (show annotations) (download)
Sun Sep 12 18:41:17 2010 UTC (13 years, 8 months ago) by torben
File size: 11349 byte(s)
Make jsoup act correct with old site
1 package dk.thoerup.traininfoservice.banedk;
2
3
4 import java.net.URL;
5 import java.net.URLEncoder;
6 import java.util.Collections;
7 import java.util.Map;
8 import java.util.logging.Logger;
9
10 import org.jsoup.nodes.Document;
11 import org.jsoup.nodes.Element;
12 import org.jsoup.select.Elements;
13
14 import dk.thoerup.circuitbreaker.CircuitBreaker;
15 import dk.thoerup.circuitbreaker.CircuitBreakerManager;
16 import dk.thoerup.traininfoservice.StationBean;
17 import dk.thoerup.traininfoservice.StationDAO;
18 import dk.thoerup.traininfoservice.Statistics;
19
20 public class DepartureFetcher {
21
/**
 * The two kinds of train service this fetcher can query:
 * {@code STOG} (S-train) and {@code REGIONAL}.
 */
enum TrainType { STOG, REGIONAL }
26
27 Logger logger = Logger.getLogger(DepartureFetcher.class.getName());
28
29 Map<String, DepartureBean> cache;
30
31 StationDAO stationDao = new StationDAO();
32
33 private boolean useAzureSite;
34 private int replyTimeout;
35
36 public DepartureFetcher(boolean azureSite, int cacheTimeout, int replyTimeout) {
37 this.replyTimeout = replyTimeout;
38 useAzureSite = azureSite;
39 cache = new TimeoutMap<String,DepartureBean>(cacheTimeout);
40 }
41
42
43
44
45 public DepartureBean cachedLookupDepartures(int stationID, boolean arrival) throws Exception {
46 final String key = "" + stationID + ":" + arrival;
47
48 DepartureBean departureBean = cache.get(key);
49
50
51 if (departureBean == null) {
52 departureBean = lookupDepartures(stationID,arrival);
53 cache.put(key, departureBean);
54 } else {
55 Statistics.getInstance().incrementDepartureCacheHits();
56 logger.info("Departure: Cache hit " + key); //remove before production
57 }
58 return departureBean;
59 }
60
61
62 public DepartureBean lookupDepartures(int stationID, boolean arrival) throws Exception {
63
64 DepartureBean departureBean = new DepartureBean();
65
66 StationBean station = stationDao.getById(stationID);
67
68 departureBean.stationName = station.getName();
69
70 if (station.getRegional() != null) {
71 DepartureBean tempBean = lookupDepartures(station.getRegional(), TrainType.REGIONAL, arrival);
72 departureBean.departureEntries.addAll( tempBean.departureEntries );
73 departureBean.notifications.addAll(tempBean.notifications);
74 }
75
76 if (station.getStrain() != null) {
77 DepartureBean tempBean = lookupDepartures(station.getStrain(), TrainType.STOG, arrival);
78 departureBean.departureEntries.addAll( tempBean.departureEntries );
79 departureBean.notifications.addAll(tempBean.notifications);
80 }
81
82 if (departureBean.departureEntries.size() == 0) {
83 logger.info("No departures found for station " + stationID);
84 }
85
86 Collections.sort( departureBean.departureEntries );
87
88
89 return departureBean;
90 }
91
92 public DepartureBean lookupDepartures(String stationcode, TrainType type, boolean arrival) throws Exception {
93 if (useAzureSite == true) {
94 return lookupDeparturesAzureSite(stationcode, type, arrival);
95 } else {
96 return lookupDeparturesWwwSite(stationcode, type, arrival);
97 }
98 }
99
100 private String getTypeStringAzure(TrainType type) {
101 switch (type) {
102 case STOG:
103 return "S-Tog";
104 case REGIONAL:
105 return "Fjerntog";
106 default:
107 return ""; //Can not happen
108 }
109 }
110
111 private String getTypeStringWww(TrainType type) {
112 switch (type) {
113 case STOG:
114 return "S2";
115 case REGIONAL:
116 return "FJRN";
117 default:
118 return ""; //Can not happen
119 }
120 }
121
122 public DepartureBean lookupDeparturesAzureSite(String stationcode, TrainType type, boolean arrival) throws Exception {
123
124 DepartureBean departureBean = new DepartureBean();
125
126
127 String typeString = getTypeStringAzure(type);
128 String arrivalDeparture = (arrival==false) ? "Afgang" : "Ankomst";
129
130 stationcode = URLEncoder.encode(stationcode,"ISO-8859-1");
131
132 String uri = "http://trafikinfo.bane.dk/Trafikinformation/AfgangAnkomst/" + arrivalDeparture + "/" + stationcode + "/" + typeString + "/UdvidetVisning";
133
134 //logger.info("URI: " + uri);
135 JsoupInvocation wrapper = new JsoupInvocation( new URL(uri), replyTimeout);
136 CircuitBreaker breaker = CircuitBreakerManager.getManager().getCircuitBreaker("banedk");
137
138 Document page = (Document) breaker.invoke(wrapper);
139
140 String tableName = arrival == false ? "afgangtabel" : "ankomsttabel";
141 Element table = page.getElementById(tableName);
142
143 if (table != null) {
144 Elements tableRows = table.getElementsByTag("tr");
145
146 boolean tidsstregExists = (table.getElementsByAttributeValue("class", "Tidsstreg").size() > 0);
147 boolean passedTidsstreg = false;
148
149 for (Element currentRow : tableRows) {
150 String rowClass = currentRow.attr("class");
151
152 if (tidsstregExists == true && passedTidsstreg == false) {
153 if (currentRow.getElementsByAttributeValue("class", "Tidsstreg").size() > 0) {
154 passedTidsstreg = true;
155 } else {
156 continue;
157 }
158 }
159
160 if (rowClass != null && rowClass.toLowerCase().contains("station") ) {
161
162 Elements fields = currentRow.getElementsByTag("td");
163
164 DepartureEntry departure = new DepartureEntry();
165
166 String time = fields.get(0).text();
167 if (time.equals(""))
168 time = "0:00"; //Bane.dk bug work-around
169 departure.setTime(time);
170
171 int updated = extractUpdated( fields.get(1) );
172 departure.setUpdated(updated);
173
174 String trainNumber = fields.get(2).text();
175 if (type == TrainType.STOG) //If it is S-train we need to extract the trainNumber
176 trainNumber = trainNumber + " " + extractTrainNumber(fields.get(2));
177 departure.setTrainNumber(trainNumber);
178
179 String destination = fields.get(3).text();
180 departure.setDestination(destination);
181
182 String origin = fields.get(4).text();
183 departure.setOrigin(origin);
184
185 String location = fields.get(5).text();
186 departure.setLocation(location);
187
188 String status = fields.get(6).text().trim();
189 departure.setStatus(status);
190
191 String note = extractNote( fields.get(7) );
192 departure.setNote(note);
193
194 departure.setType(typeString);
195
196 departureBean.departureEntries.add( departure );
197 }
198 }
199 } else {
200 logger.warning("No departures found for station=" + stationcode + ", type=" + type);
201 }
202
203 Element notifDiv = page.getElementById("station_planlagte_text");
204 if (notifDiv != null) {
205
206 Elements tables = notifDiv.getElementsByTag("table");
207 for (Element tab : tables) {
208
209 Elements anchors = tab.getElementsByTag("a");
210 if (anchors.size() == 2) {
211 departureBean.notifications.add( anchors.get(1).text() );
212 }
213 }
214
215 }
216
217
218 return departureBean;
219 }
220
221
222
223 String cleanText(String input) {
224 //apparently JSoup interprets some of space characters on www.bane.dk as 0xA0
225 return input.replace((char) 0xA0, (char)0x20).trim();
226 }
227
228 public DepartureBean lookupDeparturesWwwSite(String stationcode, TrainType trainType, boolean arrival) throws Exception {
229
230 DepartureBean departureBean = new DepartureBean();
231
232 String type = getTypeStringWww(trainType);
233
234
235 String uri = "http://www.bane.dk/visStation.asp?ArtikelID=4275&W=" + type + "&S=" + stationcode;
236 JsoupInvocation wrapper = new JsoupInvocation( new URL(uri), replyTimeout);
237 CircuitBreaker breaker = CircuitBreakerManager.getManager().getCircuitBreaker("banedk");
238
239 Element page = (Element) breaker.invoke(wrapper);
240
241 String tableName = arrival == false ? "afgangtabel" : "ankomsttabel";
242 Element table = page.getElementById(tableName);
243
244 if (table != null) {
245 Elements tableRows = table.getElementsByTag("tr");
246
247 for (Element currentRow : tableRows) {
248 String rowClass = currentRow.attr("class");
249 if (rowClass != null && rowClass.toLowerCase().contains("station") ) {
250 Elements fields = currentRow.getElementsByTag("td");
251
252 DepartureEntry departure = new DepartureEntry();
253
254
255
256 String time = cleanText( fields.get(0).getAllElements().get(2).text() );
257 if (time.equals(""))
258 time = "0:00"; //Bane.dk bug work-around
259 departure.setTime(time);
260
261 int updated = extractUpdated( fields.get(1) );
262 departure.setUpdated(updated);
263
264 String trainNumber = cleanText( fields.get(2).text() );
265 if (type.equalsIgnoreCase("S2")) //If it is S-train we need to extract the trainNumber
266 trainNumber = trainNumber + " " + extractTrainNumber(fields.get(2));
267 departure.setTrainNumber(trainNumber);
268
269 String destination = cleanText( fields.get(3).text() );
270 departure.setDestination(destination);
271
272 String origin = cleanText( fields.get(4).text() );
273 departure.setOrigin(origin);
274
275 String location = cleanText( fields.get(5).text() );
276 departure.setLocation(location);
277
278 String status = cleanText( fields.get(6).text() );
279 departure.setStatus(status);
280
281 String note = cleanText( extractNote( fields.get(7) ) );
282 departure.setNote(note);
283
284 departure.setType(type);
285
286 departureBean.departureEntries.add(departure);
287
288
289 }
290 }
291 } else {
292 logger.warning("No departures found for station=" + stationcode + ", type=" + type);
293 }
294
295
296 return departureBean;
297 }
298
299
300 private int extractUpdated(Element updatedTd) { //extract the digit (in this case: 4) from "media/trafikinfo/opdater4.gif"
301 int updated = -1;
302
303 Elements updatedImgs = updatedTd.getElementsByTag("img");
304 String updatedStr = updatedImgs.get(0).attr("src");
305
306 if (updatedStr != null) {
307 for (int i=0; i<updatedStr.length(); i++) {
308 char c = updatedStr.charAt(i);
309 if ( Character.isDigit(c)) {
310 updated = Character.digit(c, 10);
311 break;
312 }
313 }
314 }
315 return updated;
316 }
317
318 private String extractNote(Element noteTd) {
319 String note = noteTd.text().trim();
320
321
322 Elements elems = noteTd.getElementsByClass("bemtype");
323 if (elems.size() > 0 && note.charAt(note.length()-1) == 'i')
324 note = note.substring(0,note.length() -1 );
325
326 return note.trim();
327 }
328
329 private String extractTrainNumber(Element trainTd) {
330 Element anchorElement = trainTd.getElementsByTag("a").get(0);
331 String href = anchorElement.attr("href");
332
333 int pos = href.lastIndexOf('/');
334 String number = href.substring(pos+1);
335
336 return number;
337 }
338
339 //test
340 /*
341 public static void main(String args[]) throws Exception {
342 DepartureFetcher f = new DepartureFetcher();
343 List<DepartureBean> deps = f.lookupDepartures("AR", "FJRN");
344 for(DepartureBean d : deps) {
345 System.out.println( d.getTime() + ";" + d.getUpdated() + ";" + d.getTrainNumber() + ";" +
346 d.getDestination() + ";" + d.getOrigin() + ";" + d.getLocation() + ";" + d.getStatus() + ";" + d.getNote() );
347 }
348
349 System.out.println("--------------------------");
350 }*/
351 }

  ViewVC Help
Powered by ViewVC 1.1.20