();
final Matcher mConCoarse = P_CONNECTIONS_COARSE.matcher(page);
while (mConCoarse.find())
{
final Matcher mConFine = P_CONNECTIONS_FINE.matcher(mConCoarse.group(1));
if (mConFine.matches())
{
final String link = API_BASE + ParserUtils.resolveEntities(mConFine.group(3));
if (mConFine.group(6) == null)
{
Date date;
if (mConFine.group(1) != null)
date = parseDate(mConFine.group(1), mConFine.group(2), new SimpleDateFormat("yyyy").format(currentDate));
else
date = currentDate;
Date departureTime = ParserUtils.joinDateTime(date, ParserUtils.parseTime(mConFine.group(4)));
if (!connections.isEmpty())
{
final long diff = ParserUtils.timeDiff(departureTime, connections.get(connections.size() - 1).departureTime);
if (diff > PARSER_DAY_ROLLOVER_THRESHOLD_MS)
departureTime = ParserUtils.addDays(departureTime, -1);
else if (diff < -PARSER_DAY_ROLLOVER_THRESHOLD_MS)
departureTime = ParserUtils.addDays(departureTime, 1);
}
Date arrivalTime = ParserUtils.joinDateTime(date, ParserUtils.parseTime(mConFine.group(5)));
if (departureTime.after(arrivalTime))
arrivalTime = ParserUtils.addDays(arrivalTime, 1);
final Connection connection = new Connection(ParserUtils.extractId(link), link, departureTime, arrivalTime, null, null, 0,
from, 0, to, null);
connections.add(connection);
}
else
{
final int min = Integer.parseInt(mConFine.group(6)) * 60 + Integer.parseInt(mConFine.group(7));
final Calendar calendar = new GregorianCalendar();
final Date departureTime = calendar.getTime();
calendar.add(Calendar.MINUTE, min);
final Date arrivalTime = calendar.getTime();
final Connection connection = new Connection(ParserUtils.extractId(link), link, departureTime, arrivalTime, null, null, 0,
from, 0, to, null);
connections.add(connection);
}
}
else
{
throw new IllegalArgumentException("cannot parse '" + mConCoarse.group(1) + "' on " + uri);
}
}
return new QueryConnectionsResult(uri, from, to, currentDate, linkEarlier, linkLater, connections);
}
else
{
throw new IOException(page.toString());
}
}
// Matches the head of the "Detailansicht" page and captures the date shown after "Datum:":
// group 1 = day of month, group 2 = month abbreviation (3-4 word characters), group 3 = four-digit year.
// getConnectionDetails() applies it with matches() and hands the three groups to parseDate().
// NOTE(review): group 2 relies on \w matching the umlaut in "Mär" (see MONTHS); on a stock JVM \w is
// ASCII-only unless UNICODE_CHARACTER_CLASS is set -- confirm the behaviour of the regex engine this runs on.
private static final Pattern P_CONNECTION_DETAILS_HEAD = Pattern.compile(".*?Detailansicht.*?" //
+ "Datum:[\\xa0\\s]+\\w{2}\\.,\\s(\\d+)\\.\\s(\\w{3,4})\\.[\\xa0\\s]+(\\d{4}).*?", Pattern.DOTALL);
// Splits the details page into rows. getConnectionDetails() iterates over the matches with find() and reads
// groups 1 to 4: group 1 as the "zebra" marker of the row, groups 2-4 concatenated as the row content.
// NOTE(review): only three capturing groups are visible in this literal and its string pieces are broken
// across lines, which suggests markup inside the pattern was lost -- verify against the version-controlled file.
private static final Pattern P_CONNECTION_DETAILS_COARSE = Pattern.compile("" //
+ "\r\\x0a(.+?)
.*?" //
+ "\r\\x0a(.+?)
.*?" //
+ "\r\\x0a(.+?)
", Pattern.DOTALL);
// Parses the concatenated content of one details row. It has three alternatives: a trip (departure time and
// station, line, destination, arrival time and station), a footway (departure, minutes, arrival), and a
// catch-all for rows that carry neither.
// NOTE(review): getConnectionDetails() reads groups 1-7 for a trip (with the product in group 3) and
// groups 8-10 for a footway, but only nine capturing groups are visible here and the product part is
// non-capturing -- markup inside the literal appears to have been lost; verify against the original file.
static final Pattern P_CONNECTION_DETAILS_FINE = Pattern.compile("(?:" //
+ "ab (\\d{1,2}:\\d{2})\\s(.*?)\\s*<.*?" // departureTime, departure
+ "(?: .*?)?" // product
+ " | \\s*(.*?)\\s* Richtung\\s*(.*?)\\s* | .*?" // line, destination
+ "an (\\d{1,2}:\\d{2})\\s(.*?)\\s*<" // arrivalTime, arrival
+ "|" //
+ " | ab (.*?)\\s*<.*?" // departure
+ "Fußweg[\\xa0\\s]+\\(ca\\.[\\xa0\\s]+(\\d+)[\\xa0\\s]+Minute.*?" // min
+ " | an (.*?)\\s*<" // arrival
+ "|" //
+ ".*? " //
+ ").*?", Pattern.DOTALL);
// Detects the "session has expired" message, ignoring case. getConnectionDetails() searches the page for it
// with find() when the head pattern did not match, and throws SessionExpiredException on a hit.
private static final Pattern P_CONNECTION_DETAILS_ERRORS = Pattern.compile("(session has expired)", Pattern.CASE_INSENSITIVE);
/**
 * Scrapes a connection details page and assembles one connection from its rows.
 * <p>
 * The date comes from the page head. Every row found by P_CONNECTION_DETAILS_COARSE is parsed with
 * P_CONNECTION_DETAILS_FINE into either a trip (fine group 1 present) or a footway (fine group 8 present);
 * rows that match but fill neither group are ignored. A footway directly following another footway is merged
 * into it. If the page head does not match and the page contains the session-expiry message, a
 * SessionExpiredException is thrown.
 *
 * @param uri
 *            address of the details page; also passed on as the connection's link and to
 *            ParserUtils.extractId()
 * @return the current time together with the assembled connection
 * @throws IOException
 *             with the page text as message, if the page head does not match and no session-expiry message
 *             is found
 * @throws IllegalArgumentException
 *             if a row cannot be parsed, or if two consecutive rows carry the same zebra value
 */
public GetConnectionDetailsResult getConnectionDetails(final String uri) throws IOException
{
final CharSequence page = ParserUtils.scrape(uri);
final Matcher mHead = P_CONNECTION_DETAILS_HEAD.matcher(page);
if (mHead.matches())
{
// head groups: day, month abbreviation, year
final Date currentDate = parseDate(mHead.group(1), mHead.group(2), mHead.group(3));
final List parts = new ArrayList(4);
// NOTE(review): lastTime refers to the same Date object as currentDate, and upTime() updates lastTime in
// place, so currentDate changes as well while rows are processed -- confirm this is intended.
Date lastTime = currentDate;
// overall endpoints of the connection, filled in while walking the rows
Date firstDepartureTime = null;
String firstDeparture = null;
Date lastArrivalTime = null;
String lastArrival = null;
// zebra value of the previous row, used to detect a skipped row
String oldZebra = null;
final Matcher mDetCoarse = P_CONNECTION_DETAILS_COARSE.matcher(page);
while (mDetCoarse.find())
{
// two consecutive rows with the same zebra value are treated as a sign that a row in between was not matched
final String zebra = mDetCoarse.group(1);
if (oldZebra != null && zebra.equals(oldZebra))
throw new IllegalArgumentException("missed row? last:" + zebra);
else
oldZebra = zebra;
// the remaining coarse groups are joined and parsed as one unit
final String set = mDetCoarse.group(2) + mDetCoarse.group(3) + mDetCoarse.group(4);
final Matcher mDetFine = P_CONNECTION_DETAILS_FINE.matcher(set);
if (mDetFine.matches())
{
if (mDetFine.group(1) != null)
{
// trip row: times are joined with the page date and pushed forward by upTime() so they never run backwards
final Date departureTime = upTime(lastTime, ParserUtils.joinDateTime(currentDate, ParserUtils.parseTime(mDetFine.group(1))));
final String departure = ParserUtils.resolveEntities(mDetFine.group(2));
if (departure != null && firstDeparture == null)
firstDeparture = departure;
final String product = ParserUtils.resolveEntities(mDetFine.group(3));
final String line = ParserUtils.resolveEntities(mDetFine.group(4));
final String destination = ParserUtils.resolveEntities(mDetFine.group(5));
final Date arrivalTime = upTime(lastTime, ParserUtils.joinDateTime(currentDate, ParserUtils.parseTime(mDetFine.group(6))));
final String arrival = ParserUtils.resolveEntities(mDetFine.group(7));
final String normalizedLine = normalizeLine(product, line);
// the colors for the trip are looked up in LINES by the normalized label
parts.add(new Connection.Trip(normalizedLine, LINES.get(normalizedLine), destination, departureTime, null, 0, departure,
arrivalTime, null, 0, arrival));
if (firstDepartureTime == null)
firstDepartureTime = departureTime;
lastArrival = arrival;
lastArrivalTime = arrivalTime;
}
else if (mDetFine.group(8) != null)
{
// footway row: carries a duration in minutes but no clock times
final String departure = ParserUtils.resolveEntities(mDetFine.group(8));
if (departure != null && firstDeparture == null)
firstDeparture = departure;
final String min = mDetFine.group(9);
final String arrival = ParserUtils.resolveEntities(mDetFine.group(10));
if (parts.size() > 0 && parts.get(parts.size() - 1) instanceof Connection.Footway)
{
// merge with the preceding footway: minutes are summed, the earlier departure and this arrival are kept
final Connection.Footway lastFootway = (Connection.Footway) parts.remove(parts.size() - 1);
parts.add(new Connection.Footway(lastFootway.min + Integer.parseInt(min), 0, lastFootway.departure, 0, arrival));
}
else
{
parts.add(new Connection.Footway(Integer.parseInt(min), 0, departure, 0, arrival));
}
lastArrival = arrival;
}
}
else
{
throw new IllegalArgumentException("cannot parse '" + set + "' on " + uri);
}
}
// a connection consisting of a single footway has no times from the page: use the current time as departure
// and add the walking minutes to get the arrival
if (firstDepartureTime == null && lastArrivalTime == null && parts.size() == 1 && parts.get(0) instanceof Connection.Footway)
{
final Calendar calendar = new GregorianCalendar();
firstDepartureTime = calendar.getTime();
calendar.add(Calendar.MINUTE, ((Connection.Footway) parts.get(0)).min);
lastArrivalTime = calendar.getTime();
}
return new GetConnectionDetailsResult(new Date(), new Connection(ParserUtils.extractId(uri), uri, firstDepartureTime, lastArrivalTime,
null, null, 0, firstDeparture, 0, lastArrival, parts));
}
else
{
// no recognizable head: distinguish an expired session from any other unexpected page
if (P_CONNECTION_DETAILS_ERRORS.matcher(page).find())
throw new SessionExpiredException();
else
throw new IOException(page.toString());
}
}
/**
 * Pushes a time forward, one day at a time via ParserUtils.addDays(), until it is no longer before the
 * previous time, and then records the result as the new previous time.
 *
 * @param lastTime
 *            time of the preceding event; overwritten in place with the returned time
 * @param time
 *            candidate time
 * @return the candidate time, shifted forward as far as needed so that it is not before {@code lastTime}
 */
private static Date upTime(final Date lastTime, Date time)
{
	Date shifted = time;
	while (shifted.before(lastTime))
	{
		shifted = ParserUtils.addDays(shifted, 1);
	}

	// remember the accepted time in the caller's Date object
	final long acceptedMillis = shifted.getTime();
	lastTime.setTime(acceptedMillis);
	return shifted;
}
/**
 * Builds the departures query URI (an XSLT_DM_REQUEST call below API_BASE) for a stop.
 *
 * @param stationId
 *            id of the stop; appended as-is as the value of the name_dm parameter
 * @param maxDepartures
 *            not used by this implementation
 * @return the request URI
 */
public String departuresQueryUri(final String stationId, final int maxDepartures)
{
	final StringBuilder query = new StringBuilder();
	query.append(API_BASE).append("XSLT_DM_REQUEST") //
			.append("?outputFormat=XML") //
			.append("&coordOutputFormat=WGS84") //
			.append("&type_dm=stop") //
			.append("&name_dm=").append(stationId) //
			.append("&mode=direct");
	return query.toString();
}
// Line label patterns used by normalizeLine() when the page supplies no product. Each one is applied with
// matches(), i.e. against the whole label, and the pattern that matches decides the prefix of the result.
// two digits, the first being 1 or 2 -> prefix "T"
private static final Pattern P_NORMALIZE_LINE_TRAM = Pattern.compile("[12]\\d");
// "N" followed by two digits, the first being 1 or 2 -> prefix "T"
private static final Pattern P_NORMALIZE_LINE_NACHTTRAM = Pattern.compile("N[12]\\d");
// two digits, the first being 5 or 6 -> prefix "B"
private static final Pattern P_NORMALIZE_LINE_METROBUS = Pattern.compile("[56]\\d");
// three digits starting with 1 -> prefix "B"
private static final Pattern P_NORMALIZE_LINE_STADTBUS = Pattern.compile("1\\d{2}");
// "N" followed by two digits, the first being 4 or 8 -> prefix "B"
private static final Pattern P_NORMALIZE_LINE_NACHTBUS = Pattern.compile("N[48]\\d");
// three digits, optionally followed by one capital letter -> prefix "B"
private static final Pattern P_NORMALIZE_LINE_REGIONALBUS = Pattern.compile("\\d{3}[A-Z]?");
// four digits -> prefix "?"
private static final Pattern P_NORMALIZE_LINE_NUMBER = Pattern.compile("\\d{4}");
/**
 * Turns the product and line label scraped from a details row into a normalized line label: a short prefix
 * ("B", "T", "U", "S", "R", "I", "F" or "?") followed by the line name.
 * <p>
 * With a product, the product decides the prefix and a leading product word in the label (for example
 * "Tram " or "StadtBus ") is cut off. Without a product, the prefix is derived from the shape of the label.
 *
 * @param product
 *            product name from the page ("Bus", "Tram", "U-Bahn", "S-Bahn", "Zug", "Schiff" or "Seilbahn"),
 *            or {@code null} if the page gave none
 * @param line
 *            line label from the page; must not be {@code null}
 * @return the normalized line label
 * @throws IllegalStateException
 *             if the product is unknown or the label cannot be normalized for it; this includes labels that
 *             consist of nothing but the product word and train labels without a number
 */
private String normalizeLine(final String product, final String line)
{
	if (product == null)
		return normalizeLineWithoutProduct(line);

	if (product.equals("Bus"))
		return "B" + stripProductLabel(product, line, "Bus", "StadtBus", "MetroBus", "Regionalbus");
	if (product.equals("Tram"))
		return "T" + stripProductLabel(product, line, "Tram");
	if (product.equals("U-Bahn"))
		return "U" + stripProductLabel(product, line, "U-Bahn");
	if (product.equals("S-Bahn"))
		return "S" + stripProductLabel(product, line, "S-Bahn");
	if (product.equals("Zug"))
		return normalizeTrainLine(product, line);
	if (product.equals("Schiff"))
		return "F" + line;
	if (product.equals("Seilbahn")) // strangely marked as 'Seilbahn', but means 'Schienenersatzverkehr'
		return "BSEV" + line;

	throw new IllegalStateException("cannot normalize product " + product + " line " + line);
}

/** Derives the normalized label from the shape of the line label alone; the order of the checks is significant. */
private static String normalizeLineWithoutProduct(final String line)
{
	if (P_NORMALIZE_LINE_METROBUS.matcher(line).matches() //
			|| P_NORMALIZE_LINE_STADTBUS.matcher(line).matches() //
			|| P_NORMALIZE_LINE_NACHTBUS.matcher(line).matches() //
			|| line.equals("N117") // replacement bus for N17
			|| P_NORMALIZE_LINE_REGIONALBUS.matcher(line).matches())
		return "B" + line;
	if (line.equals("Schienenersatzverkehr"))
		return "BSEV";
	if (P_NORMALIZE_LINE_TRAM.matcher(line).matches() || P_NORMALIZE_LINE_NACHTTRAM.matcher(line).matches())
		return "T" + line;
	// S- and U-Bahn labels are recognized by an existing color entry for the prefixed label
	if (LINES.containsKey("S" + line) || line.equals("S20/27"))
		return "S" + line;
	if (LINES.containsKey("U" + line))
		return "U" + line;
	// ALX = Alex, BOB = Bayerische Oberlandbahn, VBG = Vogtlandbahn
	if (hasAnyPrefix(line, "D ", "RE ", "RB ", "ALX ", "BOB ", "VBG "))
		return "R" + line;
	if (hasAnyPrefix(line, "ICE ", "IC ", "EC ", "CNL "))
		return "I" + line;
	if (P_NORMALIZE_LINE_NUMBER.matcher(line).matches())
		return "?" + line;

	throw new IllegalStateException("cannot normalize null product, line " + line);
}

/** Normalizes a "Zug" label of the form "TYPE NUMBER" according to the train type. */
private static String normalizeTrainLine(final String product, final String line)
{
	final String[] lineParts = line.split("\\s+");
	// a label without a number used to fail with ArrayIndexOutOfBoundsException; it is now reported like
	// every other label that cannot be normalized
	if (lineParts.length >= 2)
	{
		final String type = lineParts[0];
		final String number = lineParts[1];
		// EN = EuroNight, RJ = Railjet (Austria), IRE = Franken-Sachsen-Express
		if (isAnyOf(type, "IC", "ICE", "EC", "EN", "CNL", "RJ", "IRE"))
			return "I" + type + number;
		// BRB = Bayerische Regiobahn, ALX = Laenderbahn and Vogtlandbahn, ERB = Eurobahn
		if (isAnyOf(type, "RB", "RE", "D", "BOB", "BRB", "ALX", "ERB"))
			return "R" + type + number;
		// NOTE(review): Vogtlandbahn keeps the raw label (including whitespace), unlike the other regional
		// types -- kept as it was; confirm whether this is intended.
		if (type.equals("VBG"))
			return "R" + line;
	}

	throw new IllegalStateException("cannot normalize product " + product + " line " + line);
}

/**
 * Cuts the first matching product word and the single separator character after it off the label. Returns the
 * label unchanged if it starts with none of the given words.
 */
private static String stripProductLabel(final String product, final String line, final String... labels)
{
	for (final String label : labels)
	{
		if (line.startsWith(label))
		{
			final int start = label.length() + 1;
			// a label consisting of just the product word used to fail with StringIndexOutOfBoundsException
			if (line.length() < start)
				throw new IllegalStateException("cannot normalize product " + product + " line " + line);
			return line.substring(start);
		}
	}
	return line;
}

/** Tells whether the label starts with at least one of the given prefixes. */
private static boolean hasAnyPrefix(final String line, final String... prefixes)
{
	for (final String prefix : prefixes)
		if (line.startsWith(prefix))
			return true;
	return false;
}

/** Tells whether the value equals at least one of the given candidates. */
private static boolean isAnyOf(final String value, final String... candidates)
{
	for (final String candidate : candidates)
		if (candidate.equals(value))
			return true;
	return false;
}
/**
 * Builds a date from its textual parts. All other calendar fields are cleared, and the calendar is created
 * with the default time zone and locale.
 *
 * @param day
 *            day of month as decimal digits
 * @param month
 *            month abbreviation as understood by parseMonth()
 * @param year
 *            year as decimal digits
 * @return the corresponding date
 * @throws IllegalArgumentException
 *             if the month is unknown; day or year that are not numbers raise NumberFormatException
 */
private static Date parseDate(final String day, final String month, final String year)
{
	// parse in the same order as the arguments so that the first malformed part is the one reported
	final int dayOfMonth = Integer.parseInt(day);
	final int monthIndex = parseMonth(month);
	final int yearNumber = Integer.parseInt(year);

	final Calendar result = new GregorianCalendar();
	result.clear();
	result.set(yearNumber, monthIndex, dayOfMonth);
	return result.getTime();
}
/** Month abbreviations as they appear on the page; the position in the array is the zero-based month number. */
private static final String[] MONTHS = { "Jan", "Feb", "Mär", "Apr", "Mai", "Jun", "Jul", "Aug", "Sept", "Okt", "Nov", "Dez" };

/**
 * Looks up the zero-based month number of a month abbreviation. The comparison is exact and case-sensitive.
 *
 * @param month
 *            abbreviation to look up
 * @return index of the abbreviation in MONTHS, 0 for "Jan" up to 11 for "Dez"
 * @throws IllegalArgumentException
 *             if the abbreviation is not contained in MONTHS
 */
private static int parseMonth(final String month)
{
	int index = 0;
	for (final String candidate : MONTHS)
	{
		if (candidate.equals(month))
			return index;
		index++;
	}

	throw new IllegalArgumentException("cannot parse month: " + month);
}
/**
 * Colors per line, keyed by normalized line label (the form produced by normalizeLine()). The entries marked
 * "generic" are keyed by the bare prefix. Each value is an array of color ints.
 * NOTE(review): the meaning of the array positions is not visible here -- presumably background first, then
 * foreground, then an optional third color; confirm against the code that consumes lineColors().
 * <p>
 * The map is declared with its type arguments so that lookups yield {@code int[]} without a cast.
 */
private static final Map<String, int[]> LINES = new HashMap<String, int[]>();
static
{
	LINES.put("I", new int[] { Color.WHITE, Color.RED, Color.RED }); // generic
	LINES.put("R", new int[] { Color.WHITE, Color.RED, Color.RED }); // generic
	LINES.put("S", new int[] { Color.parseColor("#006e34"), Color.WHITE }); // generic
	LINES.put("U", new int[] { Color.parseColor("#003090"), Color.WHITE }); // generic
	LINES.put("SS1", new int[] { Color.parseColor("#00ccff"), Color.WHITE });
	LINES.put("SS2", new int[] { Color.parseColor("#66cc00"), Color.WHITE });
	LINES.put("SS3", new int[] { Color.parseColor("#880099"), Color.WHITE });
	LINES.put("SS4", new int[] { Color.parseColor("#ff0033"), Color.WHITE });
	LINES.put("SS6", new int[] { Color.parseColor("#00aa66"), Color.WHITE });
	LINES.put("SS7", new int[] { Color.parseColor("#993333"), Color.WHITE });
	LINES.put("SS8", new int[] { Color.BLACK, Color.parseColor("#ffcc00") });
	LINES.put("SS20", new int[] { Color.BLACK, Color.parseColor("#ffaaaa") });
	LINES.put("SS27", new int[] { Color.parseColor("#ffaaaa"), Color.WHITE });
	LINES.put("SA", new int[] { Color.parseColor("#231f20"), Color.WHITE });
	LINES.put("T12", new int[] { Color.parseColor("#883388"), Color.WHITE });
	LINES.put("T15", new int[] { Color.parseColor("#3366CC"), Color.WHITE });
	LINES.put("T16", new int[] { Color.parseColor("#CC8833"), Color.WHITE });
	LINES.put("T17", new int[] { Color.parseColor("#993333"), Color.WHITE });
	LINES.put("T18", new int[] { Color.parseColor("#66bb33"), Color.WHITE });
	LINES.put("T19", new int[] { Color.parseColor("#cc0000"), Color.WHITE });
	LINES.put("T20", new int[] { Color.parseColor("#00bbee"), Color.WHITE });
	LINES.put("T21", new int[] { Color.parseColor("#33aa99"), Color.WHITE });
	LINES.put("T23", new int[] { Color.parseColor("#fff000"), Color.WHITE });
	LINES.put("T25", new int[] { Color.parseColor("#ff9999"), Color.WHITE });
	LINES.put("T27", new int[] { Color.parseColor("#ff6600"), Color.WHITE });
	LINES.put("TN17", new int[] { Color.parseColor("#999999"), Color.parseColor("#ffff00") });
	LINES.put("TN19", new int[] { Color.parseColor("#999999"), Color.parseColor("#ffff00") });
	LINES.put("TN20", new int[] { Color.parseColor("#999999"), Color.parseColor("#ffff00") });
	LINES.put("TN27", new int[] { Color.parseColor("#999999"), Color.parseColor("#ffff00") });
	LINES.put("UU1", new int[] { Color.parseColor("#227700"), Color.WHITE });
	LINES.put("UU2", new int[] { Color.parseColor("#bb0000"), Color.WHITE });
	LINES.put("UU2E", new int[] { Color.parseColor("#bb0000"), Color.WHITE });
	LINES.put("UU3", new int[] { Color.parseColor("#ee8800"), Color.WHITE });
	LINES.put("UU4", new int[] { Color.parseColor("#00ccaa"), Color.WHITE });
	LINES.put("UU5", new int[] { Color.parseColor("#bb7700"), Color.WHITE });
	LINES.put("UU6", new int[] { Color.parseColor("#0000cc"), Color.WHITE });
}

/**
 * Looks up the colors registered for a line.
 *
 * @param line
 *            normalized line label
 * @return the color array stored for the label (the stored array itself, not a copy), or {@code null} if
 *         there is no entry for it
 */
public int[] lineColors(final String line)
{
	return LINES.get(line);
}
}
|