#!/usr/bin/python3.4
# -*- coding: iso-8859-15 -*-
# $Id$
# $HeadURL$
"""This module contains winterrodeln specific functions that are processing the MediaWiki markup.
"""
import re
import xml.etree.ElementTree
import collections
import formencode
import wrpylib.wrvalidators
import wrpylib.mwmarkup


WRMAP_POINT_TYPES = ['gasthaus', 'haltestelle', 'parkplatz', 'achtung', 'foto', 'verleih', 'punkt']
WRMAP_LINE_TYPES = ['rodelbahn', 'gehweg', 'alternative', 'lift', 'anfahrt', 'linie']

# Rodelbahnbox property name -> sledrun attribute name. A tuple of two attribute
# names means that the property value is a pair that is spread over two attributes.
# The order is the order in which from_python emits the properties.
_RODELBAHNBOX_FIELDS = collections.OrderedDict([
    ('Position', ('position_latitude', 'position_longitude')),
    ('Position oben', ('top_latitude', 'top_longitude')),
    ('Höhe oben', 'top_elevation'),
    ('Position unten', ('bottom_latitude', 'bottom_longitude')),
    ('Höhe unten', 'bottom_elevation'),
    ('Länge', 'length'),
    ('Schwierigkeit', 'difficulty'),
    ('Lawinen', 'avalanches'),
    ('Betreiber', 'operator'),
    ('Öffentliche Anreise', 'public_transport'),
    ('Aufstieg möglich', 'walkup_possible'),
    ('Aufstieg getrennt', ('walkup_separate', 'walkup_separate_comment')),
    ('Gehzeit', 'walkup_time'),
    ('Aufstiegshilfe', ('lift', 'lift_details')),
    ('Beleuchtungsanlage', ('night_light', 'night_light_comment')),
    ('Beleuchtungstage', ('night_light_days', 'night_light_days_comment')),
    ('Rodelverleih', ('sled_rental', 'sled_rental_comment')),
    ('Gütesiegel', 'cachet'),
    ('Webauskunft', 'information_web'),
    ('Telefonauskunft', 'information_phone'),
    ('Bild', 'image'),
    ('In Übersichtskarte', 'show_in_overview'),
    ('Forumid', 'forum_id'),
])

# Gasthausbox property name -> inn attribute name (same conventions as above).
_GASTHAUSBOX_FIELDS = collections.OrderedDict([
    ('Position', ('position_latitude', 'position_longitude')),
    ('Höhe', 'position_elevation'),
    ('Betreiber', 'operator'),
    ('Sitzplätze', 'seats'),
    ('Übernachtung', ('overnight', 'overnight_comment')),
    ('Rauchfrei', ('nonsmoker_area', 'smoker_area')),
    ('Rodelverleih', ('sled_rental', 'sled_rental_comment')),
    ('Handyempfang', 'mobile_provider'),
    ('Homepage', 'homepage'),
    ('E-Mail', 'email_list'),
    ('Telefon', 'phone_list'),
    ('Bild', 'image'),
    ('Rodelbahnen', 'sledding_list'),
])

# Known googlemap path styles ("<width>#<aarrggbb>") and the wrmap line type they stand for.
_GOOGLEMAP_PATH_TYPES = {
    '6#ff014e9a': 'rodelbahn',
    '6#ffe98401': 'gehweg',
    '6#ff7f7fff': 'alternative',
    '3#ff000000': 'lift',
    '3#ffe1e100': 'anfahrt',
}

# GeoJSON property names produced by parse_wrmap -> wrmap XML attribute names.
_WRMAP_LINE_ATTRIBUTES = {'strokeColor': 'farbe', 'strokeWidth': 'dicke'}

# One "latitude [N] longitude [E]" pair including surrounding whitespace.
_WRMAP_COORDINATE_RE = re.compile(r'\s*(\d+\.?\d*)\s*N?\s+(\d+\.?\d*)\s*E?\s*')


class ParseError(RuntimeError):
    """Exception used by some of the functions"""


class _State(object):
    """Plain attribute container that is passed to the validators as formencode state."""


def _state_with(attribute, instance):
    """Returns None if instance is None, otherwise a state object having instance
    stored in the attribute with the given name."""
    if instance is None:
        return None
    state = _State()
    setattr(state, attribute, instance)
    return state


def _assign_properties(target, props, fields):
    """Copies the values of the dict props to attributes of target as described by fields.
    Keys of props that are not listed in fields are ignored. Returns target."""
    for key, value in props.items():
        attributes = fields.get(key)
        if attributes is None:
            continue
        if isinstance(attributes, tuple):
            # unpack first so that a malformed pair raises before anything is assigned
            first, second = value
            setattr(target, attributes[0], first)
            setattr(target, attributes[1], second)
        else:
            setattr(target, attributes, value)
    return target


def _collect_properties(source, fields):
    """Reads the attributes described by fields from source and returns them
    as OrderedDict of properties (in the order of fields)."""
    props = collections.OrderedDict()
    for key, attributes in fields.items():
        if isinstance(attributes, tuple):
            props[key] = tuple(getattr(source, attribute) for attribute in attributes)
        else:
            props[key] = getattr(source, attributes)
    return props


class RodelbahnboxDictConverter(formencode.Validator):
    """Converts a dict with Rodelbahnbox properties to a Sledrun class. Does no validation."""

    def to_python(self, value, state=None):
        """value is a dict of properties. If state is an object with the attribute sledrun,
        this sledrun class will be populated or updated. Otherwise a new, empty
        object is created and populated. Unknown properties are ignored.

        :return: the populated sledrun object."""
        if hasattr(state, 'sledrun'):
            sledrun = state.sledrun
        else:
            class Sledrun(object):
                pass
            sledrun = Sledrun()
        return _assign_properties(sledrun, value, _RODELBAHNBOX_FIELDS)

    def from_python(self, value, state=None):
        """Converts a sledrun class to a dict of Rodelbahnbox properties.
        value is a sledrun instance.

        :return: OrderedDict of Rodelbahnbox properties."""
        return _collect_properties(value, _RODELBAHNBOX_FIELDS)


class WinterrodelnTemplateDict(formencode.Validator):
    """Private helper class for RodelbahnboxValidator or GasthausboxValidator"""
    def __init__(self, template_title):
        self.template_title = template_title

    def to_python(self, value, state=None):
        """value is a (title, anonym_params, named_params) tuple.
        Raises formencode.Invalid if the title is not the expected template title
        or if there are anonymous parameters.

        :return: named_params"""
        title, anonym_params, named_params = value
        if title != self.template_title:
            raise formencode.Invalid('Template title has to be "{}".'.format(self.template_title), value, state)
        if len(anonym_params) > 0:
            raise formencode.Invalid('No anonymous parameters are allowed in "{}".'.format(self.template_title), value, state)
        return named_params

    def from_python(self, value, state=None):
        """value are the named parameters.

        :return: (template_title, [], value) tuple."""
        return self.template_title, [], value


class RodelbahnboxValidator(wrpylib.wrvalidators.RodelbahnboxDictValidator):
    """Validator for the Rodelbahnbox that uses the TemplateValidator and
    WinterrodelnTemplateDict as pre-validators and the
    RodelbahnboxDictConverter as chained validator."""
    def __init__(self):
        wrpylib.wrvalidators.RodelbahnboxDictValidator.__init__(self)
        self.pre_validators = [wrpylib.mwmarkup.TemplateValidator(as_table=True, as_table_keylen=20), WinterrodelnTemplateDict('Rodelbahnbox')]
        self.chained_validators = [RodelbahnboxDictConverter()]


def rodelbahnbox_to_sledrun(wikitext, sledrun=None):
    """Converts the {{Rodelbahnbox}} found in wikitext to a sledrun.
    sledrun may be an instance of WrSledrunCache or an "empty" class (object()) (default).
    Raises a formencode.Invalid exception if the format is not OK or the Rodelbahnbox is not found.

    :return: (start, end, sledrun) tuple of the Rodelbahnbox."""
    # find Rodelbahnbox
    start, end = wrpylib.mwmarkup.find_template(wikitext, 'Rodelbahnbox')
    if start is None:
        raise formencode.Invalid("Rodelbahnbox nicht gefunden", wikitext, None)

    # convert to sledrun
    state = _state_with('sledrun', sledrun)
    return start, end, RodelbahnboxValidator().to_python(wikitext[start:end], state)


def sledrun_to_rodelbahnbox(sledrun, version=None):
    """Converts a sledrun class to the {{Rodelbahnbox}} representation.
    The sledrun class has to have properties like position_latitude, ...
    See the table sledruncache for field (column) values.

    :param sledrun: an arbitrary class that contains the right properties
    :param version: a string specifying the version of the rodelbahnbox to produce.
        Version '1.4' is supported."""
    assert version in [None, '1.4']
    return RodelbahnboxValidator().from_python(sledrun)


class GasthausboxDictConverter(formencode.Validator):
    """Converts a dict with Gasthausbox properties to a Inn class. Does no validation."""

    def to_python(self, value, state=None):
        """value is a dict of properties. If state is an object with the attribute inn,
        this inn class will be populated or updated. Otherwise a new, empty
        object is created and populated. Unknown properties are ignored.

        :return: the populated inn object."""
        if hasattr(state, 'inn'):
            inn = state.inn
        else:
            class Inn(object):
                pass
            inn = Inn()
        return _assign_properties(inn, value, _GASTHAUSBOX_FIELDS)

    def from_python(self, value, state=None):
        """Converts an inn class to a dict of Gasthausbox properties.
        value is an Inn instance.

        :return: OrderedDict of Gasthausbox properties."""
        return _collect_properties(value, _GASTHAUSBOX_FIELDS)


class GasthausboxValidator(wrpylib.wrvalidators.GasthausboxDictValidator):
    """Validator for the Gasthausbox that uses the TemplateValidator and
    WinterrodelnTemplateDict as pre-validators and the
    GasthausboxDictConverter as chained validator."""
    def __init__(self):
        wrpylib.wrvalidators.GasthausboxDictValidator.__init__(self)
        self.pre_validators = [wrpylib.mwmarkup.TemplateValidator(as_table=True, as_table_keylen=17), WinterrodelnTemplateDict('Gasthausbox')]
        self.chained_validators = [GasthausboxDictConverter()]


def gasthausbox_to_inn(wikitext, inn=None):
    """Converts a inn wiki page containing a {{Gasthausbox}} to an inn.
    inn may be an instance of WrInnCache or an "empty" class (default).
    raises a formencode.Invalid exception if the format is not OK or the Gasthausbox is not found.

    :return: (start, end, inn) tuple."""
    # find Gasthausbox
    start, end = wrpylib.mwmarkup.find_template(wikitext, 'Gasthausbox')
    if start is None:
        raise formencode.Invalid("No 'Gasthausbox' found", wikitext, None)

    # convert to inn
    state = _state_with('inn', inn)
    return start, end, GasthausboxValidator().to_python(wikitext[start:end], state)


def inn_to_gasthausbox(inn):
    """Converts the inn class to the {{Gasthausbox}} representation."""
    return GasthausboxValidator().from_python(inn)


def find_template_latlon_ele(wikitext, template_title):
    """Finds the first occurance of the '{{template_title|47.076207 N 11.453553 E|1890}}' template
    and returns the tuple (start, end, lat, lon, ele) or (None, None, None, None, None) if the
    template was not found. If the template has no valid format, an exception is thrown."""
    start, end = wrpylib.mwmarkup.find_template(wikitext, template_title)
    if start is None:
        return (None,) * 5
    title, params = wrpylib.mwmarkup.split_template(wikitext[start:end])
    lat, lon = wrpylib.wrvalidators.GeoNone().to_python(params['1'].strip())
    ele = wrpylib.wrvalidators.UnsignedNone().to_python(params['2'].strip())
    return start, end, lat, lon, ele


def create_template_latlon_ele(template_title, lat, lon, ele):
    """Creates the '{{template_title|47.076207 N 11.453553 E|1890}}' template.
    A parameter whose text representation is empty is written as a single space."""
    geo = wrpylib.wrvalidators.GeoNone().from_python((lat, lon))
    if not geo:
        geo = ' '
    ele = wrpylib.wrvalidators.UnsignedNone().from_python(ele)
    if not ele:
        ele = ' '
    return wrpylib.mwmarkup.create_template(template_title, [geo, ele])


def find_template_PositionOben(wikitext):
    """Same as find_template_latlon_ele with template '{{Position oben|47.076207 N 11.453553 E|1890}}'"""
    return find_template_latlon_ele(wikitext, 'Position oben')


def create_template_PositionOben(lat, lon, ele):
    """Same as create_template_latlon_ele with template '{{Position oben|47.076207 N 11.453553 E|1890}}'"""
    # The title has to be the one find_template_PositionOben searches for (no comma).
    return create_template_latlon_ele('Position oben', lat, lon, ele)


def find_template_PositionUnten(wikitext):
    """Same as find_template_latlon_ele with template '{{Position unten|47.076207 N 11.453553 E|1890}}'"""
    return find_template_latlon_ele(wikitext, 'Position unten')


def find_template_unsigned(wikitext, template_title):
    """Finds the first occurance of the '{{template_title|1890}}' template
    and returns the tuple (start, end, unsigned_value) or (None, None, None) if the
    template was not found. If the template has no valid format, an exception is thrown."""
    start, end = wrpylib.mwmarkup.find_template(wikitext, template_title)
    if start is None:
        return (None,) * 3
    title, params = wrpylib.mwmarkup.split_template(wikitext[start:end])
    unsigned_value = wrpylib.wrvalidators.UnsignedNone().to_python(params['1'].strip())
    return start, end, unsigned_value


def create_template_unsigned(template_title, unsigned):
    """Creates the '{{template_title|1890}}' template.
    A parameter whose text representation is empty is written as a single space."""
    unsigned = wrpylib.wrvalidators.UnsignedNone().from_python(unsigned)
    if not unsigned:
        unsigned = ' '
    return wrpylib.mwmarkup.create_template(template_title, [unsigned])


def find_template_Hoehenunterschied(wikitext):
    """Same as find_template_unsigned with template '{{Höhenunterschied|350}}'"""
    return find_template_unsigned(wikitext, 'Höhenunterschied')


def create_template_Hoehenunterschied(ele_diff):
    """Same as create_template_unsigned with template '{{Höhenunterschied|350}}'"""
    return create_template_unsigned('Höhenunterschied', ele_diff)


def find_template_Bahnlaenge(wikitext):
    """Same as find_template_unsigned with template '{{Bahnlänge|4500}}'"""
    return find_template_unsigned(wikitext, 'Bahnlänge')


def create_template_Bahnlaenge(length):
    """Same as create_template_unsigned with template '{{Bahnlänge|4500}}'"""
    return create_template_unsigned('Bahnlänge', length)


def find_template_Gehzeit(wikitext):
    """Same as find_template_unsigned with template '{{Gehzeit|60}}'"""
    return find_template_unsigned(wikitext, 'Gehzeit')


def create_template_Gehzeit(walkup_time):
    """Same as create_template_unsigned with template '{{Gehzeit|60}}'"""
    return create_template_unsigned('Gehzeit', walkup_time)


def find_template_Forumlink(wikitext):
    """Like find_template_unsigned with template '{{Forumlink|26}}' but an empty
    first parameter gives the value None without consulting the validator."""
    start, end = wrpylib.mwmarkup.find_template(wikitext, 'Forumlink')
    if start is None:
        return (None,) * 3
    title, params = wrpylib.mwmarkup.split_template(wikitext[start:end])
    forumid = params['1'].strip()
    if forumid == '':
        unsigned_value = None
    else:
        unsigned_value = wrpylib.wrvalidators.UnsignedNone().to_python(forumid)
    return start, end, unsigned_value


def find_template_Parkplatz(wikitext):
    """Same as find_template_latlon_ele with template '{{Parkplatz|47.076207 N 11.453553 E|1890}}'"""
    return find_template_latlon_ele(wikitext, 'Parkplatz')


def find_template_Haltestelle(wikitext):
    """Finds the first occurance of the '{{Haltestelle|Ortsname|Haltestellenname|47.076207 N 11.453553 E|1890}}' template
    and returns the tuple (start, end, city, stop, lat, lon, ele) or (None, None, None, None, None, None, None) if the
    template was not found. If the template has no valid format, an exception is thrown."""
    start, end = wrpylib.mwmarkup.find_template(wikitext, 'Haltestelle')
    if start is None:
        return (None,) * 7
    title, params = wrpylib.mwmarkup.split_template(wikitext[start:end])
    city = wrpylib.wrvalidators.UnicodeNone().to_python(params['1'].strip())
    stop = wrpylib.wrvalidators.UnicodeNone().to_python(params['2'].strip())
    lat, lon = wrpylib.wrvalidators.GeoNone().to_python(params['3'].strip())
    ele = wrpylib.wrvalidators.UnsignedNone().to_python(params['4'].strip())
    return start, end, city, stop, lat, lon, ele


def find_all_templates(wikitext, find_func):
    """Returns a list of return values of find_func that searches for a template.
    The start and end positions of each entry refer to the whole wikitext.
    Example:
    >>> find_all_templates(wikitext, find_template_Haltestelle)
    Returns an empty list if the template was not found at all.
    """
    results = []
    offset = 0  # position in wikitext where the next search starts
    while True:
        result = find_func(wikitext[offset:])
        if result[0] is None:
            return results
        # find_func reports positions relative to the slice it got
        start = result[0] + offset
        end = result[1] + offset
        results.append((start, end) + tuple(result[2:]))
        offset = end


def googlemap_to_wrmap(attributes, coords, paths):
    """Converts the output of parse_googlemap to the GeoJSON format wrmap uses.

    :param attributes: dict that is used as properties of the feature collection
    :param coords: list of (lon, lat, symbol, title) tuples
    :param paths: list of (style, entries) tuples, where style is a string like
        '6#ff014e9a' and entries is a list of (lon, lat, symbol, title) tuples
    :returns: (GeoJSON as nested Python datatypes)
    """
    json_features = []

    # point
    for lon, lat, symbol, title in coords:
        properties = {'type': 'punkt' if symbol is None else symbol.lower()}
        if title is not None:
            properties['name'] = title
        json_features.append({
            'type': 'Feature',
            'geometry': {'type': 'Point', 'coordinates': [lon, lat]},
            'properties': properties})

    # path
    for style, entries in paths:
        style = style.lower()
        if style in _GOOGLEMAP_PATH_TYPES:
            properties = {'type': _GOOGLEMAP_PATH_TYPES[style]}
        else:
            # 'linie' is the generic entry of WRMAP_LINE_TYPES; width and color
            # are kept so that the line can be drawn the same way.
            properties = {'type': 'linie'}
            properties['dicke'] = style[0]
            # skip the alpha part; parse_wrmap expects a format like "#a0bb43"
            properties['farbe'] = '#' + style[4:]
        json_features.append({
            'type': 'Feature',
            'geometry': {
                'type': 'LineString',
                'coordinates': [[lon, lat] for lon, lat, symbol, title in entries]},
            'properties': properties})

    geojson = {
        'type': 'FeatureCollection',
        'features': json_features,
        'properties': attributes}
    return geojson


def parse_wrmap_coordinates(coords):
    """gets a string coordinates and returns an array of lon/lat coordinate pairs, e.g.
    47.12 N 11.87 E
    47.13 N 11.70 E
    ->
    [[11.87, 47.12], [11.70, 47.13]]

    Raises a ParseError (which is a RuntimeError) if coords contains anything
    else than coordinate pairs and whitespace."""
    result = []
    pos = 0
    for match in _WRMAP_COORDINATE_RE.finditer(coords):
        if match.start() != pos:
            break  # there is text between two pairs that is no coordinate
        lat, lon = match.groups()
        result.append([float(lon), float(lat)])
        pos = match.end()
    if pos != len(coords):
        raise ParseError('Wrong coordinate format: {}'.format(coords))
    return result


def parse_wrmap(wikitext):
    """Parses the (unicode) u'<wrmap ...>content</wrmap>' of the Winterrodeln wrmap extension.
    If wikitext does not contain the <wrmap> tag or if the <wrmap> tag contains
    invalid formatted lines, a ParseError is raised.
    Use wrpylib.mwmarkup.find_tag(wikitext, 'wrmap') to find the wrmap tag within an arbitrary
    wikitext before using this function.

    :param wikitext: wikitext containing only the template. Example:

    wikitext = u'''
    <wrmap lat="47.24" lon="11.21" zoom="14" width="700" height="400">
    <gasthaus name="Example inn" wiki="Example inn">47.240689 11.190454</gasthaus>
    <parkplatz>47.245789 11.238971</parkplatz>
    <haltestelle name="Example stop">47.245711 11.238283</haltestelle>
    <rodelbahn>
        47.238587 11.203360
        47.244951 11.230868
        47.245470 11.237853
    </rodelbahn>
    </wrmap>
    '''
    :returns: GeoJSON as nested Python datatype
    """
    # parse XML
    try:
        wrmap_xml = xml.etree.ElementTree.fromstring(wikitext.encode('utf-8'))
    except xml.etree.ElementTree.ParseError as e:
        row, column = e.position
        raise ParseError("XML parse error on row {}, column {}: {}".format(row, column, e))
    if wrmap_xml.tag not in ['wrmap', 'wrgmap']:
        raise ParseError('No valid tag name')

    # convert XML to geojson (http://www.geojson.org/geojson-spec.html)
    json_features = []
    for feature in wrmap_xml:
        # determine feature type
        is_point = feature.tag in WRMAP_POINT_TYPES
        is_line = feature.tag in WRMAP_LINE_TYPES
        if not is_point and not is_line:
            raise ParseError('Unknown element <{}>.'.format(feature.tag))

        # an element without content (e.g. <gasthaus/>) has text None
        feature_text = feature.text or ''

        # point
        if is_point:
            properties = {'type': feature.tag}
            allowed_properties = {'name', 'wiki'}
            wrong_properties = set(feature.attrib.keys()) - allowed_properties
            if len(wrong_properties) > 0:
                raise ParseError("The attribute '{}' is not allowed at <{}>.".format(list(wrong_properties)[0], feature.tag))
            properties.update(feature.attrib)
            coordinates = parse_wrmap_coordinates(feature_text)
            if len(coordinates) != 1:
                raise ParseError('The element <{}> has to have exactly one coordinate pair.'.format(feature.tag))
            json_features.append({
                'type': 'Feature',
                'geometry': {'type': 'Point', 'coordinates': coordinates[0]},
                'properties': properties})

        # line
        if is_line:
            properties = {'type': feature.tag}
            allowed_properties = {'farbe', 'dicke'}
            wrong_properties = set(feature.attrib.keys()) - allowed_properties
            if len(wrong_properties) > 0:
                raise ParseError("The attribute '{}' is not allowed at <{}>.".format(list(wrong_properties)[0], feature.tag))
            if 'farbe' in feature.attrib:
                if not re.match('#[0-9a-fA-F]{6}$', feature.attrib['farbe']):
                    raise ParseError('The attribute "farbe" has to have a format like "#a0bb43".')
                properties['strokeColor'] = feature.attrib['farbe']  # e.g. #a200b7
            if 'dicke' in feature.attrib:
                try:
                    properties['strokeWidth'] = int(feature.attrib['dicke'])  # e.g. 6
                except ValueError:
                    raise ParseError('The attribute "dicke" has to be an integer.')
            json_features.append({
                'type': 'Feature',
                'geometry': {'type': 'LineString', 'coordinates': parse_wrmap_coordinates(feature_text)},
                'properties': properties})

    # attributes
    properties = {}
    for k, v in wrmap_xml.attrib.items():
        if k in ['lat', 'lon']:
            try:
                properties[k] = float(v)
            except ValueError:
                raise ParseError('Attribute "{}" has to be a float value.'.format(k))
        elif k in ['zoom', 'width', 'height']:
            try:
                properties[k] = int(v)
            except ValueError:
                raise ParseError('Attribute "{}" has to be an integer value.'.format(k))
        else:
            raise ParseError('Unknown attribute "{}".'.format(k))

    geojson = {
        'type': 'FeatureCollection',
        'features': json_features,
        'properties': properties}

    return geojson


def create_wrmap_coordinates(coords):
    """Creates the text representation of a list of [lon, lat] pairs:
    one '47.120000 N 11.870000 E' line per pair."""
    return '\n'.join('{:.6f} N {:.6f} E'.format(coord[1], coord[0]) for coord in coords)


def create_wrmap(geojson):
    """Creates a <wrmap> wikitext from geojson (as python types).
    geojson is not modified. The properties strokeColor and strokeWidth (as
    created by parse_wrmap) are written as the attributes farbe and dicke."""
    wrmap_xml = xml.etree.ElementTree.Element('wrmap')
    wrmap_xml.text = '\n\n'
    for k, v in geojson['properties'].items():
        if k in ['lon', 'lat']:
            wrmap_xml.attrib[k] = '{:.6f}'.format(v)
        else:
            wrmap_xml.attrib[k] = str(v)

    assert geojson['type'] == 'FeatureCollection'
    json_features = geojson['features']
    last_json_feature = None
    for json_feature in json_features:
        json_properties = json_feature['properties']
        feature_xml = xml.etree.ElementTree.SubElement(wrmap_xml, json_properties['type'])
        geo = json_feature['geometry']
        if geo['type'] == 'Point':
            feature_xml.text = create_wrmap_coordinates([geo['coordinates']])
            if last_json_feature is not None:
                last_json_feature.tail = '\n'
        else:
            # lines are separated from the previous element by an empty line
            if last_json_feature is not None:
                last_json_feature.tail = '\n\n'
            feature_xml.text = '\n' + create_wrmap_coordinates(geo['coordinates']) + '\n'
        last_json_feature = feature_xml
        # Build the attributes in the element's own dict so that the caller's
        # properties stay untouched; XML attribute values have to be strings.
        for k, v in json_properties.items():
            if k == 'type':
                continue
            feature_xml.attrib[_WRMAP_LINE_ATTRIBUTES.get(k, k)] = str(v)
    if last_json_feature is not None:
        last_json_feature.tail = '\n\n'
    return xml.etree.ElementTree.tostring(wrmap_xml, encoding='utf-8').decode('utf-8')