"""Load the static HTML cave-description pages into ``CaveDescription`` rows.

Two entry points are provided:

* ``getDescriptions()`` reads every page listed in ``pages`` from beneath
  ``settings.EXPOWEB`` and stores one ``CaveDescription`` per page.
* ``parseDescriptions()`` rewrites the stored ``description`` of every
  ``CaveDescription`` by passing it through ``html_to_wiki``.
"""
# Provenance: introduced as parsers/descriptions.py by commit
# aa26690e33c793520be2d6d84c445ced8aba2a45 (martin speleo,
# Sat, 4 Jul 2009 17:19:30 +0100), an svn-imported change adding the parser
# for cave descriptions.

from django.conf import settings
import core.models as models
import os
from utils import html_to_wiki, get_html_body, get_html_title

# Directory (relative to settings.EXPOWEB) that holds every page listed below.
_PAGE_DIR = ["smkridge", "204"]

# Short names of the description pages; each one lives in "<short name>.html".
_PAGE_NAMES = (
    "ariston-rigging",
    "ariston",
    "bivvy",
    "bridge",
    "entrance-rigging",
    "entrance",
    "midlevel",
    "millennium",
    "nopain",
    "razordance",
    "rhino",
    "sbview",
    "subway",
    "swings",
    "treeumphant",
    "uworld",
)

# List of (path components relative to settings.EXPOWEB, short name) pairs.
# A page whose file name does not follow the "<short name>.html" pattern can
# be appended to this list explicitly.
pages = [(_PAGE_DIR + [_name + ".html"], _name) for _name in _PAGE_NAMES]


def getDescriptions():
    """Create and save one ``CaveDescription`` for every entry in ``pages``.

    Each file is read from ``os.path.join(settings.EXPOWEB, *filelocation)``.
    The results of ``get_html_title`` and ``get_html_body`` are decoded as
    latin1 and stored as ``long_name`` and ``description``; the page's short
    name is stored as ``short_name``.

    Raises:
        IOError: if a listed page cannot be opened or read.
    """
    for filelocation, name in pages:
        path = os.path.join(settings.EXPOWEB, *filelocation)
        # Context manager so the handle is closed even if the read fails;
        # previously the file object was never closed.
        with open(path, "r") as f:
            html = f.read()

        # ``unicode`` is the Python 2 builtin: the helpers are handed the raw
        # file contents and their results are decoded as latin1 here.
        # NOTE(review): a fresh row is created on every call, so running this
        # twice presumably duplicates descriptions -- confirm against the
        # CaveDescription model's constraints.
        cd = models.CaveDescription(
            short_name=name,
            long_name=unicode(get_html_title(html), "latin1"),
            description=unicode(get_html_body(html), "latin1"),
        )
        cd.save()


def parseDescriptions():
    """Replace each stored description with ``html_to_wiki(description)``.

    Iterates over every ``CaveDescription`` and saves it back after the
    conversion.
    """
    # NOTE(review): presumably meant to run once, after getDescriptions();
    # a second run would feed already-converted text to html_to_wiki again.
    for cd in models.CaveDescription.objects.all():
        cd.description = html_to_wiki(cd.description)
        cd.save()