aboutsummaryrefslogtreecommitdiff
path: root/mensa.py
diff options
context:
space:
mode:
Diffstat (limited to 'mensa.py')
-rw-r--r--mensa.py52
1 files changed, 52 insertions, 0 deletions
diff --git a/mensa.py b/mensa.py
new file mode 100644
index 0000000..1ecef11
--- /dev/null
+++ b/mensa.py
@@ -0,0 +1,52 @@
+# Copyright (C) 2017 Gabriel Perez-Cerezo <gabriel@gpcf.eu>
+
+import urllib2
+from lxml import etree
+from lxml.cssselect import CSSSelector
+import html5lib
+from common import Food
+
+def get_food_items(mensa="mensa-tu-hardenbergstra%C3%9Fe", ignore_nudelauswahl=False) :
+ user_agent = 'Mozilla/5.0 (Windows NT 6.1; Win64; x64)'
+ headers = {'User-Agent': user_agent}
+
+ req = urllib2.Request('https://www.stw.berlin/mensen/mensa-tu-hardenbergstra%C3%9Fe.html', headers=headers)
+ response = urllib2.urlopen(req)
+ the_page = response.read()
+ document = html5lib.parse(the_page, treebuilder="lxml")
+ groupsel = CSSSelector('.splGroupWrapper')
+ groups = [e for e in groupsel(document)]
+ fl = []
+ for i in groups :
+ name = CSSSelector('.splGroup')(i)[0].text
+ sel = CSSSelector('.splMeal')
+ meals = [e for e in sel(i)]
+ for m in meals :
+ namesel = CSSSelector('.bold')
+ nm = namesel(m)[0].text
+ if ignore_nudelauswahl and "Nudelauswahl" in nm:
+ continue
+ pricesel = CSSSelector('.col-md-3')
+ veg = 0
+ if len(pricesel(m)[0]) >= 2 :
+ if "15" in pricesel(m)[0][1].attrib["src"] :
+ veg = 2
+ elif "1.png" in pricesel(m)[0][1].attrib["src"] :
+ veg = 1
+ price = pricesel(m)[-1].text.strip()
+ fl.append(Food(nm, price, name, veg))
+ return fl
+
+
+
+# format:
+if __name__ == "__main__":
+ food = get_food_items("", ignore_nudelauswahl=True)
+ cat = []
+ vegkeys = [ "", "Vegetarian", "Vegan" ]
+ for i in food:
+ if not i.category in cat :
+ cat.append(i.category)
+ if not i.category == None :
+ print i.category
+ print "\t" + i.name.ljust(80) + "\t"+ i.price.ljust(20) + vegkeys[i.veggie]