-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathloadData.py
126 lines (115 loc) · 3.86 KB
/
loadData.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
from datetime import datetime, date, time
import logging
import pprint
import hashlib
from google.appengine.ext import db
from google.appengine.api import memcache
import models
import menuparser
def load(offset=0):
# Fetch menu data
data = menuparser.getData(offset)
meals = []
entrees = []
# Loop through dining halls
for hall in data:
# Loop through menus
for menu in hall['menus']:
# Loop through meals
for meal in menu['meals']:
(m, e) = constructModels(hall, menu, meal)
# Get any meal with the same date, place, and type.
oldmeal = models.getMealByDateHallType(m.date, m.hall, m.type)
# Don't bother adding if no meals.
diff = False
# If the meal doesn't exist, or is different than the old, update.
if oldmeal is not None:
if m.entreeIDs == []:
continue
if len(oldmeal.entreeIDs) != len(m.entreeIDs):
diff = True
else:
for i in range(len(oldmeal.entreeIDs)):
if oldmeal.entreeIDs[i] != m.entreeIDs[i]:
diff = True
break
else:
diff = True
# Don't bother adding if the same as a meal already in the database
if diff:
handleMealAddAndDelete(m, oldmeal)
memcache.flush_all()
# Return debug info even if not unique?
meals.append(m)
entrees = entrees + e
return (meals, entrees)
@db.transactional(xg=True)
def handleMealAddAndDelete(newmeal, oldmeal):
print "Got unique meal"
if oldmeal is not None:
print "Deleting old meal."
oldmeal.delete()
if newmeal.entreeIDs != []:
newmeal.put()
def constructModels(hall, menu, meal):
# Get date
dt = datetime.now()
dateStr = menu['date'] + " %d" % dt.year
dt = datetime.strptime(dateStr, "%A, %B %d %Y")
d = dt.date()
# Get entree models
entrees = []
entreeIDs = []
hashes = []
hallID = models.halls[hall['name']]
for entree in meal['entrees']:
key = entree['name']
e = models.Entree()
e.date = d
e.name = entree['name']
e.protoname = entree['name'] + "|" + hallID
e.allergens = entree['allergens']
e.ingredients = entree['ingredients']
e.hall = hallID
e.type = meal['type']
h = hashlib.md5()
h.update(e.protoname)
h.update(str(e.date.month))
h.update(str(e.date.day))
h.update(e.type)
for s in e.ingredients:
h.update(s)
for s in e.allergens:
h.update(s)
e.hexhash = h.hexdigest()
hashes.append(e.hexhash)
entrees.append(e)
# fetch entrees by hashes
dbentrees = models.getEntreesByHashes(hashes)
eKeys = []
nentrees = []
# remove duplicates and add to eKeys
for entree in entrees:
found = False
for dbentree in dbentrees:
if entree.hexhash == dbentree.hexhash:
found = True
eKeys.append(dbentree.key())
break
if not found:
#print "Adding", entree.name
eKeys.append(db.put(entree))
# Speed up user clicking on an entree by asserting ratings exist.
models.Rating.get_or_insert(entree.protoname)
entrees = nentrees
# Add the entrees and get their IDs
#eKeys = eKeys + db.put(entrees)
for eKey in eKeys:
entreeIDs.append(eKey.id())
# Construct meals
m = models.Meal()
m.date = d
m.hall = hallID
m.type = meal['type']
m.entreeIDs = entreeIDs
return (m, entrees)