forked from ronilp/Finding-Influencers-in-Social-Networks
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathgetPartialInfluenceScore.py
55 lines (47 loc) · 1.62 KB
/
getPartialInfluenceScore.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
from database import getPagesClusterInfoCollection, getFriendsCollection, getClusterInfluencerScoreCollection
import datetime
import bisect
def getPartialInfluenceScore():
clusterInfoCollection = getPagesClusterInfoCollection()
clusterInfluencerCollection = getClusterInfluencerScoreCollection()
friendsCollection = getFriendsCollection()
clusterInfluencerCollection.drop()
clusterNumber = len(clusterInfoCollection.distinct('cluster'))
for friend in friendsCollection.find():
_id = friend['id']
document = {}
document['_id'] = _id
document['cluster'] = {}
for i in range(clusterNumber):
document['cluster'][str(i)] = []
clusterInfluencerCollection.insert(document)
pagesCursor = clusterInfoCollection.find({"count" : {"$gt" :3}})
epoch = datetime.datetime.utcfromtimestamp(0)
dt = 7*24*60*60
scores = []
done = 0
for page in pagesCursor:
users = page['people']
try:
users.sort(key = lambda x : x['created_time'])
cluster = page['cluster']
liketime = []
for user in users:
liketime.append((user['created_time'] - epoch).total_seconds())
back = 0
done += 1
print done
for user in users:
userId = user['id']
timeahead = (user['created_time'] - epoch).total_seconds() + dt
timeback = (user['created_time'] - epoch).total_seconds() - dt
ahead = bisect.bisect_right(liketime, timeahead)
score = ahead - back
back += 1
#print userId, cluster, score
clusterInfluencerCollection.update({ '_id' : userId}, { '$push' : {'cluster.' +str(cluster) : score} }, upsert = False)
except:
print "hmmm"
if __name__ == '__main__':
getPartialInfluenceScore()
print 'done'