-
Notifications
You must be signed in to change notification settings - Fork 79
/
Copy pathquery_d.py
50 lines (44 loc) · 1.4 KB
/
query_d.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
import time
import os
import numpy as np
import cPickle
from collections import defaultdict
def timeid(input1):
t1=time.strptime(input1[0],"%Y-%m-%d %H:%M:%S")
mon=t1.tm_mon
day=t1.tm_mday
hour=t1.tm_hour
minute=t1.tm_min
time_id=60*(24*(30*(mon-4)+day-1)+hour)+minute
# if time_id >=87840:
# print"%d\t%d\t%d\t%d"(mon,day,hour,minute)
time_id_s=time_id+int(input1[1])+int(input1[11])
time_id_d=time_id_s+int(input1[10])
return time_id_d
t=17568
r=72
c=68
result = defaultdict()
path="../query_beijing_parsed_filtered"
files=os.listdir(path)
kk=0
for file in files:
f = open(path+"/"+file)
kk+=1
print(kk,'day is over')
for line in f.readlines():
line=line.split('\t')
time_id_d=timeid(line)
# row_id_s=int(line[7])
# col_id_s=int(line[6])
row_id_d=int(line[9])
col_id_d=int(line[8])
d_query=line[14]
if time_id_d<87840 and time_id_d>-1:
time_id_5min = int(time_id_d/5)
if (time_id_5min,row_id_d,col_id_d) not in result:
result[(time_id_5min, row_id_d, col_id_d)] = list()
result[(time_id_5min,row_id_d,col_id_d)].append(d_query)
print "dumping dict ..."
#cPickle.dump(s_grid,open("/home/binbingliao/gyf/s_grid.pkl",'wb'))
cPickle.dump(result, open("../pkl/query_d_grid_beijing.pkl", 'wb'))