forked from learnedsystems/SOSD
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdownsample_50.py
32 lines (27 loc) · 1002 Bytes
/
downsample_50.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
import numpy as np
import struct
import os
def downsample(fn):
if os.path.exists("data/" + fn + "_50M_uint64") and os.path.exists("data/" + fn + "_50M_uint32"):
return
print("Downsampling 50M", fn)
if os.path.exists("data/" + fn + "200M_uint64"):
d_64 = np.fromfile("data/" + fn + "_200M_uint64", dtype=np.uint64)[1:]
nd_64 = d_64[::4]
with open("data/" + fn + "_50M_uint64", "wb") as f:
f.write(struct.pack("Q", len(nd_64)))
nd_64.tofile(f)
if os.path.exists("data/" + fn + "200M_uint32"):
d_32 = np.fromfile("data/" + fn + "_200M_uint32", dtype=np.uint32)[1:]
nd_32 = d_32[::4]
with open("data/" + fn + "_50M_uint32", "wb") as f:
f.write(struct.pack("Q", len(nd_32)))
nd_32.tofile(f)
downsample("books")
downsample("fb")
downsample("osm_cellids")
downsample("wiki_ts")
downsample("lognormal")
downsample("normal")
downsample("uniform_dense")
downsample("uniform_sparse")