-
Notifications
You must be signed in to change notification settings - Fork 42
/
tfrecord2tif.py
141 lines (101 loc) · 4.06 KB
/
tfrecord2tif.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
from S2parser import S2parser
import tensorflow as tf
import numpy as np
import rasterio
import pandas as pd
import os
import datetime
import argparse
def main():
parser = argparse.ArgumentParser(description='convert tfrecord.gz file to folder of tif images.')
parser.add_argument('tfrecord', help='path to tfrecord.gz file (format path/0000.tfrecord.gz')
parser.add_argument('--outdir', default="tif", help='output directory')
parser.add_argument('--geotransforms', default=None, help='path to csv file for geotransforms.')
args = parser.parse_args()
tfrecordgzpath = "/data/data_IJGI18/datasets/full/480/data16/5886.tfrecord.gz"
outdir = "0"
#geotransforms = "/data/data_IJGI18/datasets/full/480/geotransforms.csv"
geotransforms = None
write_timeseries(args.tfrecord, args.outdir, args.geotransforms)
def tfrecord2npy(path):
parser = S2parser()
def mapping_function(serialized_feature):
# read data from .tfrecords
feature = parser.parse_example(serialized_example=serialized_feature)
return feature
dataset = tf.data.TFRecordDataset([path], compression_type="GZIP")
dataset = dataset.map(mapping_function, num_parallel_calls=1)
sess = tf.InteractiveSession()
sess.run([tf.global_variables_initializer(), tf.local_variables_initializer(), tf.tables_initializer()])
iterator = dataset.make_initializable_iterator()
sess.run([iterator.initializer])
x10,x20,x60,doy,year,labels = sess.run(iterator.get_next())
x10, x20, x60, doy, year, labels = [np.array(f) for f in [x10, x20, x60, doy, year, labels]]
x10, x20, x60, doy, year, labels = remove_padded_instances(x10, x20, x60, doy, year, labels)
return x10, x20, x60, doy, year, labels
def remove_padded_instances(x10,x20,x60,doy,year,labels):
# remove padded instances
mask = doy > 0
x10 = x10[mask]
x20 = x20[mask]
x60 = x60[mask]
doy = doy[mask]
year = year[mask]
labels = labels[mask]
return x10,x20,x60,doy,year,labels
def write_tif(arr, filename, geo=None):
path = os.path.dirname(filename)
if not os.path.exists(path):
os.makedirs(path)
print("writing "+filename)
# geo = gt.north, gt.west, pixelx, pixely, crs
if geo is not None:
north, west, pixelx, pixely, crs = geo
crs = crs
transform = rasterio.transform.from_origin(north, west, pixelx, pixely)
else:
transform = None
crs = None
H,W,D = arr.shape
new_dataset = rasterio.open(
filename,
'w',
driver='GTiff',
height=H,
width=W,
count=D,
dtype=rasterio.uint16,
crs=crs,
transform=transform,
)
for d in range(D):
new_dataset.write(arr[:,:,d].astype(np.uint16), d+1)
new_dataset.close()
def write_timeseries(tfrecordgzpath, outdir, geotransforms=None):
x10,x20,x60,doy,year,labels = tfrecord2npy(tfrecordgzpath)
id = int(os.path.basename(tfrecordgzpath).replace(".tfrecord.gz",""))
if geotransforms is not None:
print("reading geotranform file from "+geotransforms)
df = pd.read_csv(geotransforms, index_col=0, names=["north","pixelx","shearx","west","sheary","pixely","crs"])
g = df.loc[id]
north = g.north
west = g.west
crs = int(g.crs)
else:
north = 0
west = 0
crs = None
outpath = os.path.join(outdir,str(id))
if not os.path.exists(outpath):
os.makedirs(outpath)
for t in range(x10.shape[0]):
y = year[t]
d = doy[t]
dt = datetime.datetime.strptime(str(y) +' '+ str(d) , '%Y %j')
date = dt.strftime("%Y%m%d")
write_tif(x10[t],os.path.join(outpath,"10m",date+".tif"), geo=(north, west, 10, 10, crs))
write_tif(x20[t],os.path.join(outpath,"20m",date+".tif"), geo=(north, west, 20, 20, crs))
write_tif(x60[t],os.path.join(outpath,"60m",date+".tif"), geo=(north, west, 60, 60, crs))
write_tif(labels[0][:,:,None],os.path.join(outpath,"labels.tif"), geo=(north, west, 10, 10, crs))
if __name__ == "__main__":
main()