-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathsource_indexer.py
33 lines (22 loc) · 923 Bytes
/
source_indexer.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
from collections import defaultdict
import zipfile
import re
import glob
def all_VNIR_SWIR():
    """Return the paths of every ``AST_07XT_*.zip`` archive below ``./data``.

    The search is recursive and relative to the current working directory.
    Paths come back as a list in whatever order ``glob`` yields them.
    """
    pattern = "./data/**/AST_07XT_*.zip"
    return list(glob.iglob(pattern, recursive=True))
def all_TIR():
    """Return the paths of every ``AST_05_*.zip`` archive below ``./data``.

    The search is recursive and relative to the current working directory.
    Paths come back as a list in whatever order ``glob`` yields them.
    """
    pattern = "./data/**/AST_05_*.zip"
    return list(glob.iglob(pattern, recursive=True))
def band_sources_in_groups(archives=None):
    """Index the band ``.tif`` members of zip archives by group and band number.

    Args:
        archives: Optional iterable of zip archive paths to scan. When omitted
            (or ``None``) the archives returned by ``all_VNIR_SWIR()`` followed
            by those returned by ``all_TIR()`` are scanned.

    Returns:
        A ``defaultdict(dict)`` mapping group id (the digit run captured from
        the member name, kept as a string) to a dict that maps band number
        (``int``) to a ``"zip:<archive>!<member>"`` locator string.

    Raises:
        zipfile.BadZipFile / OSError: if an archive cannot be opened.

    Members are visited in sorted name order, archive by archive, so when two
    members resolve to the same group and band the one visited last wins.
    """
    # Raw strings: "\d" in a plain literal is an invalid escape sequence.
    group_name_grep = re.compile(r"AST_[^_]+_(\d+)_.+")
    # Accepts "Band<digits>.tif" and "Band<digits>N.tif" at the end of the name.
    band_number_grep = re.compile(r".*Band(\d+)(N|)\.tif$")

    if archives is None:
        archives = all_VNIR_SWIR() + all_TIR()

    groups = defaultdict(dict)
    for z in archives:
        with zipfile.ZipFile(z, "r") as zip_ref:
            member_names = sorted(zip_ref.namelist())
        for member in member_names:
            band_match = band_number_grep.search(member)
            if band_match is None:
                continue
            group_match = group_name_grep.search(member)
            if group_match is None:
                # A band-like file whose name carries no group id cannot be
                # indexed; skip it instead of failing on ``None.group``.
                continue
            band = int(band_match.group(1))
            groups[group_match.group(1)][band] = f"zip:{z}!{member}"
    return groups