-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathextract_gf_metadata.py
80 lines (56 loc) · 1.82 KB
/
extract_gf_metadata.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
# -*- coding: utf-8 -*-
import os
import sys
import tarfile

# TODO: setup datapool
#
DEFAULT_DATAPOOL = u"D:/datapool"
# TODO: setup script dir
#
# Every backslash is escaped on purpose: written unescaped, "\01", "\04",
# "\3", "\201" and "\5" are octal escape sequences and silently become
# control characters, so the directory would never be found.
DEFAULT_SCRIPT_DIR = u"E:\\01.备份\\04.黄炎\\3技术培训\\2015影像培训班\\5_示例数据\\exercise 11:归档影像建库\\ArchivedRasterType_gf"


def _read_archive_name(input_file):
    """Return the archive path stored on the first line of *input_file*."""
    with open(input_file, 'r') as fp:
        # readline() keeps the line terminator; left in place it would be
        # passed to tarfile.open() as part of the file name.
        return fp.readline().strip()


def _pick_members(members):
    """Return ``(jpeg, meta)`` selected from the tar *members*.

    ``jpeg`` is the last member whose upper-cased name contains ".JPG" but
    not "_THUMB.JPG"; ``meta`` is the last member whose upper-cased name
    contains ".XML".  Either is ``None`` when nothing matches.
    """
    jpeg = None
    meta = None
    for member in members:
        upper_name = member.name.upper()
        if ".JPG" in upper_name and "_THUMB.JPG" not in upper_name:
            jpeg = member
        if ".XML" in upper_name:
            meta = member
    return jpeg, meta


def main(script_dir=DEFAULT_SCRIPT_DIR, datapool=DEFAULT_DATAPOOL):
    """Extract the metadata XML and browse JPEG from a tar archive.

    The archive path is read from the first line of
    ``<script_dir>/extract_gf_metadata.in``.  The selected XML and JPEG
    members are extracted into ``<datapool>/<ARCHIVE NAME>`` (the archive
    base name upper-cased, with ".TAR.GZ" removed), and the normalized path
    of the extracted XML is written to
    ``<script_dir>/extract_gf_metadata.out``.

    Args:
        script_dir: directory holding the ``.in`` and ``.out`` files.
        datapool: directory under which archives are unpacked; created if
            it is not already a directory.

    Returns:
        The path written to the output file, or ``None`` when opening,
        extracting or writing failed (the failure is reported on stderr).

    Raises:
        IOError/OSError: if the input file cannot be read or *datapool*
            cannot be created.  These are not caught here.
    """
    input_file = os.path.join(script_dir, "extract_gf_metadata.in")
    output_file = os.path.join(script_dir, "extract_gf_metadata.out")

    # read input file
    #
    tar_gz_name = _read_archive_name(input_file)

    # check datapool and make it available
    #
    if not os.path.isdir(datapool):
        os.makedirs(datapool)

    try:
        # open tar.gz
        #
        tar = tarfile.open(tar_gz_name)
        try:
            # get jpeg and meta member
            #
            jpeg, meta = _pick_members(tar.getmembers())
            if jpeg is None or meta is None:
                raise ValueError("archive contains no JPEG/XML member pair")

            fname = os.path.basename(tar_gz_name)
            fname = fname.upper().replace(".TAR.GZ", "")
            target_dir = os.path.join(datapool, fname)
            # NOTE(review): extractall() trusts the member names stored in
            # the archive; if archives can come from an untrusted source,
            # validate the names (or use an extraction filter) first.
            tar.extractall(target_dir, [meta, jpeg])
        finally:
            # Close the archive on every path, including failures.
            tar.close()

        xml_path = os.path.normpath(os.path.join(target_dir, meta.name))
        with open(output_file, 'w') as fp:
            fp.write(xml_path)
    except Exception as exc:
        # Stay best-effort (no crash, no output file written), but say why
        # instead of failing silently.
        sys.stderr.write(
            "extract_gf_metadata: processing %r failed: %r\n"
            % (tar_gz_name, exc)
        )
        return None
    return xml_path


if __name__ == "__main__":
    main()