This repository has been archived by the owner on Nov 11, 2022. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathconfigs.py
184 lines (113 loc) · 3.98 KB
/
configs.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
import os, pickle
from enum import Enum
# Installation root: the container path '/app/' when that directory exists,
# otherwise the directory that contains this file.
venue_address = '/app/' if os.path.isdir('/app/') else os.path.dirname(os.path.abspath(__file__))
# Data directory below the root. The root may already end in a slash
# ('/app/'), so trailing slashes are stripped before concatenating; plain
# concatenation would produce a doubled separator such as '/app//Data/'.
data_address = venue_address.rstrip('/') + '/Data/'
# Version string returned by get_version().
version = "0.2.0"
def get_version():
    """
    Returns the module-level ``version`` string.
    :return:str
    """
    current_version = version
    return current_version
def config_url_venu():
    """
    Returns the installation root path stored in ``venue_address``.
    :return:str
    """
    root_path = venue_address
    return root_path
def config_url_data():
    """
    Returns the data directory path stored in ``data_address``.
    :return:str
    """
    data_path = data_address
    return data_path
def config_url_log():
    """
    Returns the path of the file ``logfile.log`` inside the directory
    given by config_tmp_dir().
    :return:str
    """
    tmp_dir = config_tmp_dir()
    return os.path.join(tmp_dir, 'logfile.log')
def config_dirname_pdfs_no_ocr():
    """
    Returns the directory name ``0-pdfs_no_ocr/`` (with trailing slash).
    :return:str
    """
    dirname = '0-pdfs_no_ocr/'
    return dirname
def config_url_pdfs_no_ocr():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_pdfs_no_ocr().
    :return:str
    """
    dirname = config_dirname_pdfs_no_ocr()
    return os.path.join(data_address, dirname)
def config_dirname_pdfs():
    """
    Returns the directory name ``1-pdfs/`` (with trailing slash).
    :return:str
    """
    dirname = '1-pdfs/'
    return dirname
def config_url_pdfs():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_pdfs().
    :return:str
    """
    dirname = config_dirname_pdfs()
    return os.path.join(data_address, dirname)
def config_dirname_layouts():
    """
    Returns the directory name ``2-layouts/`` (with trailing slash).
    :return:str
    """
    dirname = '2-layouts/'
    return dirname
def config_url_layouts():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_layouts().
    :return:str
    """
    dirname = config_dirname_layouts()
    return os.path.join(data_address, dirname)
def config_dirname_refs():
    """
    Returns the directory name ``3-refs/`` (with trailing slash).
    :return:str
    """
    dirname = '3-refs/'
    return dirname
def config_url_refs():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_refs().
    :return:str
    """
    dirname = config_dirname_refs()
    return os.path.join(data_address, dirname)
def config_dirname_refs_seg():
    """
    Returns the directory name ``3-refs_seg/`` (with trailing slash).
    :return:str
    """
    dirname = '3-refs_seg/'
    return dirname
def config_url_refs_segment():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_refs_seg().
    :return:str
    """
    dirname = config_dirname_refs_seg()
    return os.path.join(data_address, dirname)
def config_dirname_bibtex():
    """
    Returns the directory name ``3-refs_bibtex/`` (with trailing slash).
    :return:str
    """
    dirname = '3-refs_bibtex/'
    return dirname
def config_url_refs_bibtex():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_bibtex().
    :return:str
    """
    dirname = config_dirname_bibtex()
    return os.path.join(data_address, dirname)
def config_dirname_seg_prob():
    """
    Returns the directory name ``3-refs_seg_prob/`` (with trailing slash).
    :return:str
    """
    dirname = '3-refs_seg_prob/'
    return dirname
def config_url_refs_segment_prob():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_seg_prob().
    :return:str
    """
    dirname = config_dirname_seg_prob()
    return os.path.join(data_address, dirname)
def config_dirname_seg_dict():
    """
    Returns the directory name ``3-refs_seg_dict/`` (with trailing slash).
    :return:str
    """
    dirname = '3-refs_seg_dict/'
    return dirname
def config_url_refs_segment_dict():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_seg_dict().
    :return:str
    """
    dirname = config_dirname_seg_dict()
    return os.path.join(data_address, dirname)
def config_dirname_crossref():
    """
    Returns the directory name ``4-refs_crossref/`` (with trailing slash).
    :return:str
    """
    dirname = '4-refs_crossref/'
    return dirname
def config_url_refs_crossref():
    """
    Returns the path obtained by joining the data directory with the
    name from config_dirname_crossref().
    :return:str
    """
    dirname = config_dirname_crossref()
    return os.path.join(data_address, dirname)
def email_address():
    """
    Returns the hard-coded e-mail address configured for this module.
    :return:str
    """
    address = 'boulanger@lhlt.mpg.de'
    return address
def config_data_dirnames():
    """
    Returns the names of all data sub-directories as a list, in a fixed
    order. Each entry is the return value of the matching
    ``config_dirname_*`` function.
    :return:list
    """
    # The order below is part of the result; keep it as is.
    dirname_getters = (
        config_dirname_pdfs_no_ocr,
        config_dirname_pdfs,
        config_dirname_layouts,
        config_dirname_refs,
        config_dirname_refs_seg,
        config_dirname_seg_prob,
        config_dirname_seg_dict,
        config_dirname_bibtex,
        config_dirname_crossref,
    )
    return [getter() for getter in dirname_getters]
def config_url_git_repo():
    """
    Returns the hard-coded URL of the project's git repository.
    :return:str
    """
    repo_url = "https://github.com/cboulanger/excite-docker"
    return repo_url
def config_exparser_dir(version=None):
    """
    Returns the path to the EXparser directory. Without a version (or with
    a falsy one), this is the "EXparser" directory below the installation
    root. With a version, it is a directory inside the temporary directory
    named "<basename of the git repo URL>-<version>".
    No check is done if the path exists.
    :param version:str
    :return:str
    """
    if not version:
        return os.path.join(venue_address, "EXparser")
    tmp_dir = config_tmp_dir()
    repo_name = os.path.basename(config_url_git_repo())
    versioned_name = repo_name + "-" + version
    return os.path.join(tmp_dir, versioned_name)
def config_exparser_version_file():
    """
    Returns the path of the file ``exparser-version.txt`` inside the
    directory given by config_tmp_dir().
    :return:str
    """
    tmp_dir = config_tmp_dir()
    return os.path.join(tmp_dir, "exparser-version.txt")
def config_dataset_dir(model_name=None):
    """
    Returns the path to the "Dataset" directory below the installation
    root. If a model name is passed, returns the sub-directory of that
    name inside it. No check is done if the path exists.
    :param model_name:str
    :return:str
    """
    dataset_root = os.path.join(venue_address, "Dataset")
    if not model_name:
        return dataset_root
    return os.path.join(dataset_root, model_name)
def config_model_dir(model_name=None, version=None):
    """
    Returns the path to the directory that holds trained model files.
    Without a model name, the result is the "Models" root directory below
    the installation root; a version passed alone is ignored. With a model
    name, the result is "<root>/<version>/<model_name>", where the version
    falls back to get_version() when none (or a falsy one) is passed.
    No check is done if the path exists.
    :param model_name:str
    :param version:str
    :return:str
    """
    models_root = os.path.join(venue_address, "Models")
    if not model_name:
        return models_root
    engine_version = version or get_version()
    return os.path.join(models_root, engine_version, model_name)
def config_lists_dir():
    """
    Returns the path of the "Lists" directory below the installation root.
    :return:str
    """
    lists_path = os.path.join(venue_address, "Lists")
    return lists_path
def config_tmp_dir():
    """
    Returns the path of the "tmp" directory below the installation root.
    :return:str
    """
    tmp_path = os.path.join(venue_address, "tmp")
    return tmp_path
class DatasetDirs(Enum):
    """
    Enumeration of directory names; each member's value is the name string.
    Presumably these are the sub-directories of a dataset directory --
    TODO confirm against callers.
    """

    FEATURES = "Features"
    LYT = "LYT"
    LRT = "LRT"
    REFLD = "RefLD"
    SEG = "SEG"

    # Members whose names and values carry the "TEST_" prefix
    TEST_LYT = "TEST_LYT"
    TEST_REFS = "TEST_REFS"
    TEST_SEG = "TEST_SEG"
# Model data in global vars
class ModelObjects:
    """
    Namespace of class-level attributes for model objects. Every attribute
    starts out as None; nothing in this class assigns the actual objects.
    """

    rf = None
    crf = None

    # kde_* attributes
    kde_ntag = None
    kde_atag = None
    kde_wtag = None

    # Further kde_* attributes that are currently disabled:
    # kde_ltag = None
    # kde_dtag = None
    # kde_gtag = None
    # kde_llen = None
    # kde_tlen = None