added more logging

bug_fix
voje 5 years ago
parent 2b7339ac5a
commit c17361fbda

@ -30,6 +30,10 @@ class Parser():
"missing_srl": []
}
# for logging output
self.n_kres_files = -1
self.nth_kres_file = -1
def parse_jos_links(self, sent_el):
if self.corpus == "kres":
return self.parse_jos_links_kres(sent_el)
@ -91,8 +95,16 @@ class Parser():
def sentence_generator(self):
    """Lazily yield whatever ``parse_xml_file`` produces for the corpus.

    A generator is used so that a whole corpus never has to be held in
    memory at once.

    For the "kres" corpus every entry of ``self.kres_folder`` is parsed in
    turn and one progress line ``"<file> (<k>/<total>)"`` is logged per
    file. For any other corpus value only ``self.ssj_file`` is parsed.

    Side effects (kres only): ``self.n_kres_files`` is set to the number of
    entries found in the folder and ``self.nth_kres_file`` to the 1-based
    position of the file currently being parsed. Both are recomputed on
    every call, so running the generator again reports correct progress.
    """
    if self.corpus != "kres":
        yield from self.parse_xml_file(self.ssj_file)
        return

    # List the folder once and use the same listing for both the total and
    # the iteration, so the logged "k/total" can never disagree with what is
    # actually parsed.
    xml_files = list(Path(self.kres_folder).iterdir())
    self.n_kres_files = len(xml_files)
    # Restart the counter on every run; otherwise a second pass would keep
    # counting past the total.
    self.nth_kres_file = 0
    for position, xml_file in enumerate(xml_files, start=1):
        self.nth_kres_file = position
        self.logger.info("{} ({}/{})".format(
            xml_file, self.nth_kres_file, self.n_kres_files))
        yield from self.parse_xml_file(xml_file)

Loading…
Cancel
Save