forked from kristjan/cjvt-valency
logging when indexing
This commit is contained in:
parent
c5fc78dca1
commit
14a6e2423b
|
@ -453,6 +453,9 @@ def prepare_app_index(appindex_json):
|
|||
for corpus in CORPORA:
|
||||
res_hws = {}
|
||||
res_fns = {}
|
||||
|
||||
nentries = valdb[corpus].count()
|
||||
idx = 0
|
||||
for e in valdb[corpus].find({}):
|
||||
if "headwords" not in e:
|
||||
continue
|
||||
|
@ -468,6 +471,10 @@ def prepare_app_index(appindex_json):
|
|||
res_fns[fn] += 1
|
||||
else:
|
||||
res_fns[fn] = 1
|
||||
idx += 1
|
||||
if idx % 10000 == 0:
|
||||
log.debug("indexing {}: {}/{}".format(
|
||||
corpus, idx, nentries))
|
||||
|
||||
alphabetical = {}
|
||||
for k, e in res_hws.items():
|
||||
|
|
Loading…
Reference in New Issue
Block a user