Commit e20658cb authored by c24b

[DEBUG] adding docs_count into parsing

parent cd9b6308
...@@ -36,8 +36,8 @@ def parse_extract(corpus): ...@@ -36,8 +36,8 @@ def parse_extract(corpus):
if corpus.status()['error']: if corpus.status()['error']:
print("ERROR: aborting parse_extract for corpus #%i" % corpus_id) print("ERROR: aborting parse_extract for corpus #%i" % corpus_id)
return None return None
docs_count = corpus.children("DOCUMENT").count()
print('CORPUS #%d: parsed' % (corpus.id)) print('CORPUS #%d: parsed %d documents' % (corpus.id, docs_count))
extract_ngrams(corpus) extract_ngrams(corpus)
print('CORPUS #%d: extracted ngrams' % (corpus.id)) print('CORPUS #%d: extracted ngrams' % (corpus.id))
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment