Commit 842efbe4 authored by delanoe's avatar delanoe

[FEAT] EUROPRESSE PARSER FOR HTML5. Still buggy with zip files.

parent ecd6640d
...@@ -238,7 +238,7 @@ def compute_tfidf_global(corpus): ...@@ -238,7 +238,7 @@ def compute_tfidf_global(corpus):
lnD = log(D) lnD = log(D)
cursor.execute('UPDATE tmp__idf SET idf = idf + %f' % (lnD, )) cursor.execute('UPDATE tmp__idf SET idf = idf + %f' % (lnD, ))
# show off # show off
dbg.show('insert tfidf for %d documents' % (D, )) dbg.show('insert tfidf')
cursor.execute(''' cursor.execute('''
INSERT INTO INSERT INTO
%s (nodex_id, nodey_id, ngram_id, score) %s (nodex_id, nodey_id, ngram_id, score)
......
This diff is collapsed.
This diff is collapsed.
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment