Commit e4ebb943 authored by PkSM3

Merge branch 'master' of ssh://delanoe.org:1979/gargantext into samuel

parents ea2c34dd 80dd36a9
...@@ -243,9 +243,9 @@ def get_cooc(request=None, corpus_id=None, cooc_id=None, type='node_link', n=150 ...@@ -243,9 +243,9 @@ def get_cooc(request=None, corpus_id=None, cooc_id=None, type='node_link', n=150
def tfidf(corpus, document, ngram): def tfidf(corpus, document, ngram):
try: try:
x = Node_Ngram.objects.get(node=document, ngram=ngram).weight occurences_of_ngram = Node_Ngram.objects.get(node=document, ngram=ngram).weight
y = Node_Ngram.objects.filter(node=document).count() ngrams_by_document = sum([ x.weight for x in Node_Ngram.objects.filter(node=document)])
tf = x/y term_frequency = occurences_of_ngram / ngrams_by_document
xx = Node.objects.filter(parent=corpus, type=NodeType.objects.get(name="Document")).count() xx = Node.objects.filter(parent=corpus, type=NodeType.objects.get(name="Document")).count()
yy = Node_Ngram.objects.filter(ngram=ngram).count() yy = Node_Ngram.objects.filter(ngram=ngram).count()
......
...@@ -138,9 +138,9 @@ class EuropressFileParser(FileParser): ...@@ -138,9 +138,9 @@ class EuropressFileParser(FileParser):
# metadata['language_iso2'] = 'en' # metadata['language_iso2'] = 'en'
# metadata['publication_year'] = metadata['date'].strftime('%Y') metadata['publication_year'] = metadata['publication_date'].strftime('%Y')
# metadata['publication_month'] = metadata['date'].strftime('%m') metadata['publication_month'] = metadata['publication_date'].strftime('%m')
# metadata['publication_day'] = metadata['date'].strftime('%d') metadata['publication_day'] = metadata['publication_date'].strftime('%d')
metadata['publication_date'] = "" metadata['publication_date'] = ""
metadata['object_id'] = str(metadata['text'][-9]) metadata['object_id'] = str(metadata['text'][-9])
......
Markdown is supported
0% Try again or attach a new file
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment