[UPDATE] good version :)

a4c676fe · PkSM3 · 31fd980b · a4c676fe · a4c676fe
Commit a4c676fe authored Mar 05, 2015 by PkSM3
Hide whitespace changes
Inline Side-by-side

Showing 2 changed files with 4 additions and 3 deletions

db.py gargantext_web/db.py +2 -2

corpustools.py parsing/corpustools.py +2 -1

No files found.
--- a/gargantext_web/db.py
+++ b/gargantext_web/db.py
@@ -134,8 +134,8 @@ class ModelCache(dict):
            for column in self._columns
            if key.__class__ == column.type.python_type
        ]
-        if len(conditions) == 0:
-            raise KeyError
+        # if len(conditions) == 0:
+        #     raise KeyError
        element = session.query(self._model).filter(or_(*conditions)).first()
        if element is None:
            raise KeyError

--- a/parsing/corpustools.py
+++ b/parsing/corpustools.py
@@ -195,6 +195,7 @@ class NgramsExtractors(defaultdict):
 ngramsextractors = NgramsExtractors()

 def extract_ngrams(corpus, keys):
+    print("yoloo")
    dbg = DebugTime('Corpus #%d - ngrams' % corpus.id)
    default_language_iso2 = None if corpus.language_id is None else cache.Language[corpus.language_id].iso2
    # query the metadata associated with the given keys
@@ -224,7 +225,7 @@ def extract_ngrams(corpus, keys):
        ngramsextractor = ngramsextractors[language_iso2]
        for text in nodeinfo[2:]:
            if text is not None and len(text):
-                ngrams = ngramsextractor.extract_ngrams(text)
+                ngrams = ngramsextractor.extract_ngrams(text.replace("[","").replace("]",""))
                for ngram in ngrams:
                    terms = ' '.join([token for token, tag in ngram]).lower()
                    n = len(ngram)