Commit 311d73ec authored by Romain Loth

nodes api: merge 31de1848 (status) and bf3ce4bd (publications)

parent 389fb0c4
 from gargantext.models import Node, Ngram, NodeNgram, NodeNodeNgram, NodeNode
-from gargantext.constants import NODETYPES
+from gargantext.constants import NODETYPES, DEFAULT_N_DOCS_HAVING_NGRAM
 from gargantext.util.db import session, delete, func, bulk_insert
 from gargantext.util.db_cache import cache, or_
 from gargantext.util.validation import validate
@@ -192,6 +192,8 @@ class NodeListHaving(APIView):
     Simple implementation:
     Takes IDs of corpus and ngram and returns list of relevant documents in json format
     according to TFIDF score (order is decreasing).
+
+    2016-09: add total counts to output json
     '''
     def get(self, request, corpus_id):
         parameters = get_parameters(request)
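
Note: for reference, a minimal sketch of the JSON shape this endpoint returns after the change. The top-level 'count'/'records' keys come from the new return statement further down in this diff; the per-record fields shown here (id, title) are only illustrative, since the real keys depend on the document's hyperdata.

# illustrative only: real records carry whichever hyperdata keys the view copies
example_response = {
    'count': 42,      # total matching documents, counted before the limit
    'records': [      # at most DEFAULT_N_DOCS_HAVING_NGRAM documents, best TFIDF first
        {'id': 1234, 'title': 'Some document title'},
    ]
}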
@@ -202,7 +204,7 @@
         except :
             raise ValidationException('"ngram_ids" needs integers separated by comma.')
-        limit=5
+        limit = DEFAULT_N_DOCS_HAVING_NGRAM
         nodes_list = []
         corpus = session.query(Node).filter(Node.id==corpus_id).first()
@@ -225,26 +227,18 @@
             .filter(Node.typename == 'DOCUMENT', Node.parent_id== corpus.id)
             .filter(or_(*[NodeNodeNgram.ngram_id==ngram_id for ngram_id in ngram_ids]))
             .group_by(Node)
-            .order_by(func.sum(NodeNodeNgram.score).desc())
-            .limit(limit)
         )
-        # print("\n")
-        # print("in TFIDF:")
-        # print("\tcorpus_id:",corpus_id)
         # convert query result to a list of dicts
-        # if nodes_query is None:
-        # print("TFIDF error, juste take sums")
-        # nodes_query = (session
-        # .query(Node, func.sum(NodeNgram.weight))
-        # .join(NodeNgram, NodeNgram.node_id == Node.id)
-        # .filter(Node.parent_id == corpus_id)
-        # .filter(Node.typename == 'DOCUMENT')
-        # .filter(or_(*[NodeNgram.ngram_id==ngram_id for ngram_id in ngram_ids]))
-        # .group_by(Node)
-        # .order_by(func.sum(NodeNgram.weight).desc())
-        # .limit(limit)
-        # )
-        for node, score in nodes_query:
+
+        # get the total count before applying limit
+        nodes_count = nodes_query.count()
+
+        # now the query with the limit
+        nodes_results_query = (nodes_query
+            .order_by(func.sum(NodeNodeNgram.score).desc())
+            .limit(limit)
+        )
+        for node, score in nodes_results_query:
             print(node,score)
             print("\t corpus:",corpus_id,"\t",node.name)
             node_dict = {
@@ -256,7 +250,10 @@
                 node_dict[key] = node.hyperdata[key]
             nodes_list.append(node_dict)
-        return JsonHttpResponse(nodes_list)
+        return JsonHttpResponse({
+            'count': nodes_count,
+            'records': nodes_list
+        })
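
Note: the key pattern in this hunk is counting on the base query before any ordering or limit is applied. Below is a minimal, self-contained sketch of that pattern with SQLAlchemy; the Doc model, the in-memory SQLite engine and the scores are invented for illustration and are not part of the Gargantext code.

from sqlalchemy import Column, Integer, Float, create_engine
from sqlalchemy.ext.declarative import declarative_base
from sqlalchemy.orm import sessionmaker

Base = declarative_base()

class Doc(Base):
    # toy stand-in for the Node/score pairs handled in the view above
    __tablename__ = 'doc'
    id = Column(Integer, primary_key=True)
    score = Column(Float)

engine = create_engine('sqlite://')
Base.metadata.create_all(engine)
session = sessionmaker(bind=engine)()
session.add_all([Doc(score=s) for s in (0.1, 0.9, 0.5)])
session.commit()

# base query, no ordering and no limit yet
docs_query = session.query(Doc)

# total number of matching rows, taken before the limit is applied
docs_count = docs_query.count()

# the limited, ordered query whose rows are actually serialized
docs_results_query = docs_query.order_by(Doc.score.desc()).limit(2)

print({'count': docs_count,
       'records': [d.id for d in docs_results_query]})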
@@ -531,7 +528,8 @@ class CorpusFacet(APIView):
         # check that the hyperfield parameter makes sense
         _facet_available_subfields = [
             'journal', 'publication_year', 'rubrique',
-            'language_iso2', 'language_iso3', 'language_name'
+            'language_iso2', 'language_iso3', 'language_name',
+            'authors'
         ]
         parameters = get_parameters(request)
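
Note: the last hunk only widens the whitelist of facet subfields with 'authors'. As a rough sketch of how such a whitelist check typically works (this is not the project's actual validation code; the check_subfield helper and the plain ValueError are invented for illustration):

_facet_available_subfields = [
    'journal', 'publication_year', 'rubrique',
    'language_iso2', 'language_iso3', 'language_name',
    'authors',
]

def check_subfield(hyperfield):
    # reject any ?hyperfield=... value outside the whitelist
    if hyperfield not in _facet_available_subfields:
        raise ValueError("hyperfield must be one of: %s"
                         % ', '.join(_facet_available_subfields))
    return hyperfield

print(check_subfield('authors'))   # passes with the newly added facet
# check_subfield('abstract')       # would raise ValueError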