1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
# Without this, we couldn't use the Django environment
#from admin.env import *
#from ngram.stemLem import *
from admin.utils import PrintException,DebugTime
from gargantext_web.db import NodeNgram,NodeNodeNgram,NodeNgramNgram
from gargantext_web.db import get_or_create_node, session, bulk_insert
from sqlalchemy.sql import func
from sqlalchemy import desc, asc, or_, and_, Date, cast, select
from sqlalchemy import literal_column
from sqlalchemy.orm import aliased
def compute_miam(corpus,limit=500):
'''
According to Specificities and stoplist,
'''
dbg = DebugTime('Corpus #%d - computing Miam' % corpus.id)
node_group = get_or_create_node(nodetype='Group', corpus=corpus)
node_stop = get_or_create_node(nodetype='StopList', corpus=corpus)
node_spec = get_or_create_node(nodetype='Specificity', corpus=corpus)
Stop=aliased(NodeNgram)
Group=aliased(NodeNgramNgram)
Spec=aliased(NodeNodeNgram)
top_miam = (session.query(Spec.ngram_id, Spec.score)
.outerjoin(Group, Group.ngramy_id == Spec.ngram_id)
.outerjoin(Stop, Stop.ngram_id == Spec.ngram_id)
.filter(Group.node_id == node_group.id)
.filter(Stop.node_id == node_stop.id)
.order_by(desc(Spec.score))
.limit(limit)
)
print([t for t in top_miam])
node_miam = get_or_create_node(nodetype='MiamList', corpus=corpus)
session.query(NodeNgram).filter(NodeNgram.node_id==node_miam.id).delete()
session.commit()
data = zip(
[node_miam.id for i in range(1,limit)]
, [n[0] for n in top_miam]
, [1 for i in range(1,limit)]
)
print([d for d in data])
bulk_insert(NodeNgram, ['node_id', 'ngram_id', 'weight'], [d for d in data])
dbg.show('Miam computed')