Commit 8a3abdd7 authored by delanoe

[FEAT] Europress old files.

parent 53e8b81c
import sys
sys.path.append('/srv/gargantext')
from admin.env import *
#from admin.env import *
import re
import locale
from lxml import etree
......@@ -168,6 +168,7 @@ class EuropressFileParser(FileParser):
if test_date_fr is not None or test_date_fr_v2 is not None:
hyperdata['language_iso2'] = 'fr'
self.localeEncoding = "fr_FR"
locale.setlocale(locale.LC_ALL, "fr_FR.utf-8")
if encoding != "utf-8":
......@@ -198,6 +199,7 @@ class EuropressFileParser(FileParser):
if test_date_en is not None:
hyperdata['language_iso2'] = 'en'
localeEncoding = "en_GB.UTF-8"
locale.setlocale(locale.LC_ALL, localeEncoding)
try :
......@@ -259,10 +261,6 @@ class EuropressFileParser(FileParser):
except :
hyperdata['publication_date'] = timezone.now()
#if lang == 'fr':
#hyperdata['language_iso2'] = 'fr'
#elif lang == 'en':
# hyperdata['language_iso2'] = 'en'
hyperdata['publication_year'] = hyperdata['publication_date'].strftime('%Y')
hyperdata['publication_month'] = hyperdata['publication_date'].strftime('%m')
......
......@@ -3,6 +3,7 @@ from .IsiFileParser import IsiFileParser
from .JstorFileParser import JstorFileParser
from .ZoteroFileParser import ZoteroFileParser
from .PubmedFileParser import PubmedFileParser
from .EuropressFileParser_old import EuropressFileParser
from .EuropressFileParser_en import EuropressFileParser_en
from .EuropressFileParser_fr import EuropressFileParser_fr
from .ISTex import ISTex
......
......@@ -6,7 +6,7 @@ parsers = {
'Scopus (RIS format)' : RisFileParser,
'Zotero (RIS format)' : ZoteroFileParser,
'Jstor (RIS format)' : JstorFileParser,
#'Europress' : EuropressFileParser,
'Europress (old corpora)' : EuropressFileParser,
'Europress (French)' : EuropressFileParser_fr,
'Europress (English)' : EuropressFileParser_en,
'CSVParser' : CSVParser,
......
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment