Adding constants + parsers for CERN

b11e1f9a · c24b · 2e8dd028 · b11e1f9a · b11e1f9a
Commit b11e1f9a authored May 11, 2016 by c24b
Hide whitespace changes
Inline Side-by-side

Showing with 5 additions and 4 deletions

constants.py gargantext/constants.py +1 -1

Cern.py gargantext/util/parsers/Cern.py +4 -3

No files found.
--- a/gargantext/constants.py
+++ b/gargantext/constants.py
@@ -195,7 +195,7 @@ RESOURCETYPES = [
    },
    # type 10
   {    "name": 'CERN',
-        "parser": CERNParser,
+        "parser": CernParser,
        "default_language": "en",
   },
 ]

--- a/gargantext/util/parsers/Cern.py
+++ b/gargantext/util/parsers/Cern.py
@@ -5,7 +5,7 @@ import json
 class CernParser(Parser):
-    self.MARC21 = {
+    MARC21 = {
            "100":{"a": "author_name",
                        "v": "author_affiliation",
                        "w": "author_country",
@@ -32,12 +32,13 @@ class CernParser(Parser):
            "653": {"a":"keywords"},
            "856": {"u":"pdf_source"},
            }
    def parse(self, filebuf):
        tree = etree.tostring(filebuf)
        #root = tree.getroot()
+        hyperdata_list =[]
        soup = BeautifulSoup(tree, "lxml")
-        for record in soupr.find_all("record"):
+        for record in soup.find_all("record"):
            r = {v:[] for v in self.MARC21["700"].values()}
            r["uid"]  = soup.find("controlfield").text