diff --git a/.gitignore b/.gitignore index f13d16f8bfa5d49bd05f86666bfc9c8a180d8ef8..575b7a337a170ef3d2851e96da98dcbb64b652c5 100644 --- a/.gitignore +++ b/.gitignore @@ -1,2 +1,3 @@ dataSources/PubMed/tmp/* +dataSources/PubMed/data/* .venv \ No newline at end of file diff --git a/dataSources/PubMed/data/save_3_years.json b/dataSources/PubMed/data/save_3_years.json deleted file mode 100644 index 0637a088a01e8ddab3bf3fa98dbe804cbde1a0dc..0000000000000000000000000000000000000000 --- a/dataSources/PubMed/data/save_3_years.json +++ /dev/null @@ -1 +0,0 @@ -[] \ No newline at end of file diff --git a/dataSources/PubMed/pubmedApi.py b/dataSources/PubMed/pubmedApi.py index 8523c34c8bfe4b1090a354ad457787bd1f1b603c..df29e744902d2570583d88b851cfee7b602643aa 100644 --- a/dataSources/PubMed/pubmedApi.py +++ b/dataSources/PubMed/pubmedApi.py @@ -85,16 +85,20 @@ def getPubmedData(term, date_min, date_max, nb_items = -1, debug = False, store for part in entrie["MedlineCitation"]["Article"]["Journal"]["Title"]: if "#text" in part: data["Title"] += part["#text"] - else: - data["Title"] = entrie["MedlineCitation"]["Article"]["Journal"]["Title"] + elif isinstance(entrie["MedlineCitation"]["Article"]["Journal"]["Title"], object): + data["Title"] = entrie["MedlineCitation"]["Article"]["Journal"]["Title"]["#text"] + else: + data["Title"] = entrie["MedlineCitation"]["Article"]["Journal"]["Title"] data["ArticleTitle"] = "" if isinstance(entrie["MedlineCitation"]["Article"]["ArticleTitle"], list): for part in entrie["MedlineCitation"]["Article"]["ArticleTitle"]: if "#text" in part: data["ArticleTitle"] += part["#text"] - else: - data["ArticleTitle"] = entrie["MedlineCitation"]["Article"]["ArticleTitle"] + elif isinstance(entrie["MedlineCitation"]["Article"]["ArticleTitle"], object): + data["ArticleTitle"] = entrie["MedlineCitation"]["Article"]["ArticleTitle"]["#text"] + else: + data["ArticleTitle"] = entrie["MedlineCitation"]["Article"]["ArticleTitle"] data["Abstract"] = "" if "Abstract" in entrie["MedlineCitation"]["Article"] : @@ -102,6 +106,8 @@ def getPubmedData(term, date_min, date_max, nb_items = -1, debug = False, store for part in entrie["MedlineCitation"]["Article"]["Abstract"]["AbstractText"]: if "#text" in part: data["Abstract"] += part["#text"] + elif isinstance(entrie["MedlineCitation"]["Article"]["Abstract"]["AbstractText"], object): + data["Abstract"] = entrie["MedlineCitation"]["Article"]["Abstract"]["AbstractText"]["#text"] else: data["Abstract"] = entrie["MedlineCitation"]["Article"]["Abstract"]["AbstractText"]