diff --git a/1-enrich-with-datacite/concatenate-enrich-dois.py b/1-enrich-with-datacite/concatenate-enrich-dois.py index 111059b540c5fda572dae6e0bb99272f80323348..0f74b736617e44d9d4e298a1a070201495b6f7f6 100644 --- a/1-enrich-with-datacite/concatenate-enrich-dois.py +++ b/1-enrich-with-datacite/concatenate-enrich-dois.py @@ -63,10 +63,10 @@ if temp_rows : if result[0] not in dois_added: dois_added.append(result[0]) df_fresh.loc[i, "doi"] = result[0] - df_fresh.loc[i, "relation_nbInstances"] = result[1] - df_fresh.loc[i, "relation_nbCitation"] = result[2] - if str(result[3]) != "[]": df_fresh.loc[i, "traveled_dois"] = str(result[3]) - if str(result[4]) != "[]": df_fresh.loc[i, "all_relations"] = str(result[4]) + if str(result[1]) != "[]": df_fresh.loc[i, "traveled_dois"] = str(result[1]) + else: df_fresh.loc[i, "traveled_dois"] = "" + if str(result[2]) != "[]": df_fresh.loc[i, "all_relations"] = str(result[2]) + else: df_fresh.loc[i, "all_relations"] = "" else: to_del.append(i) diff --git a/1-enrich-with-datacite/z_personal_functions.py b/1-enrich-with-datacite/z_personal_functions.py index a7ddc7dd1c232560f0c85105ca1129246b018f4c..bf19cd4aa0a4b8ec3b5e3e2b7b3ca01ffad75598 100644 --- a/1-enrich-with-datacite/z_personal_functions.py +++ b/1-enrich-with-datacite/z_personal_functions.py @@ -1,12 +1,11 @@ import requests, json -def get_origin_version(doi, count=0, cited=0, history=[], first=True): +def get_origin_version(doi, history=[], first=True): if first: history=[] # ligne ajoutée pour éviter certains soucis de cache où history n'est pas vide au premier appel de la fonction - cited = 0 req = requests.get( f"https://api.datacite.org/dois/{doi}" ) res = req.json() final = [] - result = (doi, count, cited, history, final) + result = (doi, history, final) try: related = res["data"]["attributes"]["relatedIdentifiers"] except: @@ -20,14 +19,13 @@ def get_origin_version(doi, count=0, cited=0, history=[], first=True): ignore = True elem_to_save_i = i.get("relatedIdentifier") history.append([i.get("relationType"), i.get("relatedIdentifier")]) - if i.get("relationType") == "isCitedBy" and i.get("relatedIdentifierType") == "DOI": cited += 1 if i.get("relationType") == "IsIdenticalTo" and i.get("relatedIdentifierType") == "DOI": duplicate = True elem_to_save_d = i.get("relatedIdentifier") history.append([i.get("relationType"), i.get("relatedIdentifier")]) if duplicate and not(ignore): - result = (elem_to_save_d, count, cited, history, final) - if ignore: result = get_origin_version(elem_to_save_i, count+1, cited, history, False) + result = (elem_to_save_d, history, final) + if ignore: result = get_origin_version(elem_to_save_i, history, False) return result def get_md_from_datacite( doi ) :