-
Notifications
You must be signed in to change notification settings - Fork 4
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge pull request #6 from DavidFichtmueller/main
Added support for ORCID search
- Loading branch information
Showing
5 changed files
with
173 additions
and
3 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,3 +1,4 @@ | ||
from .orcid import Orcid | ||
from .orcid_authentication import OrcidAuthentication | ||
from .orcid_scrapper import OrcidScrapper | ||
from .orcid_scrapper import OrcidScrapper | ||
from .orcid_search import OrcidSearch |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,162 @@ | ||
import requests | ||
import os | ||
from urllib import parse | ||
|
||
class OrcidSearch(): | ||
''' | ||
This is a wrapper class for ORCID Search API | ||
''' | ||
def __init__(self, orcid_access_token = " ", state = "public", sandbox=False) -> None: | ||
''' | ||
Initialize orcid search instance | ||
state : Whether to use public or member API of ORCID | ||
orcid_access_token : Orcid access token obtained from the user with this orcid_id (default: "public") | ||
sandbox : bool : a boolean value to show if the ORCID sandbox API should be used (default: False) | ||
''' | ||
self._orcid_access_token = orcid_access_token | ||
self._state = state | ||
self._sandbox = sandbox | ||
# For testing purposes (pytesting on github workflow) | ||
if orcid_access_token != " ": | ||
try: | ||
self.__is_access_token_valid() | ||
except: | ||
if not self.__test_is_access_token_valid(): | ||
raise ValueError( | ||
f"Invalid access token! Please make sure the provided credentials are correct.") | ||
|
||
return | ||
|
||
def search(self, query, start = 0, rows = 1000, search_mode = "expanded-search", columns = "orcid,given-names,family-name,current-institution-affiliation-name"): | ||
''' | ||
Search orcid records | ||
for details on the query format see https://info.orcid.org/documentation/api-tutorials/api-tutorial-searching-the-orcid-registry/ | ||
query : the search query | ||
start : the offset for the paginated search, default = 0 | ||
rows : the number of rows to be returned, default = 1000 | ||
search_mode : the search mode, either "expanded-search" (default), "search", or "csv-search" | ||
columns : for the csv-search, default: "orcid,given-names,family-name,current-institution-affiliation-name" | ||
return : a dictionary of search results | ||
''' | ||
|
||
access_token = self._orcid_access_token | ||
|
||
|
||
_search_mode = "expanded-search" | ||
if search_mode == "search" or search_mode == "csv-search": | ||
_search_mode = search_mode | ||
_columns = columns | ||
query_encoded = parse.quote_plus(query) | ||
|
||
api_url = "" | ||
|
||
if self._state == "public": | ||
# Specify the ORCID record endpoint for the desired ORCID iD | ||
api_url = f'https://pub.orcid.org/' | ||
if (self._sandbox): | ||
api_url = f'https://pub.sandbox.orcid.org/' # for testing | ||
|
||
elif self._state == "member": | ||
api_url = f'https://api.orcid.org/' | ||
if (self._sandbox): | ||
api_url = f'https://api.sandbox.orcid.org/' # for testing | ||
|
||
api_url = api_url + f'v3.0/{_search_mode}/?q={query_encoded}&start={start}&rows={rows}' | ||
|
||
content_type = 'application/json' | ||
if search_mode == "csv-search": | ||
api_url = api_url + f'&fl={columns}' | ||
content_type = "text/csv" | ||
|
||
# Set the headers with the access token for authentication | ||
headers = { | ||
'Authorization': f'Bearer {access_token}', | ||
'Content-Type': f'{content_type}' | ||
} | ||
|
||
#print(api_url) | ||
|
||
# Make a GET request to retrieve the ORCID record | ||
response = requests.get(api_url, headers=headers) | ||
|
||
# The request was successful | ||
data = response.json() | ||
# Check the response status code | ||
if response.status_code == 200 or data is not None: | ||
return data | ||
else: | ||
# Handle the case where the request failed | ||
print("Failed to retrieve ORCID search results. Status code:", response.status_code) | ||
return None | ||
def __is_access_token_valid(self): | ||
''' | ||
Checks if the current access token is valid | ||
''' | ||
access_token = self._orcid_access_token | ||
|
||
if access_token == "": | ||
raise ValueError( | ||
"Empty value for access token! Please make sure you are authenticated by ORCID as developer.") | ||
# Make a test request to the API using the token | ||
headers = { | ||
'Authorization': f'Bearer {access_token}', | ||
'Content-Type': 'application/json' | ||
} | ||
|
||
api_url = "" | ||
|
||
if self._state == "public": | ||
# Specify the ORCID record endpoint for the desired ORCID iD | ||
api_url = f'https://pub.orcid.org/v3.0/search' | ||
if (self._sandbox): | ||
api_url = f'https://pub.sandbox.orcid.org/v3.0/search' # for testing | ||
|
||
elif self._state == "member": | ||
api_url = f'https://api.orcid.org/v3.0/search' | ||
if (self._sandbox): | ||
api_url = f'https://api.sandbox.orcid.org/v3.0/search' # for testing | ||
|
||
response = requests.get(api_url, headers=headers) | ||
|
||
if response.status_code == 404: | ||
# The request was successful, and the token is likely valid | ||
return False | ||
else: | ||
# The request failed, indicating that the token may have expired or is invalid | ||
return True | ||
|
||
## THESE FUNCTIONS ARE FOR TESTING PURPOSES ## | ||
|
||
def __test_is_access_token_valid(self): | ||
''' | ||
FOR TESTING PURPOSES ONLY | ||
Checks if the current access token is valid | ||
''' | ||
# Access the environment variable from github secrets | ||
access_token = os.environ["ORCID_ACCESS_TOKEN"] | ||
if access_token == "": | ||
raise ValueError( | ||
"Empty value for access token! Please make sure you are authenticated by ORCID as developer.") | ||
# Make a test request to the API using the token | ||
headers = { | ||
'Authorization': f'Bearer {access_token}', | ||
'Content-Type': 'application/json' | ||
} | ||
|
||
api_url = "" | ||
|
||
if self._state == "public": | ||
# Specify the ORCID record endpoint for the desired ORCID iD | ||
api_url = f'https://pub.sandbox.orcid.org/v3.0/search' | ||
|
||
elif self._state == "member": | ||
api_url = f'https://api.sandbox.orcid.org/v3.0/search' | ||
|
||
response = requests.get(api_url, headers=headers) | ||
if response.status_code == 404: | ||
# The request was successful, and the token is likely valid | ||
return False | ||
else: | ||
# The request failed, indicating that the token may have expired or is invalid | ||
return True |