-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathfind_retractions.py
63 lines (46 loc) · 1.89 KB
/
find_retractions.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
import requests
from db import save_retraction_to_db, retracted_id_exists, get_latest_timestamp
user_agent = "RetractionBot (https://github.com/Samwalton9/RetractionBot; mailto:[email protected])"
def get_crossref_retractions():
# List of crossref retraction types based on, but stricter than,
# https://github.com/fathomlabs/crossref-retractions/blob/master/index.js
retraction_types = [
'removal',
'retraction',
'Retraction',
'retration',
]
crossref_api_url = ('https://api.crossref.org/works'
'?filter=update-type:{type},from-pub-date:{date}'
'&select=DOI,update-to,created'
'&rows=1000'
'&offset={offset}')
latest_date = get_latest_timestamp()
for retraction_type in retraction_types:
items_count = 0
continue_running = True
while continue_running:
response = requests.get(crossref_api_url.format(
date=latest_date,
type=retraction_type,
offset=items_count
),
headers={'User-Agent': user_agent}
)
json_response = response.json()
returned_items = json_response['message']['items']
if len(returned_items) == 0:
continue_running = False
else:
items_count += len(returned_items)
for item in returned_items:
timestamp = item['created']['date-time']
old_doi = item['update-to'][0]['DOI']
new_doi = item['DOI']
if not retracted_id_exists(new_doi):
save_retraction_to_db(timestamp, 'doi', 'Crossref',
old_doi, new_doi)
def get_ncbi_retractions():
pass
if __name__ == '__main__':
get_crossref_retractions()