-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathgleason_pathology.py
65 lines (54 loc) · 1.76 KB
/
gleason_pathology.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
import csv
import sys
import requests
import json
import psycopg2
# User fed parameters
file="pathology.json"
solr_url="<Enter Solr URL here>"
conn_string = "host='%s' dbname='%s' user='%s' password='%s' port=%s" % ('host',
'dbname',
'user',
'password',
'port')
# Constructing solr_url
url = solr_url + '/update?commit=true'
headers = {
'Content-type': 'application/json',
}
# Connecting to the database
conn = psycopg2.connect(conn_string)
cursor = conn.cursor()
# Extracting person_source_value -> person_id mapping information from the database
cursor.execute("""SELECT person_id, person_source_value from mimic_v5.person;""")
result = cursor.fetchall()
map = dict()
for i in result:
pid = i[0]
psv = str(i[1])
if psv not in map:
map[psv] = pid
# Pushing data to Solr
content = ""
with open(file, 'r') as f:
for line in f.readlines():
content += line
json_list = json.loads(content)
# Uploading file in chunks to server
s = []
for j in json_list:
# Getting the person_source_value to person_id mapping
if str(j['subject']) not in map:
continue
subject_id = map[str(j['subject'])]
# Modifying input data with subject_id
j['subject'] = subject_id
# Appending to upload list
s.append(j)
data = json.dumps(s)
response = requests.post(url, headers=headers, data=data)
if response.status_code != 200:
print("Couldn't upload")
print(response.reason)
else:
print ("\n\nUploaded Gleason Pathology Reports\n\n")