-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathmerger.py
92 lines (83 loc) · 4.21 KB
/
merger.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
from rdflib import Graph
from objects import Person, Zenodo, Article
import openalex
def sources(name):
"""
It queries all the databases merging the results into single objects
Initially authored by Ricardo Usbeck
Args:
name: keyword to search for in the databases
Returns:
the graph object and the formatted results
"""
g = Graph()
results = []
# g, results = dblp.search(name, g, results)
# g, results = zenodo.search(name, g, results)
g, results = openalex.open_alex(name, g, results)
# TODO add materialized triples via https://github.com/RDFLib/OWL-RL
g.parse('zenodo2schema.ttl')
g = g.serialize(format="ttl")
return g, format_results(results)
def format_results(results):
"""From the results obtained from the databases it creates an HTML, and it returns it
Args:
results: array of the different types of results
Returns:
string: single string with the HTML of the results
"""
formatted_results = """<!DOCTYPE html>
<html>
<head>
<style>
.subtitle {display: inline; font-size: 20px;}
.title {display: inline; font-size: 30px;}
a { color: blue; }
.url { color: gray; }
.emoji { font-size:20px }
.emoji-title { font-size:30px }
</style>
</head>
<body>"""
person_result = "<h1 class='title'>Researchers - </h1><span class='emoji-title'>🦉</span><br><br>"
exist_person = False
article_result = "<h1 class='title'>Articles - </h1><span class='emoji-title'>📰</span><br><br>"
exist_article = False
zenodo_result = "<h1 class='title'>Zenodo - </h1><span class='emoji-title'>💼</span><br><br>"
exist_zenodo = False
for result in results:
if type(result) is Person:
person_result += "<span class='emoji'>🦉</span><h2 class='subtitle'><a href='" + \
result.URL.split(' - ')[0]+"' target='_blank' >"+result.name + \
"</a></h2><p class='faded'>"+result.URL+"</p><br>"
exist_person = True
elif type(result) is Article:
if " - " in result.URL:
article_result += "<p class='url'>" + result.URL \
+ "</p><span class='emoji'>📰</span><h2 class='subtitle'></i><a href='" +\
result.URL.split(" - ")[0] + "' target='_blank'>" + \
result.title + "</a></h2> - " + result.date + "<p>" + result.authors + "</p><br>"
else:
article_result += "<p class='url'>" + result.URL +\
"</p><span class='emoji'>📰</span><h2 class='subtitle'><a href='"+result.URL+\
"' target='_blank'>" + result.title + \
"</a></h2> - "+result.date+"<p>"+result.authors+"</p><br>"
exist_article = True
elif type(result) is Zenodo:
zenodo_result += "<p class='url'>" + result.URL +\
"</p><span class='emoji'>💼</span><h2 class='subtitle'><a href='"+\
result.URL+"' target='_blank'>" + result.title + \
"</a></h2> - "+result.date+ "<p>" + result.type + "</p><br>"
exist_zenodo = True
else:
print("Type of result not yet handled")
#Checking that we have actual results and act accordingly if not
if not exist_person:
person_result = ""
if not exist_article:
article_result = ""
if not exist_zenodo:
zenodo_result = ""
if not exist_zenodo and not exist_article and not exist_person:
person_result = "<br><br><h1>No results found </h1><span class='emoji-title'>😥</span>"
return formatted_results + person_result + article_result + zenodo_result + "</body></html>"