calibre-web/cps/metadata_provider/scholar.py

62 lines
2.3 KiB
Python
Raw Normal View History

2021-07-05 18:55:54 +02:00
# -*- coding: utf-8 -*-
# This file is part of the Calibre-Web (https://github.com/janeczku/calibre-web)
# Copyright (C) 2021 OzzieIsaacs
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
2021-07-06 20:24:27 +02:00
from scholarly import scholarly
2021-07-05 18:55:54 +02:00
from cps.services.Metadata import Metadata
2021-07-06 20:24:27 +02:00
class scholar(Metadata):
2021-07-08 19:14:38 +02:00
__name__ = "Google Scholar"
__id__ = "googlescholar"
2021-07-05 18:55:54 +02:00
2021-08-29 14:36:05 +02:00
def search(self, query, generic_cover=""):
2021-07-07 21:10:38 +02:00
val = list()
2021-07-05 18:55:54 +02:00
if self.active:
2021-07-07 21:10:38 +02:00
scholar_gen = scholarly.search_pubs(' '.join(query.split('+')))
i = 0
for publication in scholar_gen:
v = dict()
v['id'] = "1234" # publication['bib'].get('title')
v['title'] = publication['bib'].get('title')
v['authors'] = publication['bib'].get('author', [])
v['description'] = publication['bib'].get('abstract', "")
v['publisher'] = publication['bib'].get('venue', "")
if publication['bib'].get('pub_year'):
v['publishedDate'] = publication['bib'].get('pub_year')+"-01-01"
else:
v['publishedDate'] = ""
v['tags'] = ""
v['ratings'] = 0
v['series'] = ""
2021-08-29 14:36:05 +02:00
v['cover'] = generic_cover
2021-07-31 09:18:05 +02:00
v['url'] = publication.get('pub_url') or publication.get('eprint_url') or "",
2021-07-07 21:10:38 +02:00
v['source'] = {
2021-07-08 19:14:38 +02:00
"id": self.__id__,
2021-07-07 21:10:38 +02:00
"description": "Google Scholar",
"link": "https://scholar.google.com/"
}
val.append(v)
i += 1
if (i >= 10):
break
return val
2021-07-06 20:24:27 +02:00
2021-07-05 18:55:54 +02:00