calibre-web/cps/metadata_provider/scholar.py

68 lines
2.5 KiB
Python
Raw Normal View History

2021-07-05 09:55:54 -07:00
# -*- coding: utf-8 -*-
# This file is part of the Calibre-Web (https://github.com/janeczku/calibre-web)
# Copyright (C) 2021 OzzieIsaacs
#
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
try:
from fake_useragent.errors import FakeUserAgentError
except (ImportError):
FakeUserAgentError = BaseException
try:
from scholarly import scholarly
except FakeUserAgentError:
raise ImportError("No module named 'scholarly'")
2021-07-05 09:55:54 -07:00
from cps.services.Metadata import Metadata
2021-07-06 11:24:27 -07:00
class scholar(Metadata):
2021-07-08 10:14:38 -07:00
__name__ = "Google Scholar"
__id__ = "googlescholar"
2021-07-05 09:55:54 -07:00
2021-12-23 20:16:41 -08:00
def search(self, query, generic_cover=""):
2021-07-07 12:10:38 -07:00
val = list()
2021-07-05 09:55:54 -07:00
if self.active:
2021-07-07 12:10:38 -07:00
scholar_gen = scholarly.search_pubs(' '.join(query.split('+')))
i = 0
for publication in scholar_gen:
v = dict()
2021-12-23 15:05:20 -08:00
v['id'] = publication['url_scholarbib'].split(':')[1]
2021-07-07 12:10:38 -07:00
v['title'] = publication['bib'].get('title')
v['authors'] = publication['bib'].get('author', [])
v['description'] = publication['bib'].get('abstract', "")
v['publisher'] = publication['bib'].get('venue', "")
if publication['bib'].get('pub_year'):
v['publishedDate'] = publication['bib'].get('pub_year')+"-01-01"
else:
v['publishedDate'] = ""
2021-12-23 15:05:20 -08:00
v['tags'] = []
v['rating'] = 0
2021-07-07 12:10:38 -07:00
v['series'] = ""
2022-01-04 12:11:52 -08:00
v['cover'] = ""
2021-07-31 00:18:05 -07:00
v['url'] = publication.get('pub_url') or publication.get('eprint_url') or "",
2021-07-07 12:10:38 -07:00
v['source'] = {
2021-07-08 10:14:38 -07:00
"id": self.__id__,
2021-07-07 12:10:38 -07:00
"description": "Google Scholar",
"link": "https://scholar.google.com/"
}
val.append(v)
i += 1
if (i >= 10):
break
return val
2021-07-06 11:24:27 -07:00
2021-07-05 09:55:54 -07:00