2021-04-23 18:23:02 +03:00
|
|
|
import re
|
|
|
|
from enum import Enum
|
|
|
|
|
|
|
|
from nexus.nlptools.regex import (
|
|
|
|
DOI_REGEX,
|
|
|
|
ISBN_REGEX,
|
|
|
|
NID_REGEX,
|
2021-05-02 10:45:22 +03:00
|
|
|
ONLY_DOI_REGEX,
|
2021-04-23 18:23:02 +03:00
|
|
|
URL_REGEX,
|
|
|
|
)
|
|
|
|
|
|
|
|
# ToDo: redo all, code is logically incorrect now
|
|
|
|
|
|
|
|
|
|
|
|
class QueryClass(Enum):
|
|
|
|
Default = 'default'
|
|
|
|
DOI = 'doi'
|
|
|
|
ISBN = 'isbn'
|
|
|
|
NID = 'nid'
|
|
|
|
URL = 'url'
|
|
|
|
|
|
|
|
|
|
|
|
def check_doi(query) -> (QueryClass, str):
|
2021-05-02 10:45:22 +03:00
|
|
|
if (
|
|
|
|
((r := re.search(DOI_REGEX, query)) and re.search(URL_REGEX, query))
|
|
|
|
or re.search(ONLY_DOI_REGEX, query)
|
|
|
|
):
|
2021-04-23 18:23:02 +03:00
|
|
|
doi = (r[1] + '/' + r[2]).lower()
|
|
|
|
return {
|
|
|
|
'doi': doi,
|
|
|
|
'query': f'doi:"{doi}"',
|
|
|
|
'class': QueryClass.DOI,
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
def check_isbn(query: str) -> (QueryClass, str):
|
|
|
|
if r := re.search(ISBN_REGEX, query):
|
|
|
|
isbn = r[1].replace('-', '')
|
|
|
|
return {
|
|
|
|
'isbn': isbn,
|
|
|
|
'query': 'isbns:' + isbn,
|
|
|
|
'class': QueryClass.ISBN
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
def check_nid(query: str) -> (QueryClass, str):
|
|
|
|
if r := re.search(NID_REGEX, query):
|
|
|
|
return {
|
|
|
|
'id': r[1],
|
|
|
|
'query': 'id:' + r[1],
|
|
|
|
'class': QueryClass.NID,
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
def check_url(query: str) -> (QueryClass, str):
|
|
|
|
if r := re.search(URL_REGEX, query):
|
|
|
|
return {
|
|
|
|
'url': r[0],
|
|
|
|
'query': r[0],
|
|
|
|
'class': QueryClass.URL,
|
|
|
|
}
|