import re
from typing import (
    AsyncIterable,
    Callable,
)

from library.logging import error_log
from nexus.pylon.exceptions import RegexNotFoundError

from .base import (
    DoiSource,
    PreparedRequest,
)


class LibgenDoiSource(DoiSource):
    base_url = 'http://libgen.gs'
    resolve_timeout = 10

    async def resolve(self, error_log_func: Callable = error_log) -> AsyncIterable[PreparedRequest]:
        async with self.get_resolve_session() as session:
            # The ads.php page for a DOI embeds a signed link to the actual file.
            url = f'{self.base_url}/scimag/ads.php?doi={self.doi}'
            async with PreparedRequest(
                method='get',
                url=url,
                timeout=self.resolve_timeout,
            ).execute_with(session=session) as resp:
                downloaded_page_bytes = await resp.read()
                downloaded_page = downloaded_page_bytes.decode('utf-8', 'backslashreplace')
                # Pull the direct get.php download link (doi + access key) out of the page.
                match = re.search(
                    r'https?://.*/scimag/get\.php\?doi=.*&key=[A-Za-z0-9]+',
                    downloaded_page,
                    re.IGNORECASE,
                )
                if match:
                    yield PreparedRequest(method='get', url=match.group(), timeout=self.timeout)
                else:
                    error_log_func(RegexNotFoundError(url=url))
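

# A minimal usage sketch, not part of the original module: one way resolve() might be
# consumed. The constructor call and the DOI value below are assumptions; the real
# keyword arguments are defined by DoiSource in .base and may differ.
if __name__ == '__main__':
    import asyncio

    async def _example() -> None:
        # Hypothetical instantiation with a placeholder DOI.
        source = LibgenDoiSource(doi='10.1000/xyz123')
        async for prepared_request in source.resolve():
            # Each yielded PreparedRequest carries a candidate direct download URL.
            print(prepared_request.url)

    asyncio.run(_example())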