Skip to content

Latest commit

 

History

History
53 lines (36 loc) · 1.59 KB

README.md

File metadata and controls

53 lines (36 loc) · 1.59 KB

Crawler providers system

Build status

What is it?

Manga crawler plugin system (see manga-py/manga_py)

Usage example

from sys import stderr

from crawler_providers import matched_providers
from crawler_providers.exceptions import *
from crawler_providers.types import *

url = 'http://best-site/manga/awesome'

# Look up the providers that match the URL; stop with exit status 1 if
# the lookup reports that none was found.
try:
    providers = matched_providers(url)  # type: list
except ProviderNotFoundError:
    print('Provider not found', file=stderr)
    # SystemExit is a builtin, unlike exit(), which is only injected by the
    # `site` module and may be missing (e.g. under `python -S`).
    raise SystemExit(1)
print('Providers count: {}'.format(len(providers)))

for p in providers:
    # OR p.new(url) OR p(url, quiet=True) for "silent mode"
    # See documentation: https://manga-py.com/providers/ or https://manga-py.github.com/providers/
    provider = p(url)

    # overload default chapter name:
    Chapter.name_format = '%s/{vol:>03}_ch_{ch:>03}' % (provider.__class__.__name__,)

    try:
        chapters = provider.get_chapters()
    except ChaptersNotFoundException:
        print('Chapters not found')
        continue

    for chapter in chapters:
        print('chapter: {}'.format(chapter))

        try:
            files = provider.get_chapter_files(chapter)
        except ImagesNotFoundException as e:
            # e.chapter == chapter (for async methods)
            print('Images not found for chapter: {}'.format(e.chapter))
            continue

        # Report the count per chapter, inside the loop: `files` is only
        # bound when get_chapter_files() succeeded for this chapter, so
        # printing it after the loop could hit an unbound or stale value.
        print('Files count: {}'.format(len(files)))