summaryrefslogtreecommitdiffstatshomepage
path: root/tests/scrapers/test_scraper.py
blob: 6f6f29d97f06832162759039ffc1b77f91196ee6 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
from hircine.scraper import Scraper, ScrapeWarning


class MockScraper(Scraper):
    is_available = True

    def scrape(self):
        yield lambda: "foo"
        yield "bar"


class WarningScraper(Scraper):
    is_available = True

    def warn(self, str):
        raise ScrapeWarning("Invalid input")

    def scrape(self):
        yield lambda: "foo"
        yield lambda: self.warn("bar")
        yield "baz"


class ParserlessScraper(Scraper):
    is_available = True

    def scrape(self):
        yield "literal"


def test_scraper_collects():
    generator = MockScraper(None).collect()

    assert set(generator) == set(["foo", "bar"])


def test_scraper_collects_with_transformer():
    generator = MockScraper(None).collect([lambda gen, info: map(str.upper, gen)])

    assert set(generator) == set(["FOO", "BAR"])


def test_scraper_collects_warnings():
    scraper = WarningScraper(None)
    generator = scraper.collect()

    assert set(generator) == set(["foo", "baz"])
    assert scraper.get_warnings() == ["Invalid input"]


def test_scraper_collects_literal():
    scraper = ParserlessScraper(None)
    generator = scraper.collect()

    assert set(generator) == set(["literal"])