File size: 674 Bytes
d6fdb17
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import os
import sys
import unittest

from bs4 import BeautifulSoup

sys.path.append(os.path.abspath("../scripts"))

from browse import extract_hyperlinks


class TestBrowseLinks(unittest.TestCase):
    """Unit tests for ``extract_hyperlinks`` from the ``browse`` module."""

    def test_extract_hyperlinks(self):
        """Expect one (text, url) pair per anchor, in document order.

        The fixture holds an absolute href, a relative href and a
        non-anchor element. The expected result keeps the absolute URL
        unchanged, resolves the relative one against the base URL, and
        contains no entry for the ``<div>``.
        """
        # Arrange: fixture markup, the base URL, and the pairs we expect.
        base_url = "http://example.com"
        html = """
        <body>
        <a href="https://google.com">Google</a>
        <a href="foo.html">Foo</a>
        <div>Some other crap</div>
        </body>
        """
        expected = [
            ("Google", "https://google.com"),
            ("Foo", "http://example.com/foo.html"),
        ]

        # Act: parse the markup and run the function under test.
        parsed = BeautifulSoup(html, "html.parser")
        actual = extract_hyperlinks(parsed, base_url)

        # Assert: same pairs, same order.
        self.assertEqual(actual, expected)