Spaces:
Running
Running
Update app.py
Browse files
app.py
CHANGED
@@ -22,10 +22,10 @@ def find_all(url,q=None,num=None):
|
|
22 |
for tag in soup.find_all():
|
23 |
try:
|
24 |
n = tag.get(tag.string)
|
25 |
-
rawp.append(
|
26 |
except Exception as e:
|
27 |
print (e)
|
28 |
-
rawp.append(
|
29 |
|
30 |
#rawp.append(tag.string)
|
31 |
for url in soup.find_all('a'):
|
@@ -43,8 +43,8 @@ def find_it(url,q=None,num=None):
|
|
43 |
soup = bs4.BeautifulSoup(source,'lxml')
|
44 |
for p in soup.find_all(f'{q}'):
|
45 |
#out.append(p)
|
46 |
-
out.append(p.string)
|
47 |
-
out.append(p.parent.name)
|
48 |
|
49 |
for url in soup.find_all('a'):
|
50 |
print(url.get('href'))
|
|
|
22 |
for tag in soup.find_all():
|
23 |
try:
|
24 |
n = tag.get(tag.string)
|
25 |
+
rawp.append({tag.name:tag.string,"parent":tag.parent.name,"children":tag.children.name})
|
26 |
except Exception as e:
|
27 |
print (e)
|
28 |
+
rawp.append({tag.name:tag.string})
|
29 |
|
30 |
#rawp.append(tag.string)
|
31 |
for url in soup.find_all('a'):
|
|
|
43 |
soup = bs4.BeautifulSoup(source,'lxml')
|
44 |
for p in soup.find_all(f'{q}'):
|
45 |
#out.append(p)
|
46 |
+
out.append({q:p.string,"parent":p.parent.name})
|
47 |
+
#out.append(p.parent.name)
|
48 |
|
49 |
for url in soup.find_all('a'):
|
50 |
print(url.get('href'))
|