Spaces:
Build error
Build error
Update app.py
Browse files
app.py
CHANGED
|
@@ -12,11 +12,12 @@ def link_find(url):
|
|
| 12 |
rawp=(f'RAW TEXT RETURNED: {soup.text}')
|
| 13 |
cnt=0
|
| 14 |
cnt+=len(rawp)
|
|
|
|
| 15 |
#out.append(rawp)
|
| 16 |
#out.append("HTML fragments: ")
|
| 17 |
q=("a","p","span","content","article")
|
| 18 |
for p in soup.find_all("a"):
|
| 19 |
-
out.append({"LINK TITLE":p.get('title'),"URL":p.get('href'),"STRING":p.string,"TREE":[]})
|
| 20 |
else:
|
| 21 |
pass
|
| 22 |
return out
|
|
|
|
| 12 |
rawp=(f'RAW TEXT RETURNED: {soup.text}')
|
| 13 |
cnt=0
|
| 14 |
cnt+=len(rawp)
|
| 15 |
+
rawt=soup.text
|
| 16 |
#out.append(rawp)
|
| 17 |
#out.append("HTML fragments: ")
|
| 18 |
q=("a","p","span","content","article")
|
| 19 |
for p in soup.find_all("a"):
|
| 20 |
+
out.append({"LINK TITLE":p.get('title'),"URL":p.get('href'),"STRING":p.string,"TEXT":rawt,"TREE":[]})
|
| 21 |
else:
|
| 22 |
pass
|
| 23 |
return out
|