Spaces:

DenisT
/

brain-rot-tok

Sleeping

brain-rot-tok / endpoints /utils.py

add and disable rumble option, webscraper is buggin

dc61d50 12 months ago

1.57 kB

	import os
	import shutil
	import time
	import httpx
	from bs4 import BeautifulSoup


	def get_file_name(prefix: str) -> str:
	    """Return a timestamped ``.mp4`` file name that starts with *prefix*.

	    The name has the form ``<prefix>_<YYYYMMDD-HHMMSS>.mp4`` and uses the
	    current local time. The resolution is one second, so two calls with
	    the same prefix inside the same second return the same name.
	    """
	    timestamp = time.strftime("%Y%m%d-%H%M%S")
	    return f"{prefix}_{timestamp}.mp4"


	def remove_content_from_dir(folder: str) -> None:
	    """Delete everything inside *folder*, leaving *folder* itself in place.

	    Real sub-directories are removed recursively. Every other entry
	    (regular files, symlinks -- including links that point at a
	    directory -- and special files such as FIFOs) is unlinked.

	    Deletion is best-effort: a failure on one entry is printed and the
	    remaining entries are still processed.

	    Raises:
	        OSError: if *folder* itself cannot be listed (for example because
	            it does not exist).
	    """
	    for filename in os.listdir(folder):
	        file_path = os.path.join(folder, filename)
	        try:
	            # isdir() follows symlinks and rmtree() refuses to operate on
	            # a symlink, so a link to a directory must be unlinked, not
	            # walked. Anything that is not a real directory is unlinked,
	            # which also covers special files.
	            if os.path.isdir(file_path) and not os.path.islink(file_path):
	                shutil.rmtree(file_path)
	            else:
	                os.unlink(file_path)
	        except OSError as e:
	            print(f"Failed to delete {file_path}. Reason: {e}")


	async def rumble_link_scraper(rumble_link: str) -> "str | None":
	    """Resolve a Rumble link to a download URL via the imgpanda.com endpoint.

	    Posts *rumble_link* as form data to the imgpanda AJAX endpoint, parses
	    the returned body as HTML and takes the ``href`` of the last ``<a>``
	    tag found in it, with backslashes and double quotes removed.

	    Returns:
	        The cleaned link, or ``None`` (after printing a message) when the
	        endpoint answers with a status other than 200 or the body holds
	        no ``<a>`` tag with an ``href``.

	    Exceptions raised by ``httpx`` while sending the request are not
	    caught here and propagate to the caller.
	    """
	    url = "https://imgpanda.com/wp-admin/admin-ajax.php"
	    headers = {"Content-Type": "application/x-www-form-urlencoded"}
	    data = {
	        "action": "ajax_call_custom",
	        "SocialDownUrl": rumble_link,
	        "downloaderType": "Rumble",
	        "serverName": "Server2",
	    }

	    async with httpx.AsyncClient() as client:
	        response = await client.post(url, headers=headers, data=data)

	    if response.status_code != 200:
	        print(f"Error: {response.status_code}")
	        return None

	    # Drop the first and last space-separated tokens of the body before
	    # parsing. NOTE(review): presumably these wrap the HTML fragment --
	    # confirm against a live response.
	    inner_html_string = " ".join(response.text.split(" ")[1:-1])
	    inner_soup = BeautifulSoup(inner_html_string, "html.parser")

	    # Every <a> tag in the fragment is considered (no class filter is
	    # applied); the last one is taken as the download link.
	    a_tags = inner_soup.select("a")
	    href = a_tags[-1].get("href") if a_tags else None
	    if href is None:
	        print('No matching <a> tag found within the class "social-download-result"')
	        return None

	    return href.replace("\\", "").replace('"', "")