XAUUSD-PRO

Paused

App Files Files Community

XAUUSD-PRO / fetch_news.py

Dooratre

Upload 4 files

10e8373 verified 3 months ago

raw

history blame

6.36 kB

	import requests
	from datetime import datetime, timedelta

	def fetch_news_items():
	"""
	Fetch the main TradingView news feed for XAUUSD and DXY,
	return it as a Python dictionary (JSON).
	"""
	url = (
	"https://news-mediator.tradingview.com/news-flow/v2/news"
	"?filter=lang%3Aen&filter=symbol%3AOANDA%3AXAUUSD%2CTVC%3ADXY"
	"&client=screener&streaming=true"
	)
	headers = {
	"User-Agent": (
	"Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
	"AppleWebKit/537.36 (KHTML, like Gecko) "
	"Chrome/138.0.0.0 Safari/537.36"
	)
	}
	response = requests.get(url, headers=headers)
	response.raise_for_status()
	return response.json()


	def fetch_story_by_id(story_id):
	"""
	Given a story ID from the news feed, fetch its full content JSON
	(shortDescription, astDescription, etc.) from TradingView.
	"""
	base_url = "https://news-headlines.tradingview.com/v3/story"
	params = {
	"id": story_id,
	"lang": "en"
	}
	headers = {
	"User-Agent": (
	"Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
	"AppleWebKit/537.36 (KHTML, like Gecko) "
	"Chrome/138.0.0.0 Safari/537.36"
	)
	}
	response = requests.get(base_url, headers=headers, params=params)
	response.raise_for_status()
	return response.json()


	def parse_ast_node(node):
	"""
	Recursively parse an AST node from the 'astDescription' field:
	- If it's a string, just return it.
	- If it's a dictionary with a known 'type', handle it.
	- Otherwise, parse children recursively.
	"""
	if isinstance(node, str):
	# Direct text
	return node

	if isinstance(node, dict):
	node_type = node.get("type", "")
	children = node.get("children", [])

	if node_type == "root":
	# 'root' typically contains multiple children; parse them all
	return "".join(parse_ast_node(child) for child in children)

	elif node_type == "p":
	# Paragraph node: parse children, add a newline
	paragraph_text = "".join(parse_ast_node(child) for child in children)
	return paragraph_text + "\n"

	elif node_type == "url":
	# Format a hyperlink: [text](url)
	params = node.get("params", {})
	link_text = params.get("linkText", "")
	url = params.get("url", "")
	return f"{link_text} ({url})"

	elif node_type == "symbol":
	# Format a symbol mention
	params = node.get("params", {})
	symbol = params.get("symbol", "")
	text = params.get("text", "")
	return text if text else symbol

	else:
	# Unknown or unhandled node type; parse children anyway
	return "".join(parse_ast_node(child) for child in children)

	# If not string or dict (e.g., None?), return empty string
	return ""


	def extract_full_content_from_story(story_data):
	"""
	Extract the full textual content from a story, handling both
	shortDescription and the more detailed astDescription if available.
	"""
	# Try to get the AST description first (more detailed)
	ast_description = story_data.get("astDescription")
	if ast_description:
	return parse_ast_node(ast_description)

	# Fall back to short description if AST not available
	return story_data.get("shortDescription", "No content available")


	def get_recent_news_items(hours=100):
	"""
	Fetch recent news items within the specified number of hours
	and return detailed information including publish time and full content.
	"""
	# Get current time and calculate the threshold
	now_utc = datetime.utcnow()
	time_threshold = now_utc - timedelta(hours=hours)

	# Fetch news data
	news_data = fetch_news_items()
	items = news_data.get("items", [])
	detailed_news = []

	for item in items:
	item_id = item.get("id", "")
	published_ts = item.get("published")

	if not item_id or not published_ts:
	continue

	published_dt = datetime.utcfromtimestamp(published_ts)
	if published_dt >= time_threshold:
	# For each qualifying news item, fetch its full story content
	try:
	story_data = fetch_story_by_id(item_id)

	# Create a detailed news item
	detailed_item = {
	"id": item_id,
	"title": item.get("title", ""),
	"source": item.get("source", {}).get("name", ""),
	"published_time": published_dt.strftime("%Y-%m-%d %H:%M:%S UTC"),
	"timestamp": published_ts,
	"content": extract_full_content_from_story(story_data)
	}
	detailed_news.append(detailed_item)
	except Exception as e:
	print(f"Error fetching details for story {item_id}: {e}")

	# Sort by timestamp descending (newest first)
	detailed_news.sort(key=lambda x: x["timestamp"], reverse=True)
	return detailed_news


	def build_news_summary(news_items):
	"""
	Build a comprehensive summary of news items, including title, source,
	publication time, and full content.
	"""
	if not news_items:
	return "No recent news available."

	summaries = []
	for item in news_items:
	summary = (
	f"📰 {item['title']}\n"
	f"🔍 Source: {item['source']}\n"
	f"⏰ Published: {item['published_time']}\n"
	f"📝 Content:\n{item['content']}\n"
	f"{'=' * 50}"
	)
	summaries.append(summary)

	return "\n\n".join(summaries)


	def get_formatted_news_summary(hours=24):
	"""
	Convenience function to get a formatted news summary for the specified time period.
	"""
	news_items = get_recent_news_items(hours)
	return build_news_summary(news_items)


	# Example usage:
	if __name__ == "__main__":
	print("Fetching recent gold and DXY news...")
	news_summary = get_formatted_news_summary(48) # Get news from the last 48 hours
	print(news_summary)