import json
from typing import List, Optional

import firebase_admin
import pandas as pd
import streamlit as st
from firebase_admin import credentials, firestore


def initialize_firebase():
    """Initialize Firebase Admin (once per process) and return a Firestore client."""
    try:
        # get_app() raises ValueError when no default app has been created yet.
        firebase_admin.get_app()
    except ValueError:
        # First run: build credentials from the service-account JSON stored in
        # Streamlit secrets and initialize the default app.
        firebase_creds = json.loads(st.secrets["FIREBASE_CREDENTIALS"])
        cred = credentials.Certificate(firebase_creds)
        firebase_admin.initialize_app(cred)
    return firestore.client()


db = initialize_firebase()
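# Note: st.cache_resource could also cache the client across Streamlit reruns,
# but the get_app() guard above already makes repeated initialization safe.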


def normalize_device_id(device_info: dict) -> str:
    """Collapse a deviceInfo payload into a stable identifier for aggregation.

    iOS model names map one-to-one onto hardware, so the model alone suffices;
    Android devices are bucketed by brand, model, and memory tier.
    """
    emulator = "/Emulator" if device_info["isEmulator"] else ""
    if device_info["systemName"].lower() == "ios":
        return f"iOS/{device_info['model']}{emulator}"

    # Bucket Android devices by total RAM in whole GiB, e.g. "8GB".
    memory_tier = f"{device_info['totalMemory'] // (1024**3)}GB"
    return f"{device_info['brand']}/{device_info['model']}/{memory_tier}{emulator}"
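
# Example with hypothetical payloads: {"brand": "google", "model": "Pixel 8",
# "totalMemory": 8 * 1024**3, "systemName": "Android", "isEmulator": False}
# maps to "google/Pixel 8/8GB"; an iOS entry with model "iPhone 15 Pro"
# maps to "iOS/iPhone 15 Pro".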


def format_params_in_b(params: int) -> float:
    """Convert a raw parameter count to billions, rounding by magnitude."""
    b_value = params / 1e9
    if b_value >= 10:
        return round(b_value, 1)
    elif b_value >= 1:
        return round(b_value, 2)
    else:
        return round(b_value, 3)
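
# For example, 7_241_732_096 parameters formats as 7.24 and 70_553_706_496 as
# 70.6; values under one billion keep three decimals (0.135 for 135M).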


def format_leaderboard_data(submissions: List[dict]) -> pd.DataFrame:
    """Format raw submissions into a flat DataFrame for leaderboard display."""
    formatted_data = []

    for sub in submissions:
        try:
            benchmark_result = sub.get("benchmarkResult", {})
            device_info = sub.get("deviceInfo", {})

            if not benchmark_result or not device_info:
                continue

            # Skip legacy submissions that predate initSettings.
            if "initSettings" not in benchmark_result:
                continue

            # Emulator runs are not representative of real hardware.
            if device_info.get("isEmulator", False):
                continue

            config = benchmark_result.get("config", {})
            init_settings = benchmark_result.get("initSettings", {})
            peak_memory = benchmark_result.get("peakMemoryUsage", {})

            formatted_data.append(
                {
                    "Device": device_info.get("model", "Unknown"),
                    "Platform": device_info.get("systemName", "Unknown"),
                    "Benchmark": (
                        f"{config.get('label', 'Unknown')} "
                        f"(pp: {config.get('pp', 'N/A')}, tg: {config.get('tg', 'N/A')})"
                    ),
                    "PP Config": config.get("pp", "N/A"),
                    "TG Config": config.get("tg", "N/A"),
                    "Model": benchmark_result.get("modelName", "Unknown"),
                    "Model Size": format_params_in_b(
                        benchmark_result.get("modelNParams", 0)
                    ),
                    "Prompt Processing": round(benchmark_result.get("ppAvg", 0), 2),
                    "Token Generation": round(benchmark_result.get("tgAvg", 0), 2),
                    "Memory Usage (%)": peak_memory.get("percentage"),
                    "Peak Memory (GB)": (
                        round(peak_memory.get("used", 0) / (1024**3), 2)
                        if peak_memory.get("used")
                        else None
                    ),
                    "Total Memory (GB)": round(
                        device_info.get("totalMemory", 0) / (1024**3), 2
                    ),
                    "CPU Cores": device_info.get("cpuDetails", {}).get(
                        "cores", "Unknown"
                    ),
                    "Normalized Device ID": normalize_device_id(device_info),
                    "Timestamp": benchmark_result.get("timestamp", "Unknown"),
                    "Model ID": benchmark_result.get("modelId", "Unknown"),
                    "OID": benchmark_result.get("oid"),
                    "n_threads": init_settings.get("n_threads", -1),
                    "n_gpu_layers": init_settings.get("n_gpu_layers", 0),
                    "flash_attn": init_settings.get("flash_attn", False),
                    "cache_type_k": init_settings.get("cache_type_k", "f16"),
                    "cache_type_v": init_settings.get("cache_type_v", "f16"),
                    "n_context": init_settings.get("n_context", -1),
                    "n_batch": init_settings.get("n_batch", -1),
                    "n_ubatch": init_settings.get("n_ubatch", -1),
                    "Version": device_info.get("version", "Unknown"),
                }
            )
        except Exception as e:
            st.warning(f"Error processing submission: {e}")
            continue

    return pd.DataFrame(formatted_data)
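
# Sketch of downstream use (hypothetical page code): the frame renders directly,
# e.g. st.dataframe(df.sort_values("Token Generation", ascending=False)).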


def fetch_leaderboard_data(
    model_name: Optional[str] = None, benchmark_label: Optional[str] = None
) -> pd.DataFrame:
    """Fetch leaderboard data from Firestore, optionally filtered by model and benchmark label."""
    try:
        submissions_ref = (
            db.collection("benchmarks").document("v1").collection("submissions")
        )

        all_docs = list(submissions_ref.stream())

        if not all_docs:
            return pd.DataFrame()

        submissions = []

        for doc in all_docs:
            data = doc.to_dict()

            if not data or "benchmarkResult" not in data:
                continue

            benchmark_result = data["benchmarkResult"]

            # "All" (or None) disables the corresponding filter.
            if (
                model_name
                and model_name != "All"
                and benchmark_result.get("modelName") != model_name
            ):
                continue
            if (
                benchmark_label
                and benchmark_label != "All"
                and benchmark_result.get("config", {}).get("label") != benchmark_label
            ):
                continue

            submissions.append(data)

        return format_leaderboard_data(submissions)

    except Exception as e:
        st.error(f"Error fetching data from Firestore: {e}")
        return pd.DataFrame()
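
# Usage sketch (hypothetical caller): fetch everything, or pass a model name
# and/or benchmark label to filter, e.g.
#   df = fetch_leaderboard_data(model_name="All", benchmark_label="All")
#   st.dataframe(df)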