|
import streamlit as st |
|
from huggingface_hub import HfApi |
|
import pandas as pd |
|
import matplotlib.pyplot as plt |
|
import seaborn as sns |
|
from datetime import datetime |
|
from concurrent.futures import ThreadPoolExecutor, as_completed |
|
from functools import lru_cache |
|
import time |
|
import requests |
|
from collections import Counter |
|
import numpy as np |
|
|
|
st.set_page_config(page_title="HF Contributions", layout="wide", initial_sidebar_state="expanded") |
|
|
|
|
|
st.markdown(""" |
|
<style> |
|
/* μ¬μ΄λλ° μ€νμΌλ§ */ |
|
[data-testid="stSidebar"] { |
|
min-width: 35vw !important; |
|
max-width: 35vw !important; |
|
background-color: #f8f9fa; |
|
padding: 1rem; |
|
border-right: 1px solid #e9ecef; |
|
} |
|
|
|
/* ν€λ μ€νμΌλ§ */ |
|
h1, h2, h3 { |
|
color: #1e88e5; |
|
font-weight: 700; |
|
} |
|
h1 { |
|
font-size: 2.5rem; |
|
margin-bottom: 1.5rem; |
|
border-bottom: 2px solid #e0e0e0; |
|
padding-bottom: 0.5rem; |
|
} |
|
h2 { |
|
font-size: 1.8rem; |
|
margin-top: 1.5rem; |
|
} |
|
h3 { |
|
font-size: 1.4rem; |
|
margin-top: 1rem; |
|
} |
|
|
|
/* μΉ΄λ μ€νμΌλ§ */ |
|
div[data-testid="stMetric"] { |
|
background-color: #f1f8fe; |
|
border-radius: 10px; |
|
padding: 1rem; |
|
box-shadow: 0 2px 5px rgba(0,0,0,0.05); |
|
margin-bottom: 1rem; |
|
} |
|
|
|
/* μ°¨νΈ μ»¨ν
μ΄λ μ€νμΌλ§ */ |
|
.chart-container { |
|
background-color: white; |
|
border-radius: 10px; |
|
padding: 1rem; |
|
box-shadow: 0 2px 10px rgba(0,0,0,0.1); |
|
margin: 1rem 0; |
|
} |
|
|
|
/* ν
μ΄λΈ μ€νμΌλ§ */ |
|
div[data-testid="stDataFrame"] { |
|
background-color: white; |
|
border-radius: 10px; |
|
padding: 0.5rem; |
|
box-shadow: 0 2px 5px rgba(0,0,0,0.05); |
|
} |
|
|
|
/* ν μ€νμΌλ§ */ |
|
button[data-baseweb="tab"] { |
|
font-weight: 600; |
|
} |
|
|
|
/* μλΈν€λ λ°°κ²½ */ |
|
.subheader { |
|
background-color: #f1f8fe; |
|
padding: 0.5rem 1rem; |
|
border-radius: 5px; |
|
margin-bottom: 1rem; |
|
} |
|
|
|
/* μ 보 λ±μ§ */ |
|
.info-badge { |
|
background-color: #e3f2fd; |
|
color: #1976d2; |
|
padding: 0.3rem 0.7rem; |
|
border-radius: 20px; |
|
display: inline-block; |
|
font-weight: 500; |
|
margin-right: 0.5rem; |
|
} |
|
|
|
/* νλ‘κ·Έλ μ€ λ° */ |
|
div[data-testid="stProgress"] { |
|
height: 0.5rem !important; |
|
} |
|
|
|
/* λ²νΌ μ€νμΌλ§ */ |
|
.stButton button { |
|
background-color: #1e88e5; |
|
color: white; |
|
border: none; |
|
font-weight: 500; |
|
} |
|
|
|
/* κ²½κ³ /μ±κ³΅ λ©μμ§ κ°μ */ |
|
div[data-testid="stAlert"] { |
|
border-radius: 10px; |
|
margin: 1rem 0; |
|
} |
|
|
|
/* μΉ΄ν
κ³ λ¦¬ λΆμ μΉμ
*/ |
|
.category-section { |
|
background-color: white; |
|
border-radius: 10px; |
|
padding: 1rem; |
|
margin-bottom: 1.5rem; |
|
box-shadow: 0 2px 5px rgba(0,0,0,0.05); |
|
} |
|
</style> |
|
""", unsafe_allow_html=True) |
|
|
|
api = HfApi() |
|
|
|
|
|
@lru_cache(maxsize=1000) |
|
def cached_repo_info(repo_id, repo_type): |
|
return api.repo_info(repo_id=repo_id, repo_type=repo_type) |
|
|
|
@lru_cache(maxsize=1000) |
|
def cached_list_commits(repo_id, repo_type): |
|
return list(api.list_repo_commits(repo_id=repo_id, repo_type=repo_type)) |
|
|
|
@lru_cache(maxsize=100) |
|
def cached_list_items(username, kind): |
|
if kind == "model": |
|
return list(api.list_models(author=username)) |
|
elif kind == "dataset": |
|
return list(api.list_datasets(author=username)) |
|
elif kind == "space": |
|
return list(api.list_spaces(author=username)) |
|
return [] |
|
|
|
|
|
@lru_cache(maxsize=1) |
|
def get_trending_accounts(limit=100): |
|
try: |
|
trending_data = {"spaces": [], "models": []} |
|
|
|
|
|
spaces_response = requests.get("https://huggingface.co/api/spaces", |
|
params={"limit": 10000}, |
|
timeout=30) |
|
|
|
|
|
models_response = requests.get("https://huggingface.co/api/models", |
|
params={"limit": 10000}, |
|
timeout=30) |
|
|
|
|
|
spaces_owners = [] |
|
if spaces_response.status_code == 200: |
|
spaces = spaces_response.json() |
|
|
|
|
|
owner_counts_spaces = {} |
|
for space in spaces: |
|
if '/' in space.get('id', ''): |
|
owner, _ = space.get('id', '').split('/', 1) |
|
else: |
|
owner = space.get('owner', '') |
|
|
|
if owner != 'None': |
|
owner_counts_spaces[owner] = owner_counts_spaces.get(owner, 0) + 1 |
|
|
|
|
|
top_owners_spaces = sorted(owner_counts_spaces.items(), key=lambda x: x[1], reverse=True)[:limit] |
|
trending_data["spaces"] = top_owners_spaces |
|
spaces_owners = [owner for owner, _ in top_owners_spaces] |
|
|
|
|
|
models_owners = [] |
|
if models_response.status_code == 200: |
|
models = models_response.json() |
|
|
|
|
|
owner_counts_models = {} |
|
for model in models: |
|
if '/' in model.get('id', ''): |
|
owner, _ = model.get('id', '').split('/', 1) |
|
else: |
|
owner = model.get('owner', '') |
|
|
|
if owner != 'None': |
|
owner_counts_models[owner] = owner_counts_models.get(owner, 0) + 1 |
|
|
|
|
|
top_owners_models = sorted(owner_counts_models.items(), key=lambda x: x[1], reverse=True)[:limit] |
|
trending_data["models"] = top_owners_models |
|
models_owners = [owner for owner, _ in top_owners_models] |
|
|
|
|
|
combined_score = {} |
|
for i, owner in enumerate(spaces_owners): |
|
if owner not in combined_score: |
|
combined_score[owner] = 0 |
|
combined_score[owner] += (limit - i) |
|
|
|
for i, owner in enumerate(models_owners): |
|
if owner not in combined_score: |
|
combined_score[owner] = 0 |
|
combined_score[owner] += (limit - i) |
|
|
|
|
|
sorted_combined = sorted(combined_score.items(), key=lambda x: x[1], reverse=True)[:limit] |
|
trending_authors = [owner for owner, _ in sorted_combined] |
|
|
|
return trending_authors, trending_data["spaces"], trending_data["models"] |
|
except Exception as e: |
|
st.error(f"Error fetching trending accounts: {str(e)}") |
|
fallback_authors = ["ritvik77", "facebook", "google", "stabilityai", "Salesforce", "tiiuae", "bigscience"] |
|
return fallback_authors, [(author, 0) for author in fallback_authors], [(author, 0) for author in fallback_authors] |
|
|
|
|
|
class RateLimiter: |
|
def __init__(self, calls_per_second=10): |
|
self.calls_per_second = calls_per_second |
|
self.last_call = 0 |
|
|
|
def wait(self): |
|
current_time = time.time() |
|
time_since_last_call = current_time - self.last_call |
|
if time_since_last_call < (1.0 / self.calls_per_second): |
|
time.sleep((1.0 / self.calls_per_second) - time_since_last_call) |
|
self.last_call = time.time() |
|
|
|
rate_limiter = RateLimiter() |
|
|
|
|
|
def fetch_commits_for_repo(repo_id, repo_type, username, selected_year): |
|
try: |
|
rate_limiter.wait() |
|
|
|
repo_info = cached_repo_info(repo_id, repo_type) |
|
if repo_info.private or (hasattr(repo_info, 'gated') and repo_info.gated): |
|
return [], 0 |
|
|
|
|
|
initial_commit_date = pd.to_datetime(repo_info.created_at).tz_localize(None).date() |
|
commit_dates = [] |
|
commit_count = 0 |
|
|
|
|
|
if initial_commit_date.year == selected_year: |
|
commit_dates.append(initial_commit_date) |
|
commit_count += 1 |
|
|
|
|
|
commits = cached_list_commits(repo_id, repo_type) |
|
for commit in commits: |
|
commit_date = pd.to_datetime(commit.created_at).tz_localize(None).date() |
|
if commit_date.year == selected_year: |
|
commit_dates.append(commit_date) |
|
commit_count += 1 |
|
|
|
return commit_dates, commit_count |
|
except Exception as e: |
|
return [], 0 |
|
|
|
|
|
def get_commit_events(username, kind=None, selected_year=None): |
|
commit_dates = [] |
|
items_with_type = [] |
|
kinds = [kind] if kind else ["model", "dataset", "space"] |
|
|
|
for k in kinds: |
|
try: |
|
items = cached_list_items(username, k) |
|
items_with_type.extend((item, k) for item in items) |
|
repo_ids = [item.id for item in items] |
|
|
|
|
|
chunk_size = 5 |
|
for i in range(0, len(repo_ids), chunk_size): |
|
chunk = repo_ids[i:i + chunk_size] |
|
with ThreadPoolExecutor(max_workers=min(5, len(chunk))) as executor: |
|
future_to_repo = { |
|
executor.submit(fetch_commits_for_repo, repo_id, k, username, selected_year): repo_id |
|
for repo_id in chunk |
|
} |
|
for future in as_completed(future_to_repo): |
|
repo_commits, repo_count = future.result() |
|
if repo_commits: |
|
commit_dates.extend(repo_commits) |
|
except Exception as e: |
|
st.warning(f"Error fetching {k}s for {username}: {str(e)}") |
|
|
|
|
|
df = pd.DataFrame(commit_dates, columns=["date"]) |
|
if not df.empty: |
|
df = df.drop_duplicates() |
|
return df, items_with_type |
|
|
|
|
|
def make_calendar_heatmap(df, title, year): |
|
if df.empty: |
|
st.info(f"No {title.lower()} found for {year}.") |
|
return |
|
|
|
|
|
df["count"] = 1 |
|
df = df.groupby("date", as_index=False).sum() |
|
df["date"] = pd.to_datetime(df["date"]) |
|
|
|
|
|
start = pd.Timestamp(f"{year}-01-01") |
|
end = pd.Timestamp(f"{year}-12-31") |
|
all_days = pd.date_range(start=start, end=end) |
|
|
|
|
|
heatmap_data = pd.DataFrame({"date": all_days, "count": 0}) |
|
heatmap_data = heatmap_data.merge(df, on="date", how="left", suffixes=("", "_y")) |
|
heatmap_data["count"] = heatmap_data["count_y"].fillna(0) |
|
heatmap_data = heatmap_data.drop("count_y", axis=1) |
|
|
|
|
|
heatmap_data["dow"] = heatmap_data["date"].dt.dayofweek |
|
heatmap_data["week"] = (heatmap_data["date"] - start).dt.days // 7 |
|
|
|
|
|
pivot = heatmap_data.pivot(index="dow", columns="week", values="count").fillna(0) |
|
|
|
|
|
month_labels = pd.date_range(start, end, freq="MS").strftime("%b") |
|
month_positions = pd.date_range(start, end, freq="MS").map(lambda x: (x - start).days // 7) |
|
|
|
|
|
from matplotlib.colors import ListedColormap, BoundaryNorm |
|
colors = ['#ebedf0', '#9be9a8', '#40c463', '#30a14e', '#216e39'] |
|
bounds = [0, 1, 3, 11, 31, float('inf')] |
|
cmap = ListedColormap(colors) |
|
norm = BoundaryNorm(bounds, cmap.N) |
|
|
|
|
|
fig, ax = plt.subplots(figsize=(12, 1.5)) |
|
|
|
|
|
pivot_int = pivot.astype(int) |
|
|
|
|
|
sns.heatmap(pivot_int, ax=ax, cmap=cmap, norm=norm, linewidths=0.5, linecolor="white", |
|
square=True, cbar=False, yticklabels=["M", "T", "W", "T", "F", "S", "S"]) |
|
|
|
ax.set_title(f"{title}", fontsize=14, pad=10) |
|
ax.set_xlabel("") |
|
ax.set_ylabel("") |
|
ax.set_xticks(month_positions) |
|
ax.set_xticklabels(month_labels, fontsize=10) |
|
ax.set_yticklabels(ax.get_yticklabels(), rotation=0, fontsize=10) |
|
|
|
|
|
fig.tight_layout() |
|
fig.patch.set_facecolor('#F8F9FA') |
|
|
|
st.pyplot(fig) |
|
|
|
|
|
def create_contribution_radar(username, models_count, spaces_count, datasets_count, commits_count): |
|
|
|
categories = ['Models', 'Spaces', 'Datasets', 'Activity'] |
|
values = [models_count, spaces_count, datasets_count, commits_count] |
|
|
|
|
|
max_vals = [100, 100, 50, 500] |
|
normalized = [min(v/m, 1.0) for v, m in zip(values, max_vals)] |
|
|
|
|
|
angles = np.linspace(0, 2*np.pi, len(categories), endpoint=False).tolist() |
|
angles += angles[:1] |
|
|
|
normalized += normalized[:1] |
|
|
|
fig, ax = plt.subplots(figsize=(6, 6), subplot_kw={'polar': True}, facecolor='#F8F9FA') |
|
|
|
|
|
ax.set_theta_offset(np.pi / 2) |
|
ax.set_theta_direction(-1) |
|
ax.set_thetagrids(np.degrees(angles[:-1]), categories, fontsize=12, fontweight='bold') |
|
|
|
|
|
ax.grid(color='#CCCCCC', linestyle='-', linewidth=0.5, alpha=0.7) |
|
|
|
|
|
ax.fill(angles, normalized, color='#4CAF50', alpha=0.25) |
|
ax.plot(angles, normalized, color='#4CAF50', linewidth=3) |
|
|
|
|
|
for i, val in enumerate(values): |
|
angle = angles[i] |
|
x = (normalized[i] + 0.1) * np.cos(angle) |
|
y = (normalized[i] + 0.1) * np.sin(angle) |
|
ax.text(angle, normalized[i] + 0.1, str(val), |
|
ha='center', va='center', fontsize=12, |
|
fontweight='bold', color='#1976D2') |
|
|
|
|
|
circles = [0.25, 0.5, 0.75, 1.0] |
|
for circle in circles: |
|
ax.plot(angles, [circle] * len(angles), color='gray', alpha=0.3, linewidth=0.5, linestyle='--') |
|
|
|
ax.set_title(f"{username}'s Contribution Profile", fontsize=16, pad=20, fontweight='bold') |
|
|
|
|
|
ax.set_facecolor('#F8F9FA') |
|
|
|
return fig |
|
|
|
|
|
def create_contribution_pie(model_commits, dataset_commits, space_commits): |
|
labels = ['Models', 'Datasets', 'Spaces'] |
|
sizes = [model_commits, dataset_commits, space_commits] |
|
|
|
|
|
filtered_labels = [label for label, size in zip(labels, sizes) if size > 0] |
|
filtered_sizes = [size for size in sizes if size > 0] |
|
|
|
if not filtered_sizes: |
|
return None |
|
|
|
|
|
colors = ['#FF9800', '#2196F3', '#4CAF50'] |
|
filtered_colors = [color for color, size in zip(colors, sizes) if size > 0] |
|
|
|
fig, ax = plt.subplots(figsize=(7, 7), facecolor='#F8F9FA') |
|
|
|
|
|
explode = [0.1] * len(filtered_sizes) |
|
|
|
wedges, texts, autotexts = ax.pie( |
|
filtered_sizes, |
|
labels=None, |
|
colors=filtered_colors, |
|
autopct='%1.1f%%', |
|
startangle=90, |
|
shadow=True, |
|
explode=explode, |
|
textprops={'fontsize': 14, 'weight': 'bold'}, |
|
wedgeprops={'edgecolor': 'white', 'linewidth': 2} |
|
) |
|
|
|
|
|
for autotext in autotexts: |
|
autotext.set_color('white') |
|
autotext.set_fontsize(12) |
|
autotext.set_weight('bold') |
|
|
|
|
|
ax.legend( |
|
wedges, |
|
[f"{label} ({size})" for label, size in zip(filtered_labels, filtered_sizes)], |
|
title="Contribution Types", |
|
loc="center left", |
|
bbox_to_anchor=(0.85, 0.5), |
|
fontsize=12 |
|
) |
|
|
|
ax.set_title('Distribution of Contributions by Type', fontsize=16, pad=20, fontweight='bold') |
|
ax.axis('equal') |
|
|
|
return fig |
|
|
|
|
|
def create_monthly_activity(df, year): |
|
if df.empty: |
|
return None |
|
|
|
|
|
df['date'] = pd.to_datetime(df['date']) |
|
df['month'] = df['date'].dt.month |
|
df['month_name'] = df['date'].dt.strftime('%b') |
|
|
|
|
|
month_order = ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'] |
|
counts_by_month = df.groupby('month_name')['date'].count() |
|
monthly_counts = pd.Series([counts_by_month.get(m, 0) for m in month_order], index=month_order) |
|
|
|
|
|
fig, ax = plt.subplots(figsize=(14, 6), facecolor='#F8F9FA') |
|
|
|
|
|
norm = plt.Normalize(0, monthly_counts.max() if monthly_counts.max() > 0 else 1) |
|
colors = plt.cm.viridis(norm(monthly_counts.values)) |
|
|
|
bars = ax.bar(monthly_counts.index, monthly_counts.values, color=colors, width=0.7) |
|
|
|
|
|
if monthly_counts.max() > 0: |
|
max_idx = monthly_counts.argmax() |
|
bars[max_idx].set_color('#FF5722') |
|
bars[max_idx].set_edgecolor('black') |
|
bars[max_idx].set_linewidth(1.5) |
|
|
|
|
|
ax.set_title(f'Monthly Activity in {year}', fontsize=18, pad=20, fontweight='bold') |
|
ax.set_xlabel('Month', fontsize=14, labelpad=10) |
|
ax.set_ylabel('Number of Contributions', fontsize=14, labelpad=10) |
|
|
|
|
|
for i, count in enumerate(monthly_counts.values): |
|
if count > 0: |
|
ax.text(i, count + 0.5, str(int(count)), ha='center', fontsize=12, fontweight='bold') |
|
|
|
|
|
ax.grid(axis='y', linestyle='--', alpha=0.7, color='#CCCCCC') |
|
ax.set_axisbelow(True) |
|
|
|
|
|
ax.spines['top'].set_visible(False) |
|
ax.spines['right'].set_visible(False) |
|
ax.spines['left'].set_linewidth(0.5) |
|
ax.spines['bottom'].set_linewidth(0.5) |
|
|
|
|
|
ax.tick_params(axis='x', labelsize=12, pad=5) |
|
ax.tick_params(axis='y', labelsize=12, pad=5) |
|
|
|
plt.tight_layout() |
|
|
|
return fig |
|
|
|
|
|
def simulate_follower_data(username, spaces_count, models_count, total_commits): |
|
|
|
|
|
import numpy as np |
|
from datetime import timedelta |
|
|
|
|
|
base_followers = max(10, int((spaces_count * 2 + models_count * 3 + total_commits/10) / 6)) |
|
|
|
|
|
end_date = datetime.now() |
|
start_date = end_date - timedelta(days=365) |
|
dates = pd.date_range(start=start_date, end=end_date, freq='W') |
|
|
|
|
|
followers = [] |
|
current = base_followers / 2 |
|
|
|
for i in range(len(dates)): |
|
growth_factor = 1 + (np.random.random() * 0.1) |
|
current = current * growth_factor |
|
followers.append(int(current)) |
|
|
|
|
|
followers[-1] = base_followers |
|
|
|
|
|
fig, ax = plt.subplots(figsize=(14, 6), facecolor='#F8F9FA') |
|
|
|
|
|
points = np.array([dates, followers]).T.reshape(-1, 1, 2) |
|
segments = np.concatenate([points[:-1], points[1:]], axis=1) |
|
|
|
from matplotlib.collections import LineCollection |
|
norm = plt.Normalize(0, len(segments)) |
|
lc = LineCollection(segments, cmap='viridis', norm=norm, linewidth=3, alpha=0.8) |
|
lc.set_array(np.arange(len(segments))) |
|
line = ax.add_collection(lc) |
|
|
|
|
|
ax.scatter(dates, followers, s=50, color='#9C27B0', alpha=0.8, zorder=10) |
|
|
|
|
|
ax.set_title(f"Estimated Follower Growth for {username}", fontsize=18, pad=20, fontweight='bold') |
|
ax.set_xlabel("Date", fontsize=14, labelpad=10) |
|
ax.set_ylabel("Followers", fontsize=14, labelpad=10) |
|
|
|
|
|
ax.set_xlim(dates.min(), dates.max()) |
|
ax.set_ylim(0, max(followers) * 1.1) |
|
|
|
|
|
ax.grid(True, linestyle='--', alpha=0.7, color='#CCCCCC') |
|
ax.set_axisbelow(True) |
|
|
|
|
|
ax.spines['top'].set_visible(False) |
|
ax.spines['right'].set_visible(False) |
|
ax.spines['left'].set_linewidth(0.5) |
|
ax.spines['bottom'].set_linewidth(0.5) |
|
|
|
|
|
ax.tick_params(axis='x', labelsize=12, rotation=45) |
|
ax.tick_params(axis='y', labelsize=12) |
|
|
|
|
|
ax.annotate(f"Start: {followers[0]}", |
|
xy=(dates[0], followers[0]), |
|
xytext=(10, 10), |
|
textcoords='offset points', |
|
fontsize=12, |
|
fontweight='bold', |
|
color='#9C27B0', |
|
bbox=dict(boxstyle="round,pad=0.3", fc="#F3E5F5", ec="#9C27B0", alpha=0.8)) |
|
|
|
ax.annotate(f"Current: {followers[-1]}", |
|
xy=(dates[-1], followers[-1]), |
|
xytext=(-10, 10), |
|
textcoords='offset points', |
|
fontsize=12, |
|
fontweight='bold', |
|
color='#9C27B0', |
|
ha='right', |
|
bbox=dict(boxstyle="round,pad=0.3", fc="#F3E5F5", ec="#9C27B0", alpha=0.8)) |
|
|
|
plt.tight_layout() |
|
|
|
return fig |
|
|
|
|
|
def create_ranking_chart(username, overall_rank, spaces_rank, models_rank): |
|
if not (overall_rank or spaces_rank or models_rank): |
|
return None |
|
|
|
|
|
fig, ax = plt.subplots(figsize=(12, 5), facecolor='#F8F9FA') |
|
|
|
categories = [] |
|
positions = [] |
|
colors = [] |
|
rank_values = [] |
|
|
|
if overall_rank: |
|
categories.append('Overall') |
|
positions.append(101 - overall_rank) |
|
colors.append('#673AB7') |
|
rank_values.append(overall_rank) |
|
|
|
if spaces_rank: |
|
categories.append('Spaces') |
|
positions.append(101 - spaces_rank) |
|
colors.append('#2196F3') |
|
rank_values.append(spaces_rank) |
|
|
|
if models_rank: |
|
categories.append('Models') |
|
positions.append(101 - models_rank) |
|
colors.append('#FF9800') |
|
rank_values.append(models_rank) |
|
|
|
|
|
bars = ax.barh(categories, positions, color=colors, alpha=0.8, height=0.6, |
|
edgecolor='white', linewidth=1.5) |
|
|
|
|
|
for i, bar in enumerate(bars): |
|
ax.text(bar.get_width() + 2, bar.get_y() + bar.get_height()/2, |
|
f'Rank #{rank_values[i]}', va='center', fontsize=12, |
|
fontweight='bold', color=colors[i]) |
|
|
|
|
|
ax.set_xlim(0, 105) |
|
ax.set_title(f"Ranking Positions for {username} (Top 100)", fontsize=18, pad=20, fontweight='bold') |
|
ax.set_xlabel("Percentile (higher is better)", fontsize=14, labelpad=10) |
|
|
|
|
|
ax.text(50, -0.6, "β Lower rank (higher number) | Higher rank (lower number) β", |
|
ha='center', va='center', fontsize=10, fontweight='bold', color='#666666') |
|
|
|
|
|
ax.axvline(x=90, color='#FF5252', linestyle='--', alpha=0.7, linewidth=2) |
|
ax.text(92, len(categories)/2, 'Top 10', color='#D32F2F', fontsize=12, |
|
rotation=90, va='center', fontweight='bold') |
|
|
|
|
|
ax.spines['top'].set_visible(False) |
|
ax.spines['right'].set_visible(False) |
|
ax.spines['left'].set_linewidth(0.5) |
|
ax.spines['bottom'].set_linewidth(0.5) |
|
|
|
|
|
ax.tick_params(axis='x', labelsize=12) |
|
ax.tick_params(axis='y', labelsize=14, pad=5) |
|
|
|
|
|
ax.grid(axis='x', linestyle='--', alpha=0.5, color='#CCCCCC') |
|
ax.set_axisbelow(True) |
|
|
|
|
|
ax.invert_xaxis() |
|
|
|
plt.tight_layout() |
|
return fig |
|
|
|
|
|
with st.spinner("Loading trending accounts..."): |
|
trending_accounts, top_owners_spaces, top_owners_models = get_trending_accounts(limit=100) |
|
|
|
|
|
with st.sidebar: |
|
st.markdown('<h1 style="text-align: center; color: #1E88E5;">π€ Contributor</h1>', unsafe_allow_html=True) |
|
|
|
|
|
tab1, tab2 = st.tabs([ |
|
"Top 100 Overall", |
|
"Top Spaces & Models" |
|
]) |
|
|
|
with tab1: |
|
|
|
st.markdown('<div class="subheader"><h3>π₯ Top 100 Contributors</h3></div>', unsafe_allow_html=True) |
|
|
|
|
|
if trending_accounts: |
|
|
|
spaces_rank = {owner: idx+1 for idx, (owner, _) in enumerate(top_owners_spaces)} |
|
models_rank = {owner: idx+1 for idx, (owner, _) in enumerate(top_owners_models)} |
|
|
|
|
|
overall_data = [] |
|
for idx, username in enumerate(trending_accounts[:100]): |
|
|
|
rank_display = "" |
|
if idx == 0: |
|
rank_display = "π " |
|
elif idx == 1: |
|
rank_display = "π " |
|
elif idx == 2: |
|
rank_display = "π " |
|
|
|
|
|
spaces_position = str(spaces_rank.get(username, "-")) |
|
models_position = str(models_rank.get(username, "-")) |
|
overall_data.append([f"{rank_display}{username}", spaces_position, models_position]) |
|
|
|
ranking_data_overall = pd.DataFrame( |
|
overall_data, |
|
columns=["Contributor", "Spaces Rank", "Models Rank"] |
|
) |
|
ranking_data_overall.index = ranking_data_overall.index + 1 |
|
|
|
st.dataframe( |
|
ranking_data_overall, |
|
height=900, |
|
column_config={ |
|
"Contributor": st.column_config.TextColumn("Contributor"), |
|
"Spaces Rank": st.column_config.TextColumn("Spaces Rank"), |
|
"Models Rank": st.column_config.TextColumn("Models Rank") |
|
}, |
|
use_container_width=True, |
|
hide_index=False |
|
) |
|
|
|
with tab2: |
|
|
|
st.markdown('<div class="subheader"><h3>π Spaces Leaders</h3></div>', unsafe_allow_html=True) |
|
|
|
|
|
if top_owners_spaces: |
|
spaces_data = [] |
|
for idx, (owner, count) in enumerate(top_owners_spaces[:50]): |
|
|
|
rank_display = "" |
|
if idx == 0: |
|
rank_display = "π₯ " |
|
elif idx == 1: |
|
rank_display = "π₯ " |
|
elif idx == 2: |
|
rank_display = "π₯ " |
|
|
|
spaces_data.append([f"{rank_display}{owner}", count]) |
|
|
|
ranking_data_spaces = pd.DataFrame(spaces_data, columns=["Contributor", "Spaces Count(Top 500 positions)"]) |
|
ranking_data_spaces.index = ranking_data_spaces.index + 1 |
|
|
|
st.dataframe( |
|
ranking_data_spaces, |
|
column_config={ |
|
"Contributor": st.column_config.TextColumn("Contributor"), |
|
"Spaces Count": st.column_config.NumberColumn("Spaces Count", format="%d") |
|
}, |
|
use_container_width=True, |
|
hide_index=False |
|
) |
|
|
|
|
|
st.markdown('<div class="subheader"><h3>π§ Models Leaders</h3></div>', unsafe_allow_html=True) |
|
|
|
|
|
if top_owners_models: |
|
models_data = [] |
|
for idx, (owner, count) in enumerate(top_owners_models[:50]): |
|
|
|
rank_display = "" |
|
if idx == 0: |
|
rank_display = "π₯ " |
|
elif idx == 1: |
|
rank_display = "π₯ " |
|
elif idx == 2: |
|
rank_display = "π₯ " |
|
|
|
models_data.append([f"{rank_display}{owner}", count]) |
|
|
|
ranking_data_models = pd.DataFrame(models_data, columns=["Contributor", "Models Count(Top 500 positions)"]) |
|
ranking_data_models.index = ranking_data_models.index + 1 |
|
|
|
st.dataframe( |
|
ranking_data_models, |
|
column_config={ |
|
"Contributor": st.column_config.TextColumn("Contributor"), |
|
"Models Count": st.column_config.NumberColumn("Models Count", format="%d") |
|
}, |
|
use_container_width=True, |
|
hide_index=False |
|
) |
|
|
|
|
|
st.markdown('<hr style="margin: 2rem 0; border-color: #e0e0e0;">', unsafe_allow_html=True) |
|
|
|
|
|
st.markdown('<div class="subheader"><h3>Select Contributor</h3></div>', unsafe_allow_html=True) |
|
selected_trending = st.selectbox( |
|
"Choose from trending accounts", |
|
options=trending_accounts[:100], |
|
index=0 if trending_accounts else None, |
|
key="trending_selectbox" |
|
) |
|
|
|
|
|
st.markdown('<div style="text-align: center; margin: 15px 0; font-weight: bold;">- OR -</div>', unsafe_allow_html=True) |
|
custom = st.text_input("Enter a username/organization:", placeholder="e.g. facebook, google...") |
|
|
|
|
|
st.markdown('<hr style="margin: 1.5rem 0; border-color: #e0e0e0;">', unsafe_allow_html=True) |
|
|
|
|
|
if custom.strip(): |
|
username = custom.strip() |
|
elif selected_trending: |
|
username = selected_trending |
|
else: |
|
username = "facebook" |
|
|
|
|
|
st.markdown('<div class="subheader"><h3>ποΈ Time Period</h3></div>', unsafe_allow_html=True) |
|
year_options = list(range(datetime.now().year, 2017, -1)) |
|
selected_year = st.selectbox("Select Year:", options=year_options) |
|
|
|
|
|
st.markdown('<div class="subheader"><h3>βοΈ Display Options</h3></div>', unsafe_allow_html=True) |
|
show_models = st.checkbox("Show Models", value=True) |
|
show_datasets = st.checkbox("Show Datasets", value=True) |
|
show_spaces = st.checkbox("Show Spaces", value=True) |
|
|
|
|
|
st.markdown(f'<h1 style="text-align: center; color: #1E88E5; margin-bottom: 2rem;">π€ Hugging Face Contributions</h1>', unsafe_allow_html=True) |
|
|
|
if username: |
|
|
|
header_col1, header_col2 = st.columns([1, 2]) |
|
with header_col1: |
|
st.markdown(f'<div style="background-color: #E3F2FD; padding: 20px; border-radius: 10px; border-left: 5px solid #1E88E5;">' |
|
f'<h2 style="color: #1E88E5;">π€ {username}</h2>' |
|
f'<p style="font-size: 16px;">Analyzing contributions for {selected_year}</p>' |
|
f'<p><a href="https://huggingface.co/{username}" target="_blank" style="color: #1E88E5; font-weight: bold;">View Profile</a></p>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
with header_col2: |
|
|
|
st.markdown(f'<div style="background-color: #F3E5F5; padding: 20px; border-radius: 10px; border-left: 5px solid #9C27B0;">' |
|
f'<h3 style="color: #9C27B0;">About This Analysis</h3>' |
|
f'<p>This dashboard analyzes {username}\'s contributions to Hugging Face in {selected_year}, including models, datasets, and spaces.</p>' |
|
f'<p style="font-style: italic; font-size: 12px;">* Some metrics like follower growth are simulated for visualization purposes.</p>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
with st.spinner(f"Fetching contribution data for {username}..."): |
|
|
|
overall_rank = None |
|
spaces_rank = None |
|
models_rank = None |
|
spaces_count = 0 |
|
models_count = 0 |
|
datasets_count = 0 |
|
|
|
|
|
if username in trending_accounts[:100]: |
|
overall_rank = trending_accounts.index(username) + 1 |
|
|
|
|
|
st.markdown(f'<div style="background-color: #FFF8E1; padding: 20px; border-radius: 10px; border-left: 5px solid #FFC107; margin: 1rem 0;">' |
|
f'<h2 style="color: #FFA000; text-align: center;">π Ranked #{overall_rank} in Top Contributors</h2>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
|
|
for i, (owner, count) in enumerate(top_owners_spaces): |
|
if owner == username: |
|
spaces_rank = i+1 |
|
spaces_count = count |
|
break |
|
|
|
|
|
for i, (owner, count) in enumerate(top_owners_models): |
|
if owner == username: |
|
models_rank = i+1 |
|
models_count = count |
|
break |
|
|
|
|
|
rank_chart = create_ranking_chart(username, overall_rank, spaces_rank, models_rank) |
|
if rank_chart: |
|
st.pyplot(rank_chart) |
|
|
|
|
|
commits_by_type = {} |
|
commit_counts_by_type = {} |
|
|
|
|
|
types_to_fetch = [] |
|
if show_models: |
|
types_to_fetch.append("model") |
|
if show_datasets: |
|
types_to_fetch.append("dataset") |
|
if show_spaces: |
|
types_to_fetch.append("space") |
|
|
|
if not types_to_fetch: |
|
st.warning("Please select at least one content type to display (Models, Datasets, or Spaces)") |
|
st.stop() |
|
|
|
|
|
progress_container = st.container() |
|
progress_container.markdown('<h3 style="color: #1E88E5;">Fetching Repository Data...</h3>', unsafe_allow_html=True) |
|
progress_bar = progress_container.progress(0) |
|
|
|
|
|
for type_index, kind in enumerate(types_to_fetch): |
|
try: |
|
items = cached_list_items(username, kind) |
|
|
|
|
|
if kind == "model": |
|
models_count = len(items) |
|
elif kind == "dataset": |
|
datasets_count = len(items) |
|
elif kind == "space": |
|
spaces_count = len(items) |
|
|
|
repo_ids = [item.id for item in items] |
|
|
|
progress_container.info(f"Found {len(repo_ids)} {kind}s for {username}") |
|
|
|
|
|
chunk_size = 5 |
|
total_commits = 0 |
|
all_commit_dates = [] |
|
|
|
for i in range(0, len(repo_ids), chunk_size): |
|
chunk = repo_ids[i:i + chunk_size] |
|
with ThreadPoolExecutor(max_workers=min(5, len(chunk))) as executor: |
|
future_to_repo = { |
|
executor.submit(fetch_commits_for_repo, repo_id, kind, username, selected_year): repo_id |
|
for repo_id in chunk |
|
} |
|
for future in as_completed(future_to_repo): |
|
repo_commits, repo_count = future.result() |
|
if repo_commits: |
|
all_commit_dates.extend(repo_commits) |
|
total_commits += repo_count |
|
|
|
|
|
progress_per_type = 1.0 / len(types_to_fetch) |
|
current_type_progress = min(1.0, (i + len(chunk)) / max(1, len(repo_ids))) |
|
overall_progress = (type_index * progress_per_type) + (current_type_progress * progress_per_type) |
|
progress_bar.progress(overall_progress) |
|
|
|
commits_by_type[kind] = all_commit_dates |
|
commit_counts_by_type[kind] = total_commits |
|
|
|
except Exception as e: |
|
st.warning(f"Error fetching {kind}s for {username}: {str(e)}") |
|
commits_by_type[kind] = [] |
|
commit_counts_by_type[kind] = 0 |
|
|
|
|
|
progress_bar.progress(1.0) |
|
progress_container.success("Data fetching complete!") |
|
time.sleep(0.5) |
|
progress_container.empty() |
|
|
|
|
|
total_commits = sum(commit_counts_by_type.values()) |
|
|
|
|
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">Activity Overview</h2>', unsafe_allow_html=True) |
|
|
|
|
|
profile_col1, profile_col2 = st.columns([1, 2]) |
|
|
|
with profile_col1: |
|
|
|
st.markdown(f'<div style="background-color: white; padding: 20px; border-radius: 10px; box-shadow: 0 2px 10px rgba(0,0,0,0.1);">' |
|
f'<h3 style="color: #1E88E5; text-align: center; margin-bottom: 15px;">Contribution Stats</h3>' |
|
f'<div style="display: flex; justify-content: space-between; margin-bottom: 10px;">' |
|
f'<span style="font-weight: bold;">Total Commits:</span><span>{total_commits}</span></div>' |
|
f'<div style="display: flex; justify-content: space-between; margin-bottom: 10px;">' |
|
f'<span style="font-weight: bold;">Models:</span><span>{models_count}</span></div>' |
|
f'<div style="display: flex; justify-content: space-between; margin-bottom: 10px;">' |
|
f'<span style="font-weight: bold;">Datasets:</span><span>{datasets_count}</span></div>' |
|
f'<div style="display: flex; justify-content: space-between; margin-bottom: 10px;">' |
|
f'<span style="font-weight: bold;">Spaces:</span><span>{spaces_count}</span></div>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
|
|
model_commits = commit_counts_by_type.get("model", 0) |
|
dataset_commits = commit_counts_by_type.get("dataset", 0) |
|
space_commits = commit_counts_by_type.get("space", 0) |
|
|
|
pie_chart = create_contribution_pie(model_commits, dataset_commits, space_commits) |
|
if pie_chart: |
|
st.pyplot(pie_chart) |
|
|
|
with profile_col2: |
|
|
|
radar_fig = create_contribution_radar(username, models_count, spaces_count, datasets_count, total_commits) |
|
st.pyplot(radar_fig) |
|
|
|
|
|
all_commits = [] |
|
for commits in commits_by_type.values(): |
|
all_commits.extend(commits) |
|
all_df = pd.DataFrame(all_commits, columns=["date"]) |
|
if not all_df.empty: |
|
all_df = all_df.drop_duplicates() |
|
|
|
|
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">Contribution Calendar</h2>', unsafe_allow_html=True) |
|
|
|
if not all_df.empty: |
|
make_calendar_heatmap(all_df, "All Contributions", selected_year) |
|
else: |
|
st.info(f"No contributions found for {username} in {selected_year}") |
|
|
|
|
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">Monthly Activity</h2>', unsafe_allow_html=True) |
|
|
|
monthly_fig = create_monthly_activity(all_df, selected_year) |
|
if monthly_fig: |
|
st.pyplot(monthly_fig) |
|
else: |
|
st.info(f"No activity data available for {username} in {selected_year}") |
|
|
|
|
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">Growth Projection</h2>', unsafe_allow_html=True) |
|
st.markdown('<div style="background-color: #EDE7F6; padding: 10px; border-radius: 5px; margin-bottom: 15px;">' |
|
'<p style="font-style: italic; margin: 0;">π This is a simulation based on contribution metrics - for visualization purposes only</p>' |
|
'</div>', unsafe_allow_html=True) |
|
|
|
follower_chart = simulate_follower_data(username, spaces_count, models_count, total_commits) |
|
st.pyplot(follower_chart) |
|
|
|
|
|
if total_commits > 0: |
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">π Analytics Summary</h2>', unsafe_allow_html=True) |
|
|
|
|
|
monthly_df = pd.DataFrame(all_commits, columns=["date"]) |
|
monthly_df['date'] = pd.to_datetime(monthly_df['date']) |
|
monthly_df['month'] = monthly_df['date'].dt.month |
|
|
|
if not monthly_df.empty: |
|
most_active_month = monthly_df['month'].value_counts().idxmax() |
|
month_name = datetime(2020, most_active_month, 1).strftime('%B') |
|
|
|
|
|
st.markdown(f'<div style="background-color: white; padding: 25px; border-radius: 10px; box-shadow: 0 2px 10px rgba(0,0,0,0.1);">' |
|
f'<h3 style="color: #1E88E5; border-bottom: 1px solid #E0E0E0; padding-bottom: 10px;">Activity Analysis for {username}</h3>' |
|
f'<ul style="list-style-type: none; padding-left: 5px;">' |
|
f'<li style="margin: 15px 0; font-size: 16px;">π <strong>Total Activity:</strong> {total_commits} contributions in {selected_year}</li>' |
|
f'<li style="margin: 15px 0; font-size: 16px;">ποΈ <strong>Most Active Month:</strong> {month_name} with {monthly_df["month"].value_counts().max()} contributions</li>' |
|
f'<li style="margin: 15px 0; font-size: 16px;">𧩠<strong>Repository Breakdown:</strong> {models_count} Models, {spaces_count} Spaces, {datasets_count} Datasets</li>' |
|
f'</ul>', unsafe_allow_html=True) |
|
|
|
|
|
if overall_rank: |
|
percentile = 100 - overall_rank |
|
st.markdown(f'<div style="margin-top: 20px;">' |
|
f'<h3 style="color: #1E88E5; border-bottom: 1px solid #E0E0E0; padding-bottom: 10px;">Ranking Analysis</h3>' |
|
f'<ul style="list-style-type: none; padding-left: 5px;">' |
|
f'<li style="margin: 15px 0; font-size: 16px;">π <strong>Overall Ranking:</strong> #{overall_rank} (Top {percentile}% of contributors)</li>', unsafe_allow_html=True) |
|
|
|
badge_html = '<div style="margin: 20px 0;">' |
|
|
|
if spaces_rank and spaces_rank <= 10: |
|
badge_html += f'<span style="background-color: #FFECB3; color: #FF6F00; padding: 8px 15px; border-radius: 20px; font-weight: bold; margin-right: 10px; display: inline-block; margin-bottom: 10px;">π Elite Spaces Contributor (#{spaces_rank})</span>' |
|
elif spaces_rank and spaces_rank <= 30: |
|
badge_html += f'<span style="background-color: #E1F5FE; color: #0277BD; padding: 8px 15px; border-radius: 20px; font-weight: bold; margin-right: 10px; display: inline-block; margin-bottom: 10px;">β¨ Outstanding Spaces Contributor (#{spaces_rank})</span>' |
|
|
|
if models_rank and models_rank <= 10: |
|
badge_html += f'<span style="background-color: #FFECB3; color: #FF6F00; padding: 8px 15px; border-radius: 20px; font-weight: bold; margin-right: 10px; display: inline-block; margin-bottom: 10px;">π Elite Models Contributor (#{models_rank})</span>' |
|
elif models_rank and models_rank <= 30: |
|
badge_html += f'<span style="background-color: #E1F5FE; color: #0277BD; padding: 8px 15px; border-radius: 20px; font-weight: bold; margin-right: 10px; display: inline-block; margin-bottom: 10px;">β¨ Outstanding Models Contributor (#{models_rank})</span>' |
|
|
|
badge_html += '</div>' |
|
|
|
|
|
if spaces_rank or models_rank: |
|
st.markdown(badge_html, unsafe_allow_html=True) |
|
|
|
st.markdown('</ul></div></div>', unsafe_allow_html=True) |
|
|
|
|
|
st.markdown(f'<h2 style="color: #1E88E5; border-bottom: 2px solid #E0E0E0; padding-bottom: 8px; margin-top: 2rem;">Detailed Category Analysis</h2>', unsafe_allow_html=True) |
|
|
|
|
|
cols = st.columns(len(types_to_fetch)) if types_to_fetch else st.columns(1) |
|
|
|
category_icons = { |
|
"model": "π§ ", |
|
"dataset": "π¦", |
|
"space": "π" |
|
} |
|
|
|
category_colors = { |
|
"model": "#FF9800", |
|
"dataset": "#2196F3", |
|
"space": "#4CAF50" |
|
} |
|
|
|
for i, kind in enumerate(types_to_fetch): |
|
with cols[i]: |
|
try: |
|
emoji = category_icons.get(kind, "π") |
|
label = kind.capitalize() + "s" |
|
color = category_colors.get(kind, "#1E88E5") |
|
|
|
total = len(cached_list_items(username, kind)) |
|
commits = commits_by_type.get(kind, []) |
|
commit_count = commit_counts_by_type.get(kind, 0) |
|
|
|
|
|
st.markdown(f'<div style="background-color: white; padding: 20px; border-radius: 10px; box-shadow: 0 2px 10px rgba(0,0,0,0.1); border-top: 5px solid {color};">' |
|
f'<h3 style="color: {color}; text-align: center;">{emoji} {label}</h3>' |
|
f'<div style="display: flex; justify-content: space-between; margin: 15px 0;">' |
|
f'<span style="font-weight: bold;">Total:</span><span>{total}</span></div>' |
|
f'<div style="display: flex; justify-content: space-between; margin-bottom: 15px;">' |
|
f'<span style="font-weight: bold;">Commits:</span><span>{commit_count}</span></div>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
|
|
df_kind = pd.DataFrame(commits, columns=["date"]) |
|
if not df_kind.empty: |
|
df_kind = df_kind.drop_duplicates() |
|
make_calendar_heatmap(df_kind, f"{label} Commits", selected_year) |
|
else: |
|
st.info(f"No {label.lower()} activity in {selected_year}") |
|
|
|
except Exception as e: |
|
st.warning(f"Error processing {kind.capitalize()}s: {str(e)}") |
|
|
|
st.markdown(f'<div style="background-color: white; padding: 20px; border-radius: 10px; box-shadow: 0 2px 10px rgba(0,0,0,0.1); border-top: 5px solid #9E9E9E; text-align: center;">' |
|
f'<h3 style="color: #9E9E9E;">β οΈ Error</h3>' |
|
f'<p>Could not load {kind.capitalize()}s data</p>' |
|
f'</div>', unsafe_allow_html=True) |
|
|
|
|
|
st.markdown('<hr style="margin: 3rem 0 1rem 0;">', unsafe_allow_html=True) |
|
st.markdown('<p style="text-align: center; color: #9E9E9E; font-size: 0.8rem;">Hugging Face Contributions Dashboard | Data fetched from Hugging Face API</p>', unsafe_allow_html=True) |
|
else: |
|
|
|
st.markdown(f'<div style="text-align: center; margin: 50px 0;">' |
|
f'<img src="https://huggingface.co/datasets/huggingface/brand-assets/resolve/main/hf-logo.svg" style="width: 200px; margin-bottom: 30px;">' |
|
f'<h2>Welcome to Hugging Face Contributions Dashboard</h2>' |
|
f'<p style="font-size: 1.2rem;">Please select a contributor from the sidebar to view their activity.</p>' |
|
f'</div>', unsafe_allow_html=True) |