Korea-Leaderboard

Running

App Files Community

openfree committed on Dec 14, 2024

Commit

b50e7a2

verified ·

1 Parent(s): 1fed40f

Update app.py

Browse files

Files changed (1) hide show

app.py +38 -54

app.py CHANGED Viewed

@@ -319,28 +319,34 @@ def get_korea_models():
         print(f"Error fetching Korea models: {str(e)}")
         return []
-def get_all_models(limit=1000):
     """모든 모델과 Korea 관련 모델 가져오기"""
     all_models = []
-    # 1. 일반 모델 리스트 가져오기
-    params = {
-        "limit": limit,
-        "full": "True",
-        "config": "True"
-    }
-    response = requests.get(
-        "https://huggingface.co/api/models",
-        headers={'Accept': 'application/json'},
-        params=params
-    )
-    if response.status_code == 200:
-        all_models.extend(response.json())
-        print(f"Fetched {len(all_models)} general models")
-    # 2. Korea 검색 결과 가져오기
     korea_params = {
         "search": "korea",
         "full": "True",
@@ -365,30 +371,6 @@ def get_all_models(limit=1000):
                 all_models.append(model)
                 existing_ids.add(model.get('id', ''))
-    # 3. Korean 검색 결과 가져오기
-    korean_params = {
-        "search": "korean",
-        "full": "True",
-        "config": "True",
-        "limit": limit
-    }
-    korean_response = requests.get(
-        "https://huggingface.co/api/models",
-        headers={'Accept': 'application/json'},
-        params=korean_params
-    )
-    if korean_response.status_code == 200:
-        korean_models = korean_response.json()
-        print(f"Fetched {len(korean_models)} Korean-related models")
-        # 중복 제거하면서 Korean 모델 추가
-        for model in korean_models:
-            if model.get('id', '') not in existing_ids:
-                all_models.append(model)
-                existing_ids.add(model.get('id', ''))
     print(f"Total unique models: {len(all_models)}")
     return all_models[:limit]
@@ -407,8 +389,8 @@ def get_models_data(progress=gr.Progress()):
             empty_df = pd.DataFrame(columns=['Global Rank', 'Model ID', 'Title', 'Downloads', 'Likes', 'Korea Search', 'URL'])
             return fig, error_html, empty_df
-        # 일반 모델과 Korea 관련 모델 모두 가져오기
-        all_global_models = get_all_models(limit=1000)
         korea_models = get_korea_models()
         # 모든 모델 통합 (중복 제거)
@@ -439,7 +421,7 @@ def get_models_data(progress=gr.Progress()):
                     filtered_models.append({
                         'id': model_id,
                         'global_rank': next((idx for idx, m in enumerate(all_models, 1)
-                                          if m.get('id', '').strip() == model_id.strip()), 'Not in top 1000'),
                         'downloads': model_data.get('downloads', 0),
                         'likes': model_data.get('likes', 0),
                         'title': model_data.get('title', 'No Title'),
@@ -448,7 +430,7 @@ def get_models_data(progress=gr.Progress()):
                 else:
                     filtered_models.append({
                         'id': model_id,
-                        'global_rank': 'Not in top 1000',
                         'downloads': 0,
                         'likes': 0,
                         'title': 'No Title',
@@ -470,7 +452,7 @@ def get_models_data(progress=gr.Progress()):
             fig.add_trace(go.Bar(
                 x=ids,
-                y=[1001 - r for r in ranks],  # Y축 반전
                 text=[f"Rank: #{r}<br>Downloads: {format(m['downloads'], ',')}<br>Likes: {format(m['likes'], ',')}"
                       for r, m in zip(ranks, valid_models)],
                 textposition='auto',
@@ -480,27 +462,29 @@ def get_models_data(progress=gr.Progress()):
             ))
             fig.update_layout(
-                title="HuggingFace Models Global Rankings",
                 xaxis_title="Model ID",
                 yaxis_title="Global Rank",
                 yaxis=dict(
-                    ticktext=[f"#{i}" for i in range(1, 1001, 50)],
-                    tickvals=[1001 - i for i in range(1, 1001, 50)],
-                    range=[0, 1000]
                 ),
                 height=800,
-                showlegend=False
             )
         # HTML 카드 생성
         html_content = """
         <div style='padding: 20px; background: #f5f5f5;'>
-            <h2 style='color: #2c3e50;'>Models Rankings</h2>
             <div style='display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px;'>
         """
         for model in filtered_models:
-            rank_display = f"Global Rank #{model['global_rank']}" if isinstance(model['global_rank'], (int, float)) else "Not in top 1000"
             korea_badge = "🇰🇷 Korea Search Result" if model['is_korea'] else ""
             html_content += f"""

         print(f"Error fetching Korea models: {str(e)}")
         return []
+def get_all_models(limit=3000):
     """모든 모델과 Korea 관련 모델 가져오기"""
     all_models = []
+    page_size = 1000  # API의 한 번 요청당 최대 크기
+    # 여러 페이지에 걸쳐 데이터 수집
+    for offset in range(0, limit, page_size):
+        params = {
+            'limit': min(page_size, limit - offset),
+            'full': 'True',
+            'config': 'True',
+            'offset': offset
+        }
+        response = requests.get(
+            "https://huggingface.co/api/models",
+            headers={'Accept': 'application/json'},
+            params=params
+        )
+        if response.status_code == 200:
+            all_models.extend(response.json())
+            print(f"Fetched models {offset+1} to {offset+len(response.json())}")
+        else:
+            print(f"Failed to fetch models at offset {offset}: {response.status_code}")
+            break
+    # Korea 검색 결과도 동일하게 확장
     korea_params = {
         "search": "korea",
         "full": "True",
                 all_models.append(model)
                 existing_ids.add(model.get('id', ''))
     print(f"Total unique models: {len(all_models)}")
     return all_models[:limit]
             empty_df = pd.DataFrame(columns=['Global Rank', 'Model ID', 'Title', 'Downloads', 'Likes', 'Korea Search', 'URL'])
             return fig, error_html, empty_df
+        # 일반 모델과 Korea 관련 모델 모두 가져오기 (3000위까지)
+        all_global_models = get_all_models(limit=3000)
         korea_models = get_korea_models()
         # 모든 모델 통합 (중복 제거)
                     filtered_models.append({
                         'id': model_id,
                         'global_rank': next((idx for idx, m in enumerate(all_models, 1)
+                                          if m.get('id', '').strip() == model_id.strip()), 'Not in top 3000'),
                         'downloads': model_data.get('downloads', 0),
                         'likes': model_data.get('likes', 0),
                         'title': model_data.get('title', 'No Title'),
                 else:
                     filtered_models.append({
                         'id': model_id,
+                        'global_rank': 'Not in top 3000',
                         'downloads': 0,
                         'likes': 0,
                         'title': 'No Title',
             fig.add_trace(go.Bar(
                 x=ids,
+                y=[3001 - r for r in ranks],  # Y축 범위 3000까지 확장
                 text=[f"Rank: #{r}<br>Downloads: {format(m['downloads'], ',')}<br>Likes: {format(m['likes'], ',')}"
                       for r, m in zip(ranks, valid_models)],
                 textposition='auto',
             ))
             fig.update_layout(
+                title="HuggingFace Models Global Rankings (Up to #3000)",
                 xaxis_title="Model ID",
                 yaxis_title="Global Rank",
                 yaxis=dict(
+                    ticktext=[f"#{i}" for i in range(1, 3001, 100)],
+                    tickvals=[3001 - i for i in range(1, 3001, 100)],
+                    range=[0, 3000]
                 ),
                 height=800,
+                showlegend=False,
+                template='plotly_white',
+                xaxis_tickangle=-45
             )
         # HTML 카드 생성
         html_content = """
         <div style='padding: 20px; background: #f5f5f5;'>
+            <h2 style='color: #2c3e50;'>Models Rankings (Up to #3000)</h2>
             <div style='display: grid; grid-template-columns: repeat(auto-fill, minmax(300px, 1fr)); gap: 20px;'>
         """
         for model in filtered_models:
+            rank_display = f"Global Rank #{model['global_rank']}" if isinstance(model['global_rank'], (int, float)) else "Not in top 3000"
             korea_badge = "🇰🇷 Korea Search Result" if model['is_korea'] else ""
             html_content += f"""