Korea-Leaderboard

Running on Zero

App Files Files Community

openfree committed on Dec 14, 2024

Commit

dad05a7

verified ·

1 Parent(s): 58008e9

Update app.py

Browse files

Files changed (1) hide show

app.py +6 -89

app.py CHANGED Viewed

@@ -992,87 +992,6 @@ def refresh_data():
-# 먼저 target_datasets 딕셔너리를 추가합니다
-target_datasets = {
-    "aiqtech/kolaw": "https://huggingface.co/datasets/aiqtech/kolaw",
-    # 추가 데이터셋은 여기에 계속 추가할 수 있습니다
-}
-def get_datasets_data(progress=gr.Progress()):
-    """데이터셋 데이터 가져오기"""
-    def calculate_rank(dataset_id, all_global_datasets, korea_datasets):
-        # 글로벌 순위 확인
-        global_rank = next((idx for idx, d in enumerate(all_global_datasets, 1)
-                          if d.get('id', '').strip() == dataset_id.strip()), None)
-        # Korea 데이터셋인 경우
-        is_korea = any(d.get('id', '').strip() == dataset_id.strip() for d in korea_datasets)
-        if is_korea:
-            # Korea 데이터셋 중에서의 순위 확인
-            korea_rank = next((idx for idx, d in enumerate(korea_datasets, 1)
-                             if d.get('id', '').strip() == dataset_id.strip()), None)
-            if korea_rank:
-                return min(global_rank or 3001, korea_rank + 1000), True
-        return global_rank if global_rank else 'Not in top 3000', is_korea
-    try:
-        progress(0, desc="Fetching datasets...")
-        if not HF_TOKEN:
-            fig = create_error_plot()
-            error_html = """
-            <div style='padding: 20px; background: #fee; border-radius: 10px; margin: 10px 0;'>
-                <h3 style='color: #c00;'>⚠️ API 인증이 필요합니다</h3>
-                <p>HuggingFace API 토큰이 설정되지 않았습니다.</p>
-            </div>
-            """
-            empty_df = pd.DataFrame(columns=['Global Rank', 'Dataset ID', 'Title', 'Downloads', 'Likes', 'Korea Search', 'URL'])
-            return fig, error_html, empty_df
-        # 일반 데이터셋과 Korea 관련 데이터셋 가져오기
-        params = {
-            'limit': 3000,
-            'full': 'true'
-        }
-        all_datasets_response = requests.get(
-            "https://huggingface.co/api/datasets",
-            headers={'Authorization': f'Bearer {HF_TOKEN}'},
-            params=params
-        )
-        korea_params = {
-            'search': 'korea',
-            'limit': 3000,
-            'full': 'true'
-        }
-        korea_datasets_response = requests.get(
-            "https://huggingface.co/api/datasets",
-            headers={'Authorization': f'Bearer {HF_TOKEN}'},
-            params=korea_params
-        )
-        all_global_datasets = all_datasets_response.json()
-        korea_datasets = korea_datasets_response.json()
-        # 시각화를 위한 Figure 생성
-        fig = go.Figure()
-        # 순위 정보 수집
-        filtered_datasets = []
-        for dataset_id in target_datasets.keys():
-            try:
-                normalized_id = dataset_id.strip('/')
-                dataset_url_api = f"https://huggingface.co/api/datasets/{normalized_id}"
-                response# 먼저 target_datasets 딕셔너리를 추가합니다
 target_datasets = {
     "aiqtech/kolaw": "https://huggingface.co/datasets/aiqtech/kolaw",
     "heegyu/korquad-v1-v2": "https://huggingface.co/datasets/heegyu/korquad-v1-v2",
@@ -1089,8 +1008,6 @@ target_datasets = {
 }
 def get_datasets_data(progress=gr.Progress()):
-    try:
     def calculate_rank(dataset_id, all_global_datasets, korea_datasets):
         # 글로벌 순위 확인
         global_rank = next((idx for idx, d in enumerate(all_global_datasets, 1)
@@ -1100,7 +1017,6 @@ def get_datasets_data(progress=gr.Progress()):
         is_korea = any(d.get('id', '').strip() == dataset_id.strip() for d in korea_datasets)
         if is_korea:
-            # Korea 데이터셋 중에서의 순위 확인
             korea_rank = next((idx for idx, d in enumerate(korea_datasets, 1)
                              if d.get('id', '').strip() == dataset_id.strip()), None)
@@ -1283,7 +1199,9 @@ def get_datasets_data(progress=gr.Progress()):
         progress(1.0, desc="Complete!")
         return fig, html_content, df
     except Exception as e:
         print(f"Error in get_datasets_data: {str(e)}")
         error_fig = create_error_plot()
@@ -1296,7 +1214,7 @@ def get_datasets_data(progress=gr.Progress()):
         empty_df = pd.DataFrame(columns=['Global Rank', 'Dataset ID', 'Title', 'Downloads', 'Likes', 'Korea Search', 'URL'])
         return error_fig, error_html, empty_df
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
     # 🤗 허깅페이스 '한국(언어) 리더보드'
@@ -1345,13 +1263,12 @@ with gr.Blocks(theme=gr.themes.Soft()) as demo:
     datasets_results = get_datasets_data()
     trending_plot.value, trending_info.value, trending_df.value = spaces_results
-    models_plot.value, models_
 # Gradio 앱 실행
 demo.launch(
     server_name="0.0.0.0",
     server_port=7860,
     share=False
-)

 target_datasets = {
     "aiqtech/kolaw": "https://huggingface.co/datasets/aiqtech/kolaw",
     "heegyu/korquad-v1-v2": "https://huggingface.co/datasets/heegyu/korquad-v1-v2",
 }
 def get_datasets_data(progress=gr.Progress()):
     def calculate_rank(dataset_id, all_global_datasets, korea_datasets):
         # 글로벌 순위 확인
         global_rank = next((idx for idx, d in enumerate(all_global_datasets, 1)
         is_korea = any(d.get('id', '').strip() == dataset_id.strip() for d in korea_datasets)
         if is_korea:
             korea_rank = next((idx for idx, d in enumerate(korea_datasets, 1)
                              if d.get('id', '').strip() == dataset_id.strip()), None)
         progress(1.0, desc="Complete!")
         return fig, html_content, df
     except Exception as e:
         print(f"Error in get_datasets_data: {str(e)}")
         error_fig = create_error_plot()
         empty_df = pd.DataFrame(columns=['Global Rank', 'Dataset ID', 'Title', 'Downloads', 'Likes', 'Korea Search', 'URL'])
         return error_fig, error_html, empty_df
 with gr.Blocks(theme=gr.themes.Soft()) as demo:
     gr.Markdown("""
     # 🤗 허깅페이스 '한국(언어) 리더보드'
     datasets_results = get_datasets_data()
     trending_plot.value, trending_info.value, trending_df.value = spaces_results
+    models_plot.value, models_info.value, models_df.value = models_results
+    datasets_plot.value, datasets_info.value, datasets_df.value = datasets_results
 # Gradio 앱 실행
 demo.launch(
     server_name="0.0.0.0",
     server_port=7860,
     share=False
+)