librarian-bot committed on
Commit
4992d0d
·
1 Parent(s): 931a9a7

Upload 4 files

Browse files
Files changed (4) hide show
  1. app.py +100 -0
  2. description.html +21 -0
  3. requirements.in +8 -0
  4. requirements.txt +226 -0
app.py ADDED
@@ -0,0 +1,100 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ from typing import Any, List
2
+ import gradio as gr
3
+ from toolz import concat, frequencies
4
+ import httpx
5
+ from functools import lru_cache
6
+ import pandas as pd
7
+ import plotly.express as px
8
+ import polars as pl
9
+ from pathlib import Path
10
+ from datetime import datetime
11
+
12
+ librarian_bot_avatar = "https://aeiljuispo.cloudimg.io/v7/https://s3.amazonaws.com/moonup/production/uploads/1674830754237-63d3e0e8ff1384ce6c5dd17d.jpeg?w=200&h=200&f=face"
13
+
14
+
15
@lru_cache(maxsize=512)
def get_hub_community_activity(user: str) -> List[Any]:
    """Fetch up to ~2000 recent discussion/PR activity items for *user* from the Hub API.

    Pages through the `recent-activity` endpoint 100 items at a time and
    flattens the pages into a single list. Results are cached per user for
    the lifetime of the process (lru_cache).
    """
    all_data = []
    # Start paging at skip=0 so the most recent activity item is included —
    # the original started at skip=1, which silently dropped the first entry
    # (assumes the API's `skip` is a zero-based offset; TODO confirm).
    for skip in range(0, 2000, 100):
        r = httpx.get(
            f"https://huggingface.co/api/recent-activity?limit=100&type=discussion&skip={skip}&user={user}"
        )
        # Fail loudly on HTTP errors instead of raising a confusing KeyError
        # from the .json() lookup below.
        r.raise_for_status()
        activity = r.json()["recentActivity"]
        if not activity:
            # No more pages — stop issuing requests early.
            break
        all_data.append(activity)
    return list(concat(all_data))
25
+
26
+
27
@lru_cache(maxsize=512)
def get_pr_status(user: str):
    """Return a mapping of PR status -> count for pull requests opened by *user*.

    Only activity items flagged as pull requests are counted; the result is a
    plain dict keyed by status (e.g. "open", "closed", "merged").
    """
    counts: dict = {}
    for item in get_hub_community_activity(user):
        discussion = item["discussionData"]
        if discussion["isPullRequest"]:
            status = discussion["status"]
            counts[status] = counts.get(status, 0) + 1
    return counts
34
+
35
+
36
def create_pie():
    """Render a pie chart of librarian-bot PR statuses as a Gradio Plot component."""
    # Named `status_counts` (not `frequencies`) so we don't shadow the
    # module-level `frequencies` function imported from toolz.
    status_counts = get_pr_status("librarian-bot")
    df = pd.DataFrame(
        {"status": status_counts.keys(), "number": status_counts.values()}
    )
    fig = px.pie(df, values="number", names="status", template="seaborn")
    return gr.Plot(fig)
41
+
42
+
43
def parse_date_time(date_time: str) -> datetime:
    """Parse a Hub API timestamp such as '2023-03-01T12:34:56.789Z' into a datetime."""
    hub_timestamp_format = "%Y-%m-%dT%H:%M:%S.%fZ"
    return datetime.strptime(date_time, hub_timestamp_format)
45
+
46
+
47
def parse_pr_data(data):
    """Flatten one raw activity record into {createdAt, pr_number, status, repo_id}."""
    discussion = data["discussionData"]
    # Timestamp format used by the Hub API, e.g. '2023-03-01T12:34:56.789Z'.
    created_at = datetime.strptime(discussion["createdAt"], "%Y-%m-%dT%H:%M:%S.%fZ")
    return {
        "createdAt": created_at,
        "pr_number": discussion["num"],
        "status": discussion["status"],
        "repo_id": discussion["repo"]["name"],
    }
59
+
60
+
61
def group_status_by_pr_number():
    """Mean PR number per status for librarian-bot, returned as a pandas DataFrame."""
    raw = get_hub_community_activity("librarian-bot")
    parsed = [parse_pr_data(item) for item in raw]
    frame = pl.DataFrame(parsed)
    grouped = frame.groupby("status").agg(pl.mean("pr_number"))
    return grouped.to_pandas()
67
+
68
+
69
def plot_over_time():
    """Cumulative librarian-bot PR counts over time, split by status, as a plotly line figure."""
    all_data = get_hub_community_activity("librarian-bot")
    all_data = [parse_pr_data(d) for d in all_data]
    # Truncate timestamps to calendar dates so PRs group by day.
    df = pl.DataFrame(all_data).with_columns(pl.col("createdAt").cast(pl.Date))
    # Pivot to one column per status, counting PRs per day
    # (polars 0.16 pivot API — later versions renamed these parameters).
    df = df.pivot(
        values=["status"],
        index=["createdAt"],
        columns=["status"],
        aggregate_function="count",
    )
    # Days with no PRs of a given status become 0 instead of null.
    df = df.fill_null(0)
    # NOTE(review): in polars 0.16, pl.sum over a list of column names sums
    # horizontally into a "sum" column; this API changed in later polars —
    # confirm before upgrading. Assumes all three statuses appear in the data,
    # otherwise the missing column raises — TODO confirm.
    df = df.with_columns(pl.sum(["open", "closed", "merged"])).sort("createdAt")
    # Running totals per status; the helper "sum" column is excluded from the plot.
    df = df.to_pandas().set_index("createdAt").cumsum()
    return px.line(df, x=df.index, y=[c for c in df.columns if c != "sum"])
83
+
84
+
85
# Build the dashboard layout. NOTE: named `status_counts` instead of
# `frequencies` — the original rebound the module-level name `frequencies`,
# shadowing the toolz function that get_pr_status calls internally; only the
# lru_cache hit prevented a crash on later calls.
with gr.Blocks() as demo:
    status_counts = get_pr_status("librarian-bot")
    gr.HTML(Path("description.html").read_text())
    gr.Markdown(f"Total PRs opened: {sum(status_counts.values())}")
    with gr.Column():
        gr.Markdown("## Pull requests Status")
        gr.Markdown(
            "The below pie chart shows the percentage of pull requests made by librarian bot that are open, closed or merged"
        )
        create_pie()
    with gr.Column():
        gr.Markdown("## Pull requests status by PR number")
        gr.DataFrame(group_status_by_pr_number())
    with gr.Column():
        gr.Plot(plot_over_time())
# Launch at import time — intended for Hugging Face Spaces, which runs app.py directly.
demo.launch(debug=True)
description.html ADDED
@@ -0,0 +1,21 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ <!DOCTYPE html>
2
+ <html>
3
+ <head>
4
+ <meta name="viewport" content="width=device-width, initial-scale=1">
5
+ <style>
6
+ .avatar {
7
+ vertical-align: middle;
8
+ width: 50px;
9
+ height: 50px;
10
+ border-radius: 50%;
11
+ }
12
+ </style>
13
+ </head>
14
+ <body>
15
+
16
+ <h1>Librarian Bot Dashboard</h1>
17
+ <img align="left" src="https://aeiljuispo.cloudimg.io/v7/https://s3.amazonaws.com/moonup/production/uploads/1674830754237-63d3e0e8ff1384ce6c5dd17d.jpeg?w=200&h=200&f=face" alt="Avatar" class="avatar">
18
+ <p>Librarian-bot is a bot that suggests changes to metadata for models and datasets hosted on the hub. This dashboard gives an overview of these pull requests</p>
19
+
20
+ </body>
21
+ </html>
requirements.in ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ httpx
2
+ toolz
3
+ gradio
4
+ plotly
5
+ pandas
6
+ polars
7
+ datasets
8
+ pyarrow
requirements.txt ADDED
@@ -0,0 +1,226 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ #
2
+ # This file is autogenerated by pip-compile with Python 3.11
3
+ # by the following command:
4
+ #
5
+ # pip-compile --resolver=backtracking requirements.in
6
+ #
7
+ aiofiles==23.1.0
8
+ # via gradio
9
+ aiohttp==3.8.4
10
+ # via
11
+ # datasets
12
+ # fsspec
13
+ # gradio
14
+ aiosignal==1.3.1
15
+ # via aiohttp
16
+ altair==4.2.2
17
+ # via gradio
18
+ anyio==3.6.2
19
+ # via
20
+ # httpcore
21
+ # starlette
22
+ async-timeout==4.0.2
23
+ # via aiohttp
24
+ attrs==22.2.0
25
+ # via
26
+ # aiohttp
27
+ # jsonschema
28
+ certifi==2022.12.7
29
+ # via
30
+ # httpcore
31
+ # httpx
32
+ # requests
33
+ charset-normalizer==3.1.0
34
+ # via
35
+ # aiohttp
36
+ # requests
37
+ click==8.1.3
38
+ # via uvicorn
39
+ contourpy==1.0.7
40
+ # via matplotlib
41
+ cycler==0.11.0
42
+ # via matplotlib
43
+ datasets==2.10.1
44
+ # via -r requirements.in
45
+ dill==0.3.6
46
+ # via
47
+ # datasets
48
+ # multiprocess
49
+ entrypoints==0.4
50
+ # via altair
51
+ fastapi==0.95.0
52
+ # via gradio
53
+ ffmpy==0.3.0
54
+ # via gradio
55
+ filelock==3.10.6
56
+ # via huggingface-hub
57
+ fonttools==4.39.2
58
+ # via matplotlib
59
+ frozenlist==1.3.3
60
+ # via
61
+ # aiohttp
62
+ # aiosignal
63
+ fsspec[http]==2023.3.0
64
+ # via
65
+ # datasets
66
+ # gradio
67
+ gradio==3.23.0
68
+ # via -r requirements.in
69
+ h11==0.14.0
70
+ # via
71
+ # httpcore
72
+ # uvicorn
73
+ httpcore==0.16.3
74
+ # via httpx
75
+ httpx==0.23.3
76
+ # via
77
+ # -r requirements.in
78
+ # gradio
79
+ huggingface-hub==0.13.3
80
+ # via
81
+ # datasets
82
+ # gradio
83
+ idna==3.4
84
+ # via
85
+ # anyio
86
+ # requests
87
+ # rfc3986
88
+ # yarl
89
+ jinja2==3.1.2
90
+ # via
91
+ # altair
92
+ # gradio
93
+ jsonschema==4.17.3
94
+ # via altair
95
+ kiwisolver==1.4.4
96
+ # via matplotlib
97
+ linkify-it-py==2.0.0
98
+ # via markdown-it-py
99
+ markdown-it-py[linkify]==2.2.0
100
+ # via
101
+ # gradio
102
+ # mdit-py-plugins
103
+ markupsafe==2.1.2
104
+ # via
105
+ # gradio
106
+ # jinja2
107
+ matplotlib==3.7.1
108
+ # via gradio
109
+ mdit-py-plugins==0.3.3
110
+ # via gradio
111
+ mdurl==0.1.2
112
+ # via markdown-it-py
113
+ multidict==6.0.4
114
+ # via
115
+ # aiohttp
116
+ # yarl
117
+ multiprocess==0.70.14
118
+ # via datasets
119
+ numpy==1.24.2
120
+ # via
121
+ # altair
122
+ # contourpy
123
+ # datasets
124
+ # gradio
125
+ # matplotlib
126
+ # pandas
127
+ # pyarrow
128
+ orjson==3.8.8
129
+ # via gradio
130
+ packaging==23.0
131
+ # via
132
+ # datasets
133
+ # huggingface-hub
134
+ # matplotlib
135
+ pandas==1.5.3
136
+ # via
137
+ # -r requirements.in
138
+ # altair
139
+ # datasets
140
+ # gradio
141
+ pillow==9.4.0
142
+ # via
143
+ # gradio
144
+ # matplotlib
145
+ plotly==5.13.1
146
+ # via -r requirements.in
147
+ polars==0.16.16
148
+ # via -r requirements.in
149
+ pyarrow==11.0.0
150
+ # via
151
+ # -r requirements.in
152
+ # datasets
153
+ pydantic==1.10.7
154
+ # via
155
+ # fastapi
156
+ # gradio
157
+ pydub==0.25.1
158
+ # via gradio
159
+ pyparsing==3.0.9
160
+ # via matplotlib
161
+ pyrsistent==0.19.3
162
+ # via jsonschema
163
+ python-dateutil==2.8.2
164
+ # via
165
+ # matplotlib
166
+ # pandas
167
+ python-multipart==0.0.6
168
+ # via gradio
169
+ pytz==2023.2
170
+ # via pandas
171
+ pyyaml==6.0
172
+ # via
173
+ # datasets
174
+ # gradio
175
+ # huggingface-hub
176
+ requests==2.28.2
177
+ # via
178
+ # datasets
179
+ # fsspec
180
+ # gradio
181
+ # huggingface-hub
182
+ # responses
183
+ responses==0.18.0
184
+ # via datasets
185
+ rfc3986[idna2008]==1.5.0
186
+ # via httpx
187
+ semantic-version==2.10.0
188
+ # via gradio
189
+ six==1.16.0
190
+ # via python-dateutil
191
+ sniffio==1.3.0
192
+ # via
193
+ # anyio
194
+ # httpcore
195
+ # httpx
196
+ starlette==0.26.1
197
+ # via fastapi
198
+ tenacity==8.2.2
199
+ # via plotly
200
+ toolz==0.12.0
201
+ # via
202
+ # -r requirements.in
203
+ # altair
204
+ tqdm==4.65.0
205
+ # via
206
+ # datasets
207
+ # huggingface-hub
208
+ typing-extensions==4.5.0
209
+ # via
210
+ # gradio
211
+ # huggingface-hub
212
+ # pydantic
213
+ uc-micro-py==1.0.1
214
+ # via linkify-it-py
215
+ urllib3==1.26.15
216
+ # via
217
+ # requests
218
+ # responses
219
+ uvicorn==0.21.1
220
+ # via gradio
221
+ websockets==10.4
222
+ # via gradio
223
+ xxhash==3.2.0
224
+ # via datasets
225
+ yarl==1.8.2
226
+ # via aiohttp