Spaces:

avid-ml
/

indie-label

Running

App Files Files Community

Michelle Lam committed on Jan 26, 2024

Commit

4021c8c

unverified ·

2 Parent(s): 37d1f1c b77ac12

Merge pull request #1 from Christina-A-Pan/hf-refactor

Browse files

Files changed (2) hide show

audit_utils.py +90 -0
server.py +22 -0

audit_utils.py CHANGED Viewed

@@ -23,6 +23,7 @@ import time
 from sentence_transformers import SentenceTransformer, util
 import torch
 from bertopic import BERTopic
 ########################################
 # PRE-LOADING
@@ -314,6 +315,95 @@ def get_grp_model_labels(n_label_per_bin, score_bins, grp_ids):
     return ratings_grp
 ########################################
 # GET_PERSONALIZED_MODEL utils
 def fetch_existing_data(user, model_name):

 from sentence_transformers import SentenceTransformer, util
 import torch
 from bertopic import BERTopic
+from datetime import date
 ########################################
 # PRE-LOADING
     return ratings_grp
+########################################
+# SAVE_REPORT utils
+# Convert indielabel json to AVID json format.
+# See the AVID format in https://avidml.org/avidtools/reference/report
+#
+# Important mappings:
+#   IndieLabel Attribute        AVID Attribute          Example
+#   text_entry                  description             "I think the Perspective API
+#                                                       is too sensitive. Here are some examples."
+#   topic                       feature                 0_shes_woman_lady_face
+#   persp_score                 model_score             0.94
+#   comment                     ori_input               "She looks beautiful"
+#   user_rating                 personal_model_score    0.92
+#   user_decision               user_decision           "Non-toxic"
+# Note that this is at the individual report level.
def convert_indie_label_json_to_avid_json(indie_label_json):
    """Convert a single IndieLabel report into an AVID report JSON string.

    Args:
        indie_label_json: Dict describing one IndieLabel report. It must
            contain "text_entry" (the report text) and "evidence", an
            iterable of dicts that each provide "topic", "persp_score",
            "comment", "user_rating" and "user_decision".

    Returns:
        The AVID-formatted report serialized with ``json.dumps``. Every
        evidence item becomes one entry of "metrics", the report text is
        stored under description["value"], and "reported_date" is today's
        date as a string.

    Raises:
        KeyError: If any of the required keys listed above is missing.
    """
    report_text = indie_label_json["text_entry"]

    # For the end-user use case, each audited comment is its own metric entry.
    metrics = [
        {
            "name": "Perspective API",
            "detection_method": {
                "type": "Detection",
                "name": "Individual Example from End User Audit",
            },
            "results": {
                "feature": evidence["topic"],
                # Scores are converted to strings to avoid a Float type
                # error with the DB.
                "model_score": str(evidence["persp_score"]),
                "ori_input": evidence["comment"],
                "personal_model_score": str(evidence["user_rating"]),
                "user_decision": evidence["user_decision"],
            },
        }
        for evidence in indie_label_json["evidence"]
    ]

    avid_json_dict = {
        "data_type": "AVID",
        "data_version": None,
        "metadata": None,
        "affects": {
            "developer": [],
            "deployer": ["Hugging Face"],
            # TODO: Make artifacts malleable during modularity work
            "artifacts": [
                {
                    "type": "Model",
                    "name": "Perspective API",
                },
            ],
        },
        "problemtype": {
            # None of the other ClassEnums appear applicable. Link:
            # https://avidml.org/avidtools/_modules/avidtools/datamodels/enums#ClassEnum
            "classof": "Undefined",
            "type": "Detection",
            "description": {
                "lang": "eng",  # TODO: Make language selectable
                "value": "This report contains results from an end user audit conducted on Hugging Face.",
            },
        },
        "metrics": metrics,
        "references": [],
        # The report text belongs in the "value" field of the lang/value
        # object; assigning the bare string to "description" would discard
        # the "lang" field and change the field's type.
        "description": {
            "lang": "eng",  # TODO: Make language selectable
            "value": report_text,
        },
        "impact": {
            "avid": {
                "risk_domain": ["Ethics"],
                "sep_view": ["E0101: Group fairness"],
                "lifecycle_view": ["L05: Evaluation"],
                "taxonomy_version": "0.2",
            },
        },
        "credit": None,
        "reported_date": str(date.today()),
    }
    return json.dumps(avid_json_dict)
 ########################################
 # GET_PERSONALIZED_MODEL utils
 def fetch_existing_data(user, model_name):

server.py CHANGED Viewed

@@ -21,6 +21,9 @@ import friendlywords as fw
 import audit_utils as utils
 app = Flask(__name__)
 DEBUG = False  # Debug flag for development; set to False for production
@@ -635,6 +638,21 @@ def get_prompts_scaffold():
         },
     ]
 ########################################
 # ROUTE: /SAVE_REPORTS
 @app.route("/save_reports")
@@ -645,6 +663,9 @@ def save_reports():
     scaffold_method = request.args.get("scaffold_method")
     model = request.args.get("model")
     # Save reports for current user to file
     reports_file = utils.get_reports_file(cur_user, model)
     with open(reports_file, "w", encoding ='utf8') as f:
@@ -653,6 +674,7 @@ def save_reports():
     results = {
         "status": "success",
     }
     return json.dumps(results)
 ########################################

 import audit_utils as utils
+import requests
 app = Flask(__name__)
 DEBUG = False  # Debug flag for development; set to False for production
         },
     ]
+# Submit all reports to AVID
+# Logs the responses
def submit_reports_to_AVID(reports):
    """Submit every report to the AVID API and log each response.

    The endpoint is the AVID_API_URL environment variable concatenated
    directly with "submit"; the AVID_API_KEY environment variable is sent
    as the Authorization header.

    Submission is best-effort: a missing URL, a network failure, or a
    non-JSON response body is logged and does not raise, so the caller can
    continue with the rest of its work.

    Args:
        reports: Iterable of IndieLabel report dicts, each accepted by
            utils.convert_indie_label_json_to_avid_json.

    Returns:
        None.
    """
    # Set up the connection to AVID
    root = environ.get('AVID_API_URL')
    if not root:
        # Without a base URL, root + "submit" would raise a TypeError.
        print("AVID API response: skipped, AVID_API_URL is not set")
        return
    url = root + "submit"
    headers = {"Authorization": environ.get('AVID_API_KEY')}

    for r in reports:
        new_report = utils.convert_indie_label_json_to_avid_json(r)
        try:
            # The loads ensures type compliance. The timeout keeps an
            # unresponsive server from blocking the request indefinitely.
            response = requests.post(
                url,
                json=json.loads(new_report),
                headers=headers,
                timeout=30,
            )
        except requests.RequestException as err:
            print("AVID API request failed:", err)
            continue
        try:
            body = response.json()
        except ValueError:
            # Error responses are not guaranteed to carry a JSON body.
            body = None
        print("AVID API response:", response, body)
 ########################################
 # ROUTE: /SAVE_REPORTS
 @app.route("/save_reports")
     scaffold_method = request.args.get("scaffold_method")
     model = request.args.get("model")
+    # Submit reports to AVID
+    submit_reports_to_AVID(reports)
     # Save reports for current user to file
     reports_file = utils.get_reports_file(cur_user, model)
     with open(reports_file, "w", encoding ='utf8') as f:
     results = {
         "status": "success",
     }
+    print(results)
     return json.dumps(results)
 ########################################