Spaces:

camlsys
/

compliancecards

Sleeping

App Files Files Community

wlmbrown committed on Aug 29, 2024

Commit

8f91f41

1 Parent(s): 6d40ad6

comments and minor changes to model and data cards

Browse files

Files changed (2) hide show

data_cc.yaml +12 -6
model_cc.yaml +20 -10

data_cc.yaml CHANGED Viewed

@@ -1,5 +1,7 @@
 card_type: "data" # "project", "data" or "model"
 intended_purpose:
   safety_component:
     article: 'Art. 6(1)(a)'
@@ -54,6 +56,8 @@ intended_purpose:
     verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
     value: !!bool false
 high_risk_ai_systems:
   data_and_data_governance_data_governance:
     article: 'Art. 10(1)-(2)'
@@ -105,15 +109,15 @@ high_risk_ai_systems:
     value: !!bool false
   data_and_data_governance_data_completeness:
     article: 'Art. 10(3); Rec. 67'
-    verbose: 'Training data is complete in view of the intended purpose of system'
     value: !!bool false
   data_and_data_governance_statistical_properties:
     article: 'Art. 10(3)'
-    verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom the system is intended to be used'
     value: !!bool false
   data_and_data_governance_contextual:
     article: 'Art. 10(4)'
-    verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which the system is intended to be used'
     value: !!bool false
   data_and_data_governance_personal_data_necessary:
     article: 'Art. 10(5)'
@@ -177,17 +181,19 @@ high_risk_ai_systems:
     value: !!bool false
   technical_documentation_cybersecurity:
     article: 'Art. 11; Annex IV(2)(h)'
-    verbose: 'Cybersecurity measures put in place as regards the data (e.g., scanning for data poisoning)'
     value: !!bool false
   transparency_and_provision_of_information_to_deployers:
     article: 'Art. 13(3)(b)(vi)'
-    verbose: 'Specifications for the input data, or any other relevant information in terms of the training, validation and testing data sets used, taking into account the intended purpose of the AI system'
     value: !!bool false
   quality_management_system:
     article: 'Art. 17(1)(f)'
-    verbose: 'Systems and procedures for data management, including data acquisition, data collection, data analysis, data labelling, data storage, data filtration, data mining, data aggregation, data retention and any other operation regarding the data that is performed before and for the purposes of the placing on the market or putting into service of high-risk AI systems'
     value: !!bool false
 gpai_requirements:
   data_type:
     article: 'Art. 53(1); Annex XI(2)(c)'

 card_type: "data" # "project", "data" or "model"
+# Metadata related to intended purpose(s) of data
 intended_purpose:
   safety_component:
     article: 'Art. 6(1)(a)'
     verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
     value: !!bool false
+# Metadata related to data-related requirements for high-risk AI systems
 high_risk_ai_systems:
   data_and_data_governance_data_governance:
     article: 'Art. 10(1)-(2)'
     value: !!bool false
   data_and_data_governance_data_completeness:
     article: 'Art. 10(3); Rec. 67'
+    verbose: 'Training data is complete in view of the intended purpose'
     value: !!bool false
   data_and_data_governance_statistical_properties:
     article: 'Art. 10(3)'
+    verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom it is intended to be used'
     value: !!bool false
   data_and_data_governance_contextual:
     article: 'Art. 10(4)'
+    verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which it is intended to be used'
     value: !!bool false
   data_and_data_governance_personal_data_necessary:
     article: 'Art. 10(5)'
     value: !!bool false
   technical_documentation_cybersecurity:
     article: 'Art. 11; Annex IV(2)(h)'
+    verbose: 'Cybersecurity measures were put in place as regards the data (e.g., scanning for data poisoning)'
     value: !!bool false
   transparency_and_provision_of_information_to_deployers:
     article: 'Art. 13(3)(b)(vi)'
+    verbose: 'Dataset is accompanied by instructions for use that convey relevant information about it, taking into account its intended purpose'
     value: !!bool false
   quality_management_system:
     article: 'Art. 17(1)(f)'
+    verbose: 'Dataset was subject to a quality management system that is documented in a systematic and orderly manner in the form of written policies, procedures and instructions, and includes a description of the systems and procedures for data management, including data acquisition, data collection, data analysis, data labelling, data storage, data filtration, data mining, data aggregation, data retention and any other operation regarding the data'
     value: !!bool false
+# Metadata related to data-related requirements for GPAI models
 gpai_requirements:
   data_type:
     article: 'Art. 53(1); Annex XI(2)(c)'

model_cc.yaml CHANGED Viewed

@@ -1,5 +1,7 @@
 card_type: "model" # "project", "data" or "model"
 intended_purpose:
   safety_component:
     article: 'Art. 6(1)(a)'
@@ -54,6 +56,20 @@ intended_purpose:
     verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
     value: !!bool false
 high_risk_ai_models:
   risk_management_system_general:
     article: 'Art. 9(2)'
@@ -192,15 +208,7 @@ high_risk_ai_models:
     verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
     value: !!bool false
-classification_of_gpai_models:
-  high_impact_capabilities:
-    article: 'Art. 51(1)(a)'
-    verbose: 'Whether model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
-    value: !!bool false
-  flops:
-    article: 'Art. 51(2)'
-    verbose: 'Cumulative compute used for training measured in floating point operations (FLOPs)'
-    value: !!bool false
 obligations_for_providers_of_gpai_models:
   task:
@@ -302,10 +310,12 @@ obligations_for_providers_of_gpai_models_with_systemic_risk:
     verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
     value: !!bool false
 transparency_obligations:
   generates_media: # clean this up
     article: 'Art. 50(2)'
-    verbose: 'If the AI project generates synthetic audio, image, video or text content'
     value: !!bool false
   marked_as_generated:
     article: 'Art. 50(2)'

 card_type: "model" # "project", "data" or "model"
+# Metadata related to intended purpose(s) of model
 intended_purpose:
   safety_component:
     article: 'Art. 6(1)(a)'
     verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
     value: !!bool false
+# Metadata that will help us determine if the model itself is a GPAI and, therefore, must satisfy the requirements of GPAI models
+classification_of_gpai_models:
+  high_impact_capabilities:
+    article: 'Art. 51(1)(a)'
+    verbose: 'The model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
+    value: !!bool false
+  flops:
+    article: 'Art. 51(2)'
+    verbose: 'The cumulative compute used for training the model, as measured in floating point operations (FLOPs), was greater than 10^25.'
+    value: !!bool false
+# Metadata related to model-related requirements for high-risk AI systems
 high_risk_ai_models:
   risk_management_system_general:
     article: 'Art. 9(2)'
     verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
     value: !!bool false
+# Metadata related to model-related requirements for GPAI models
 obligations_for_providers_of_gpai_models:
   task:
     verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
     value: !!bool false
+# Metadata related to transparency requirements for some AI systems (Article 50)
 transparency_obligations:
   generates_media: # clean this up
     article: 'Art. 50(2)'
+    verbose: 'If the model generates synthetic audio, image, video or text content'
     value: !!bool false
   marked_as_generated:
     article: 'Art. 50(2)'