wlmbrown committed on
Commit
8f91f41
·
1 Parent(s): 6d40ad6

comments and minor changes to model and data cards

Browse files
Files changed (2) hide show
  1. data_cc.yaml +12 -6
  2. model_cc.yaml +20 -10
data_cc.yaml CHANGED
@@ -1,5 +1,7 @@
1
  card_type: "data" # "project", "data" or "model"
2
 
 
 
3
  intended_purpose:
4
  safety_component:
5
  article: 'Art. 6(1)(a)'
@@ -54,6 +56,8 @@ intended_purpose:
54
  verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
55
  value: !!bool false
56
 
 
 
57
  high_risk_ai_systems:
58
  data_and_data_governance_data_governance:
59
  article: 'Art. 10(1)-(2)'
@@ -105,15 +109,15 @@ high_risk_ai_systems:
105
  value: !!bool false
106
  data_and_data_governance_data_completeness:
107
  article: 'Art. 10(3); Rec. 67'
108
- verbose: 'Training data is complete in view of the intended purpose of system'
109
  value: !!bool false
110
  data_and_data_governance_statistical_properties:
111
  article: 'Art. 10(3)'
112
- verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom the system is intended to be used'
113
  value: !!bool false
114
  data_and_data_governance_contextual:
115
  article: 'Art. 10(4)'
116
- verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which the system is intended to be used'
117
  value: !!bool false
118
  data_and_data_governance_personal_data_necessary:
119
  article: 'Art. 10(5)'
@@ -177,17 +181,19 @@ high_risk_ai_systems:
177
  value: !!bool false
178
  technical_documentation_cybersecurity:
179
  article: 'Art. 11; Annex IV(2)(h)'
180
- verbose: 'Cybersecurity measures put in place as regards the data (e.g., scanning for data poisoning)'
181
  value: !!bool false
182
  transparency_and_provision_of_information_to_deployers:
183
  article: 'Art. 13(3)(b)(vi)'
184
- verbose: 'Specifications for the input data, or any other relevant information in terms of the training, validation and testing data sets used, taking into account the intended purpose of the AI system'
185
  value: !!bool false
186
  quality_management_system:
187
  article: 'Art. 17(1)(f)'
188
- verbose: 'Systems and procedures for data management, including data acquisition, data collection, data analysis, data labelling, data storage, data filtration, data mining, data aggregation, data retention and any other operation regarding the data that is performed before and for the purposes of the placing on the market or putting into service of high-risk AI systems'
189
  value: !!bool false
190
 
 
 
191
  gpai_requirements:
192
  data_type:
193
  article: 'Art. 53(1); Annex XI(2)(c)'
 
1
  card_type: "data" # "project", "data" or "model"
2
 
3
+ # Metadata related to intended purpose(s) of data
4
+
5
  intended_purpose:
6
  safety_component:
7
  article: 'Art. 6(1)(a)'
 
56
  verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
57
  value: !!bool false
58
 
59
+ # Metadata related to data-related requirements for high-risk AI systems
60
+
61
  high_risk_ai_systems:
62
  data_and_data_governance_data_governance:
63
  article: 'Art. 10(1)-(2)'
 
109
  value: !!bool false
110
  data_and_data_governance_data_completeness:
111
  article: 'Art. 10(3); Rec. 67'
112
+ verbose: 'Training data is complete in view of the intended purpose'
113
  value: !!bool false
114
  data_and_data_governance_statistical_properties:
115
  article: 'Art. 10(3)'
116
+ verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom it is intended to be used'
117
  value: !!bool false
118
  data_and_data_governance_contextual:
119
  article: 'Art. 10(4)'
120
+ verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which it is intended to be used'
121
  value: !!bool false
122
  data_and_data_governance_personal_data_necessary:
123
  article: 'Art. 10(5)'
 
181
  value: !!bool false
182
  technical_documentation_cybersecurity:
183
  article: 'Art. 11; Annex IV(2)(h)'
184
+ verbose: 'Cybersecurity measures were put in place as regards the data (e.g., scanning for data poisoning)'
185
  value: !!bool false
186
  transparency_and_provision_of_information_to_deployers:
187
  article: 'Art. 13(3)(b)(vi)'
188
+ verbose: 'Dataset is accompanied by instructions for use that convey relevant information about it, taking into account its intended purpose'
189
  value: !!bool false
190
  quality_management_system:
191
  article: 'Art. 17(1)(f)'
192
+ verbose: 'Dataset was subject to a quality management system that is documented in a systematic and orderly manner in the form of written policies, procedures and instructions, and includes a description of the systems and procedures for data management, including data acquisition, data collection, data analysis, data labelling, data storage, data filtration, data mining, data aggregation, data retention and any other operation regarding the data'
193
  value: !!bool false
194
 
195
+ # Metadata related to data-related requirements for GPAI models
196
+
197
  gpai_requirements:
198
  data_type:
199
  article: 'Art. 53(1); Annex XI(2)(c)'
model_cc.yaml CHANGED
@@ -1,5 +1,7 @@
1
  card_type: "model" # "project", "data" or "model"
2
 
 
 
3
  intended_purpose:
4
  safety_component:
5
  article: 'Art. 6(1)(a)'
@@ -54,6 +56,20 @@ intended_purpose:
54
  verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
55
  value: !!bool false
56
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
57
  high_risk_ai_models:
58
  risk_management_system_general:
59
  article: 'Art. 9(2)'
@@ -192,15 +208,7 @@ high_risk_ai_models:
192
  verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
193
  value: !!bool false
194
 
195
- classification_of_gpai_models:
196
- high_impact_capabilities:
197
- article: 'Art. 51(1)(a)'
198
- verbose: 'Whether model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
199
- value: !!bool false
200
- flops:
201
- article: 'Art. 51(2)'
202
- verbose: 'Cumulative compute used for training measured in floating point operations (FLOPs)'
203
- value: !!bool false
204
 
205
  obligations_for_providers_of_gpai_models:
206
  task:
@@ -302,10 +310,12 @@ obligations_for_providers_of_gpai_models_with_systemic_risk:
302
  verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
303
  value: !!bool false
304
 
 
 
305
  transparency_obligations:
306
  generates_media: # clean this up
307
  article: 'Art. 50(2)'
308
- verbose: 'If the AI project generates synthetic audio, image, video or text content'
309
  value: !!bool false
310
  marked_as_generated:
311
  article: 'Art. 50(2)'
 
1
  card_type: "model" # "project", "data" or "model"
2
 
3
+ # Metadata related to intended purpose(s) of model
4
+
5
  intended_purpose:
6
  safety_component:
7
  article: 'Art. 6(1)(a)'
 
56
  verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
57
  value: !!bool false
58
 
59
+ # Metadata that will help us determine if the model itself is a GPAI and, therefore, must satisfy the requirements of GPAI models
60
+
61
+ classification_of_gpai_models:
62
+ high_impact_capabilities:
63
+ article: 'Art. 51(1)(a)'
64
+ verbose: 'The model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
65
+ value: !!bool false
66
+ flops:
67
+ article: 'Art. 51(2)'
68
+ verbose: 'The cumulative compute used for training the model, as measured in floating point operations (FLOPs), was greater than 10^25.'
69
+ value: !!bool false
70
+
71
+ # Metadata related to model-related requirements for high-risk AI systems
72
+
73
  high_risk_ai_models:
74
  risk_management_system_general:
75
  article: 'Art. 9(2)'
 
208
  verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
209
  value: !!bool false
210
 
211
+ # Metadata related to model-related requirements for GPAI models
 
 
 
 
 
 
 
 
212
 
213
  obligations_for_providers_of_gpai_models:
214
  task:
 
310
  verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
311
  value: !!bool false
312
 
313
+ # Metadata related to transparency requirements for some AI systems (Article 50)
314
+
315
  transparency_obligations:
316
  generates_media: # clean this up
317
  article: 'Art. 50(2)'
318
+ verbose: 'If the model generates synthetic audio, image, video or text content'
319
  value: !!bool false
320
  marked_as_generated:
321
  article: 'Art. 50(2)'