Spaces:
Sleeping
Sleeping
wlmbrown
committed on
Commit
·
8f91f41
1
Parent(s):
6d40ad6
comments and minor changes to model and data cards
Browse files- data_cc.yaml +12 -6
- model_cc.yaml +20 -10
data_cc.yaml
CHANGED
@@ -1,5 +1,7 @@
|
|
1 |
card_type: "data" # "project", "data" or "model"
|
2 |
|
|
|
|
|
3 |
intended_purpose:
|
4 |
safety_component:
|
5 |
article: 'Art. 6(1)(a)'
|
@@ -54,6 +56,8 @@ intended_purpose:
|
|
54 |
verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
|
55 |
value: !!bool false
|
56 |
|
|
|
|
|
57 |
high_risk_ai_systems:
|
58 |
data_and_data_governance_data_governance:
|
59 |
article: 'Art. 10(1)-(2)'
|
@@ -105,15 +109,15 @@ high_risk_ai_systems:
|
|
105 |
value: !!bool false
|
106 |
data_and_data_governance_data_completeness:
|
107 |
article: 'Art. 10(3); Rec. 67'
|
108 |
-
verbose: 'Training data is complete in view of the intended purpose
|
109 |
value: !!bool false
|
110 |
data_and_data_governance_statistical_properties:
|
111 |
article: 'Art. 10(3)'
|
112 |
-
verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom
|
113 |
value: !!bool false
|
114 |
data_and_data_governance_contextual:
|
115 |
article: 'Art. 10(4)'
|
116 |
-
verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which
|
117 |
value: !!bool false
|
118 |
data_and_data_governance_personal_data_necessary:
|
119 |
article: 'Art. 10(5)'
|
@@ -177,17 +181,19 @@ high_risk_ai_systems:
|
|
177 |
value: !!bool false
|
178 |
technical_documentation_cybersecurity:
|
179 |
article: 'Art. 11; Annex IV(2)(h)'
|
180 |
-
verbose: 'Cybersecurity measures put in place as regards the data (e.g., scanning for data poisoning)'
|
181 |
value: !!bool false
|
182 |
transparency_and_provision_of_information_to_deployers:
|
183 |
article: 'Art. 13(3)(b)(vi)'
|
184 |
-
verbose: '
|
185 |
value: !!bool false
|
186 |
quality_management_system:
|
187 |
article: 'Art. 17(1)(f)'
|
188 |
-
verbose: '
|
189 |
value: !!bool false
|
190 |
|
|
|
|
|
191 |
gpai_requirements:
|
192 |
data_type:
|
193 |
article: 'Art. 53(1); Annex XI(2)(c)'
|
|
|
1 |
card_type: "data" # "project", "data" or "model"
|
2 |
|
3 |
+
# Metadata related to intended purpose(s) of data
|
4 |
+
|
5 |
intended_purpose:
|
6 |
safety_component:
|
7 |
article: 'Art. 6(1)(a)'
|
|
|
56 |
verbose: 'This dataset is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
|
57 |
value: !!bool false
|
58 |
|
59 |
+
# Metadata related to data-related requirements for high-risk AI systems
|
60 |
+
|
61 |
high_risk_ai_systems:
|
62 |
data_and_data_governance_data_governance:
|
63 |
article: 'Art. 10(1)-(2)'
|
|
|
109 |
value: !!bool false
|
110 |
data_and_data_governance_data_completeness:
|
111 |
article: 'Art. 10(3); Rec. 67'
|
112 |
+
verbose: 'Training data is complete in view of the intended purpose'
|
113 |
value: !!bool false
|
114 |
data_and_data_governance_statistical_properties:
|
115 |
article: 'Art. 10(3)'
|
116 |
+
verbose: 'Training data possesses the appropriate statistical properties, including, where applicable, as regards the people in relation to whom it is intended to be used'
|
117 |
value: !!bool false
|
118 |
data_and_data_governance_contextual:
|
119 |
article: 'Art. 10(4)'
|
120 |
+
verbose: 'Training data takes into account, to the extent required by the intended purpose, the characteristics or elements that are particular to the specific geographical, contextual, behavioural or functional setting within which it is intended to be used'
|
121 |
value: !!bool false
|
122 |
data_and_data_governance_personal_data_necessary:
|
123 |
article: 'Art. 10(5)'
|
|
|
181 |
value: !!bool false
|
182 |
technical_documentation_cybersecurity:
|
183 |
article: 'Art. 11; Annex IV(2)(h)'
|
184 |
+
verbose: 'Cybersecurity measures were put in place as regards the data (e.g., scanning for data poisoning)'
|
185 |
value: !!bool false
|
186 |
transparency_and_provision_of_information_to_deployers:
|
187 |
article: 'Art. 13(3)(b)(vi)'
|
188 |
+
verbose: 'Dataset is accompanied by instructions for use that convey relevant information about it, taking into account its intended purpose'
|
189 |
value: !!bool false
|
190 |
quality_management_system:
|
191 |
article: 'Art. 17(1)(f)'
|
192 |
+
verbose: 'Dataset was subject to a quality management system that is documented in a systematic and orderly manner in the form of written policies, procedures and instructions, and includes a description of the systems and procedures for data management, including data acquisition, data collection, data analysis, data labelling, data storage, data filtration, data mining, data aggregation, data retention and any other operation regarding the data'
|
193 |
value: !!bool false
|
194 |
|
195 |
+
# Metadata related to data-related requirements for GPAI models
|
196 |
+
|
197 |
gpai_requirements:
|
198 |
data_type:
|
199 |
article: 'Art. 53(1); Annex XI(2)(c)'
|
model_cc.yaml
CHANGED
@@ -1,5 +1,7 @@
|
|
1 |
card_type: "model" # "project", "data" or "model"
|
2 |
|
|
|
|
|
3 |
intended_purpose:
|
4 |
safety_component:
|
5 |
article: 'Art. 6(1)(a)'
|
@@ -54,6 +56,20 @@ intended_purpose:
|
|
54 |
verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
|
55 |
value: !!bool false
|
56 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
57 |
high_risk_ai_models:
|
58 |
risk_management_system_general:
|
59 |
article: 'Art. 9(2)'
|
@@ -192,15 +208,7 @@ high_risk_ai_models:
|
|
192 |
verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
|
193 |
value: !!bool false
|
194 |
|
195 |
-
|
196 |
-
high_impact_capabilities:
|
197 |
-
article: 'Art. 51(1)(a)'
|
198 |
-
verbose: 'Whether model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
|
199 |
-
value: !!bool false
|
200 |
-
flops:
|
201 |
-
article: 'Art. 51(2)'
|
202 |
-
verbose: 'Cumulative compute used for training measured in floating point operations (FLOPs)'
|
203 |
-
value: !!bool false
|
204 |
|
205 |
obligations_for_providers_of_gpai_models:
|
206 |
task:
|
@@ -302,10 +310,12 @@ obligations_for_providers_of_gpai_models_with_systemic_risk:
|
|
302 |
verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
|
303 |
value: !!bool false
|
304 |
|
|
|
|
|
305 |
transparency_obligations:
|
306 |
generates_media: # clean this up
|
307 |
article: 'Art. 50(2)'
|
308 |
-
verbose: 'If the
|
309 |
value: !!bool false
|
310 |
marked_as_generated:
|
311 |
article: 'Art. 50(2)'
|
|
|
1 |
card_type: "model" # "project", "data" or "model"
|
2 |
|
3 |
+
# Metadata related to intended purpose(s) of model
|
4 |
+
|
5 |
intended_purpose:
|
6 |
safety_component:
|
7 |
article: 'Art. 6(1)(a)'
|
|
|
56 |
verbose: 'This model is appropriate to use for AI projects intended to be used by a judicial authority or on their behalf to assist a judicial authority in researching and interpreting facts and the law and in applying the law to a concrete set of facts, or to be used in a similar way in alternative dispute resolution'
|
57 |
value: !!bool false
|
58 |
|
59 |
+
# Metadata that will help us determine if the model itself is a GPAI and, therefore, must satisfy the requirements of GPAI models
|
60 |
+
|
61 |
+
classification_of_gpai_models:
|
62 |
+
high_impact_capabilities:
|
63 |
+
article: 'Art. 51(1)(a)'
|
64 |
+
verbose: 'The model has high impact capabilities evaluated on the basis of appropriate technical tools and methodologies, including indicators and benchmarks'
|
65 |
+
value: !!bool false
|
66 |
+
flops:
|
67 |
+
article: 'Art. 51(2)'
|
68 |
+
verbose: 'The cumulative compute used for training the model, as measured in floating point operations (FLOPs), was greater than 10^25.'
|
69 |
+
value: !!bool false
|
70 |
+
|
71 |
+
# Metadata related to model-related requirements for high-risk AI systems
|
72 |
+
|
73 |
high_risk_ai_models:
|
74 |
risk_management_system_general:
|
75 |
article: 'Art. 9(2)'
|
|
|
208 |
verbose: 'Examination, test and validation procedures to be carried out before, during and after the development of the high-risk AI system, and the frequency with which they have to be carried out'
|
209 |
value: !!bool false
|
210 |
|
211 |
+
# Metadata related to model-related requirements for GPAI models
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
212 |
|
213 |
obligations_for_providers_of_gpai_models:
|
214 |
task:
|
|
|
310 |
verbose: 'Ensure an adequate level of cybersecurity protection for the GPAI model with systemic risk and the physical infrastructure of the model'
|
311 |
value: !!bool false
|
312 |
|
313 |
+
# Metadata related to transparency requirements for some AI systems (Article 50)
|
314 |
+
|
315 |
transparency_obligations:
|
316 |
generates_media: # clean this up
|
317 |
article: 'Art. 50(2)'
|
318 |
+
verbose: 'If the model generates synthetic audio, image, video or text content'
|
319 |
value: !!bool false
|
320 |
marked_as_generated:
|
321 |
article: 'Art. 50(2)'
|