File size: 16,815 Bytes
6571e75
d5428ff
6571e75
7269140
6571e75
7269140
 
cfd40e9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
7269140
 
6571e75
 
 
 
 
7269140
6571e75
 
 
 
 
 
7269140
6571e75
 
 
 
 
7269140
6571e75
 
 
7269140
6571e75
 
 
 
 
 
7269140
6571e75
7269140
 
6571e75
 
7269140
cfd40e9
 
5be1f85
7269140
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6571e75
7269140
 
 
6571e75
7269140
6571e75
7269140
 
6571e75
7269140
 
 
6571e75
7269140
6571e75
7269140
6571e75
7269140
 
 
 
 
 
 
 
d5428ff
7269140
 
 
 
 
 
 
 
 
 
 
 
cfd40e9
 
 
7269140
 
cfd40e9
7269140
 
 
 
 
 
 
 
 
 
 
cfd40e9
 
 
 
 
 
 
 
 
 
 
7269140
 
cfd40e9
7269140
cfd40e9
 
7269140
5be1f85
 
 
 
 
 
 
7269140
5be1f85
 
 
7269140
 
 
 
 
 
 
 
 
 
 
 
 
d5428ff
7269140
 
cfd40e9
7269140
6571e75
7269140
 
 
cfd40e9
7269140
 
 
 
 
 
 
6571e75
7269140
 
6571e75
7269140
 
6571e75
 
 
d5428ff
 
6571e75
d5428ff
6571e75
 
 
 
 
 
 
 
 
 
 
 
 
cfd40e9
6571e75
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
import os
import sys
import yaml
from enum import Enum

# Create some variables we will use throughout our analysis

project_variables = {
    "ai_project_type": {
        "ai_system": False,
        "gpai_model": False,
        "high_risk_ai_system": False,
        "gpai_model_systematic_risk": False
    },
    "operator_role": {
        "provider": False,
        "deployer": False,
        "importer": False,
        "distributor": False,
        "product_manufacturer": False,
        "eu_located": False
    },
    "eu_market_status": {
        "placed_on_market": False,
        "put_into_service": False,
        "output_used": False
    }
}

#Define a function that creates a list of all the files in a provided folder. We will use this list for different things.
def create_list_of_files(folder_path):
    for root, dirs, files in os.walk(folder_path):
        for filename in files:
            found_files.append(os.path.join(root, filename))

#Define a function that checks for a Project CC. Without this, there simply cannot be an analysis.
def check_for_project_cc(folder_path):
    found_files = []

    # Walk through the directory
    for root, dirs, files in os.walk(folder_path):
        for filename in files:
            if filename.lower() == 'project_cc.yaml':
                found_files.append(os.path.join(root, filename))

    # Check the results
    if len(found_files) == 0:
        print(f"We did not find a Project CC in your folder. We cannot run a compliance analysis without a Project CC.")
        sys.exit()
    elif len(found_files) == 1:
        print(f"We found exactly one Project CC in your folder. Great job!:")
        print(f"  - {found_files[0]}")
        run_compliance_analysis(folder_path)
    else:
        print(f"Multiple Project CCs found:")
        for file_path in found_files:
            print(f"  - {file_path}")
        print("We found multiple Project CCs in your folder. There should only be one Project CC per project.")

def run_compliance_analysis(folder_path):

    # Load the Project CC YAML file from the supplied folder. This will be our starting point. 
    with open(folder_path + 'project_cc.yaml', 'r') as file:
        project_cc_yaml = yaml.safe_load(file)

    # Determine project type (AI system vs. GPAI model) as well as operator type. We will use these for different things.
    set_type(project_variables, project_cc_yaml)
    set_operator_role_and_location(project_variables, project_cc_yaml)
    set_eu_market_status(project_variables, project_cc_yaml)

    # Check if the project is within scope of the Act. If it's not, the analysis is over.
    if check_within_scope(project_cc_yaml):
        print("Project is within the scope of Act. Let's continue...") 
    else: 
        sys.exit("Project is not within the scope of what is regulated by the Act.")

    # Check for prohibited practices. If any exist, the analysis is over.
    if check_prohibited(project_cc_yaml) == True: 
        print("Project contains prohibited practices and is therefore non-compliant.")
        sys.exit("Project is non-compliant due to a prohibited practice.")
    else: 
        print("Project does not contain prohibited practies. Let's continue...")

    # If project is high-risk AI system, check that is has met all the requirements for such systems: 

    if high_risk_ai_system:

    # Do this by examining the Project CC

        for key, value in project_cc_yaml['risk_management_system']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the risk management requirements under Article 9.")
        for key, value in project_cc_yaml['technical_documentation']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the risk management requirements under Article 11.")            
        for key, value in project_cc_yaml['record_keeping']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the risk management requirements under Article 12.")     
        for key, value in project_cc_yaml['transparency_and_provision_of_information_to_deployers']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the transparency requirements under Article 13.")  
        for key, value in project_cc_yaml['human_oversight']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the human oversight requirements under Article 14.")  
        for key, value in project_cc_yaml['accuracy_robustness_cybersecurity']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the accuracy, robustness, and cybersecurity requirements under Article 15.")  
        for key, value in project_cc_yaml['quality_management_system']:
            if not value:
                sys.exit("Because of project-level characteristics, this high-risk AI system fails the accuracy, robustness, and cybersecurity requirements under Article 17.") 

    # Do this by examining any and all Data CCs too

        for filename in os.listdir(folder_path):
            # Check if the search word is in the filename
            if "data_cc.md" in filename.lower():

                # If it is, load the yaml

                with open(folder_path + filename, 'r') as file:
                    data_cc_yaml = yaml.safe_load(file)

                for key, value in data_cc_yaml['data_and_data_governance']:
                    if not value:
                        sys.exit(f"Because of the dataset represented by {filename}, this high-risk AI system fails the data and data governance requirements under Article 10.")
                for key, value in data_cc_yaml['technical_documentation']:
                    if not value:
                        sys.exit(f"Because of the dataset represented by {filename}, this high-risk AI system fails the technical documentation requirements under Article 11.")
                for key, value in data_cc_yaml['transparency_and_provision_of_information_to_deployers']:
                    if not value:
                        sys.exit(f"Because of the dataset represented by {filename}, this high-risk  AI system fails the transparency requirements under Article 13.")
                for key, value in data_cc_yaml['quality_management_system']:
                    if not value:
                        sys.exit(f"Because of the dataset represented by {filename}, this high-risk  AI system fails the quality management requirements under Article 17.")

    # Do this by examining any and all Model CCs too

        for filename in os.listdir(folder_path):
            # Check if the search word is in the filename
            if "model_cc.md" in filename.lower():

                # If it is, load the yaml

                with open(folder_path + filename, 'r') as file:
                    model_cc_yaml = yaml.safe_load(file)

                for key, value in model_cc_yaml['risk_management_system']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this high-risk AI system fails the risk management requirements under Article 9.")
                for key, value in data_cc_yaml['technical_documentation']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this high-risk AI system fails the technical documentation requirements under Article 11.")
                for key, value in data_cc_yaml['transparency_and_provision_of_information_to_deployers']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this high-risk  AI system fails the transparency requirements under Article 13.")
                for key, value in data_cc_yaml['accuracy_robustness_cybersecurity']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this high-risk  AI system fails the quality management requirements under Article 15.")
                for key, value in data_cc_yaml['quality_management_system']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this high-risk  AI system fails the quality management requirements under Article 17.")

    # If the project is a GPAI model, check that is has met all the requirements for such systems: 

    if gpai_model:

    # Do this by examining the Project CC

        for key, value in project_cc_yaml['gpai_model_provider_obligations']:
            if not value:
                sys.exit("GPAI model fails the transparency requirements under Article 53.")

    # Do this by examining any and all Data CCs too

        for filename in os.listdir(folder_path):
            # Check if the search word is in the filename
            if "data_cc.md" in filename.lower():

                # If it is, load the yaml

                with open(folder_path + filename, 'r') as file:
                    data_cc_yaml = yaml.safe_load(file)

                for key, value in data_cc_yaml['gpai_requirements']['gpai_requirements']:
                    if not value:
                        sys.exit(f"Because of the dataset represented by {filename}, this GPAI fails the transparency requirements under Article 53.")

    # Do this by examining any and all Model CCs too
    
        for filename in os.listdir(folder_path):
            # Check if the search word is in the filename
            if "model_cc.md" in filename.lower():

                # If it is, load the yaml

                with open(folder_path + filename, 'r') as file:
                    model_cc_yaml = yaml.safe_load(file)

                for key, value in model_cc_yaml['obligations_for_providers_of_gpai_models']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this GPAI fails the transparency requirements under Article 53.")

    # If the project is a GPAI model with systematic risk, check that is has additionally met all the requirements for such systems: 

    if gpai_model_systematic_risk:

    # Do this by examining the Project CC

        for key, value in project_cc_yaml['gpai_obligations_for_systemic_risk_models']:
            if not value:
                sys.exit("GPAI model with systematic risk fails the transparency requirements under Article 55.")

    # Do this by examining any and all Model CCs too

        for filename in os.listdir(folder_path):
            # Check if the search word is in the filename
            if "model_cc.md" in filename.lower():

                # If it is, load the yaml

                with open(folder_path + filename, 'r') as file:
                    model_cc_yaml = yaml.safe_load(file)

                for key, value in model_cc_yaml['obligations_for_providers_of_gpai_models_with_systemic_risk']:
                    if not value:
                        sys.exit(f"Because of the model represented by {filename}, this GPAI model with systematic risk fails the transparency requirements under Article 55.")

def set_type(project_variables, project_cc_yaml):
    ai_system = project_variables['ai_project_type']['ai_system']
    gpai_model = project_variables['ai_project_type']['gpai_model']
    if project_cc_yaml['ai_system']['ai_system']['value']:
        ai_system = True
    if project_cc_yaml['gpai_model']['gpai_model']['value']:
        gpai_model = True
    if ai_system and gpai_model:
        sys.exit("Your project cannot be both an AI system and a GPAI model. Please revise your Project CC accordingly.")
    if ai_system == True:
        for key, value in project_cc_yaml['high_risk_ai_system']:
            if value and sum(map(bool, [project_cc_yaml['high_risk_ai_system']['filter_exception_rights'],project_cc_yaml['high_risk_ai_system']['filter_exception_narrow'],project_cc_yaml['high_risk_ai_system']['filter_exception_human'],project_cc_yaml['high_risk_ai_system']['filter_exception_deviation'], project_cc_yaml['high_risk_ai_system']['filter_exception_prep']])) < 1:
                high_risk_ai_system == True
    if gpai_model == True:
        if project_cc_yaml['gpai_model_systematic_risk']['evaluation'] or project_cc_yaml['gpai_model_systematic_risk']['flops']:
            gpai_model_systematic_risk == True

def set_operator_role_and_location(project_variables, project_cc_yaml):
    operators = 0
    
    ai_system = project_variables['ai_project_type']['ai_system']
    gpai_model = project_variables['ai_project_type']['gpai_model']
    
    for var in project_variables['operator_role']:
        if project_cc_yaml['operator_role'][f'{var}']['value']:
            project_variables['operator_role'][f'{var}'] = True
            operators += 1 
        
    if ai_system and gpai_model:
        sys.exit("Your project cannot be both an AI system and a GPAI model. Please revise your Project CC accordingly.")
    if operators != 1:
        sys.exit("Please specify exactly one operator role.")
    
    return project_variables

def set_eu_market_status(project_variables, project_cc_yaml):
    
    if project_cc_yaml['eu_market_status']['placed_on_market']['value']:
        project_variables['eu_market_status']["placed_on_market"] = True
    if project_cc_yaml['eu_market_status']['put_into_service']['value']:
        project_variables['eu_market_status']["put_into_service"] = True
        
    if project_cc_yaml['operator_role']['output_used']['value']:
        project_variables['operator_role']["output_used"] = True
        
    return project_variables

def check_within_scope(project_cc):
    if not check_excepted(project_cc):
        if provider and ((ai_system and (placed_on_market or put_into_service)) or (gpai_model and placed_on_market)):   # Article 2.1(a)
            return True
        if deployer and eu_located: # Article 2.1(b)
            return True
        if (provider or deployer) and (ai_system and eu_located and output_used): # Article 2.1(c)
            return True
        if (importer or distributor) and ai_system: # Article 2.1(d)
            return True
        if product_manufacturer and ai_system and (placed_on_market or put_into_service): # Article 2.1(e)
            return True
    else:
        return False

def check_excepted(project_cc_yaml):
    if project_cc_yaml['excepted']['scientific'] or project_cc_yaml['excepted']['pre_market'] or (ai_system and project_cc_yaml['excepted']['open_source_ai_system']) or (gpai_model and project_cc_yaml['excepted']['open_source_gpai_system']):
        return True
    else:
        return False 

def check_prohibited (project_cc_yaml):
    if ai_system:
        for key in project_cc_yaml['prohibited_practice']['ai_system']:
            if key[value]: 
                print("You are engaged in a prohibited practice and thus the project is non-compliant.")
                return True
    if project_cc_yaml['prohibited_practice']['biometric']['categorization']:
        print("You are engaged in a prohibited practice and thus the project is non-compliant.")
        return True
    if project_cc_yaml['prohibited_practice']['biometric']['real_time'] and sum(map(bool, [project_cc['prohibited_practice']['biometric']['real_time_exception_victim'],project_cc['prohibited_practice']['biometric']['real_time_exception_threat'], project_cc['prohibited_practice']['biometric']['real_time_exception_investigation']])) == 0:
        print("You are engaged in a prohibited practice and thus the project is non-compliant.")
        return True
    else: 
        print("You are not engaged in any prohibited practices.")
        return False

def check_all_true(file_path):
    # Load the YAML file
    with open("./project_cc.yaml", 'r') as file:
        data = yaml.safe_load(file)

    # Iterate through top-level keys
    for top_key, top_value in data.items():
        if isinstance(top_value, dict):
            # Iterate through second-level keys
            for second_key, second_value in top_value.items():
                if not second_value:
                    print("You are non-compliant with the Act")
                    break
            else:
                print("No problems here")

def main():
    # Prompt the user to enter a filename
    file_path = "./" # input("Please enter a file path to the folder containing all your AI project's Compliance Cards: ")

    # Call the function with the entered filename
    check_for_project_cc(file_path)

if __name__ == "__main__":
    main()