# IMPORT DATA, PACKAGES, AND FUNCTIONS

## import the relevant functions and packages

In [1]:
import pandas as pd
import numpy as np
from test_case_generator_functions import alphabet

# TEST CASE TYPE REFERENCE INFORMATION

In [2]:
# Metadata describing this test case type. Every generated test case row
# carries these values unchanged.
uid = 'UID-241'                                # written to 'UID'; also prefixes each 'Test Case ID'
theme = 'Names where name parts are Modified'  # written to 'Theme'
category = 'Repetitions'                       # written to 'Category'
sub_category = 'Very Short Name'               # written to 'Sub-category'
entity_type = 'Entity'                         # written to 'Entity-Type'

## download the OFAC list from the web

In [3]:
# Read the sdn.csv file directly from the Treasury URL. header=None stops
# pandas from consuming the first row as column names, so the columns are
# labelled with integers (0, 1, 2, ...).
ofac_list_download = pd.read_csv(
    'https://www.treasury.gov/ofac/downloads/sdn.csv',
    header=None,
)

In [4]:
# Keep only the first three columns of the download and give them
# descriptive labels in the same expression.
ofac_list = ofac_list_download[[0, 1, 2]].rename(
    columns={0: 'uid', 1: 'name', 2: 'entity_type'}
)

# FILTER FOR THE REQUIREMENTS OF THE TEST CASE TYPE

## keep only entity records whose name is at most 10 characters long

In [5]:
# only evaluate entities: keep the rows whose entity_type is exactly '-0- '
# (the literal being matched ends with a trailing space)
ofac_list_filtered = ofac_list.loc[ofac_list['entity_type'].eq('-0- ')]

In [6]:
# Longest name, in characters (spaces and punctuation included), that still
# qualifies for this test case type.
MAX_NAME_LENGTH = 10

ofac_list_filtered = ofac_list_filtered.reset_index(drop=True)

# Vectorised length filter instead of appending to a DataFrame one row at a
# time. For a missing name .str.len() yields NaN, and NaN <= MAX_NAME_LENGTH is
# False, so such rows are dropped instead of crashing a plain len() call.
is_short_name = ofac_list_filtered['name'].str.len() <= MAX_NAME_LENGTH
ofac_list_filtered_short_name = (
    ofac_list_filtered
    .loc[is_short_name, ['uid', 'name', 'entity_type']]
    .reset_index(drop=True)  # fresh 0..n-1 index, as the row-by-row build produced
)

ofac_list_filtered_short_name

Unnamed: 0,uid,name,entity_type
0,535,CIMEX,-0-
1,578,COTEI,-0-
2,591,CUBAEXPORT,-0-
3,592,CUBAFRUTAS,-0-
4,621,CUBANATUR,-0-
...,...,...,...
199,37023,LADOGA OOO,-0-
200,37070,BLENDER.IO,-0-
201,37485,TREND GYO,-0-
202,37768,ZALOG OOO,-0-


## randomly choose 10 rows

In [7]:
SAMPLE_SIZE = 10   # number of OFAC rows to turn into test cases
RANDOM_SEED = 241  # arbitrary fixed seed so a fresh Restart & Run All draws the same rows

# Cap the request at the number of available rows: DataFrame.sample raises
# ValueError when n is larger than the frame and replace is False.
ofac_list_sampled = ofac_list_filtered_short_name.sample(
    n=min(SAMPLE_SIZE, len(ofac_list_filtered_short_name)),
    random_state=RANDOM_SEED,
)
ofac_list_sampled

Unnamed: 0,uid,name,entity_type
187,34673,PASKAL OOO,-0-
29,9367,EIRIN FARM,-0-
38,10492,GHORB NOOH,-0-
175,32022,EDE 2 EOOD,-0-
89,16811,CJSC ZEST,-0-
158,28533,AL KAWTHAR,-0-
127,23628,HASM,-0-
61,12927,MAHAN AIR,-0-
147,26664,EVIL CORP,-0-
156,28177,MINOCONGO,-0-


# CREATE THE TEST CASES

## create blank final test cases table

In [8]:
# Empty results table: one column per attribute recorded for a generated test
# case. Rows are added by the generation loop further down.
final_test_cases = pd.DataFrame(
    columns=[
        'UID',
        'Theme',
        'Category',
        'Sub-category',
        'Entity-Type',
        'Test Case ID',
        'OFAC List UID',
        'Original Name',
        'Test Case Name',
    ]
)
final_test_cases

Unnamed: 0,UID,Theme,Category,Sub-category,Entity-Type,Test Case ID,OFAC List UID,Original Name,Test Case Name


## run loop to generate the test cases

In [9]:
# Fixed seed so that, for the same sampled rows, a fresh run repeats the same
# letter in every name.
RANDOM_SEED = 241
letter_rng = np.random.default_rng(RANDOM_SEED)

# Look the letters up once instead of calling alphabet() for every character.
# assumes alphabet() returns an iterable of single characters — TODO confirm
letters = frozenset(alphabet())

# Rows are collected in a plain list and the frame is built once at the end.
# This avoids growing a DataFrame row by row, and re-running the cell now
# replaces the table instead of appending a second batch of rows to it.
test_case_rows = []
for index, row in ofac_list_sampled.iterrows():
    original_name = row['name'].upper()

    # positions of the characters eligible for repetition (letters only, so
    # spaces, digits and punctuation are never doubled)
    letter_positions = [
        position
        for position, character in enumerate(original_name)
        if character in letters
    ]
    if not letter_positions:
        # nothing to repeat; choosing from an empty list would raise ValueError
        continue

    # randomly choose the letter to be repeated and double it in place:
    # everything up to and including the chosen letter, then the chosen
    # letter again followed by the rest of the name
    chosen = int(letter_rng.choice(letter_positions))
    final_test_name = original_name[:chosen + 1] + original_name[chosen:]

    test_case_rows.append([
        uid,
        theme,
        category,
        sub_category,
        entity_type,
        uid + ' - ' + str(index),  # index is the row label carried over from the sampled frame
        row['uid'],
        row['name'],
        final_test_name,
    ])

final_test_cases = pd.DataFrame(test_case_rows, columns=final_test_cases.columns)

final_test_cases

Unnamed: 0,UID,Theme,Category,Sub-category,Entity-Type,Test Case ID,OFAC List UID,Original Name,Test Case Name
0,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 187,34673,PASKAL OOO,PASKAL OOOO
1,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 29,9367,EIRIN FARM,EIRIIN FARM
2,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 38,10492,GHORB NOOH,GHORB NOOOH
3,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 175,32022,EDE 2 EOOD,EDEE 2 EOOD
4,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 89,16811,CJSC ZEST,CJSC ZZEST
5,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 158,28533,AL KAWTHAR,AL KAWTTHAR
6,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 127,23628,HASM,HASMM
7,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 61,12927,MAHAN AIR,MAHAAN AIR
8,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 147,26664,EVIL CORP,EVVIL CORP
9,UID-241,Names where name parts are Modified,Repetitions,Very Short Name,Entity,UID-241 - 156,28177,MINOCONGO,MIINOCONGO
