In [1]:
import os
from Bio import SeqIO
import io
from Bio.Seq import Seq
import subprocess

In [2]:
from IPython.display import display, HTML
display(HTML("<style>.container { width:100% !important; }</style>"))

In [3]:
def make_raw_files_for_alignment(gene_sequence,annotated_genome_location,annotated_species_name,error_exon,query_fasta_sequence,query_length):
    for offset in range(3):
        translated_sequence = str(gene_sequence[offset:].translate()).split("*")
        for i in range(len(translated_sequence)):
            if len(translated_sequence[i])> 0.8*query_length:
                sequence_set = f">set{i+1}_frame{offset}\n{translated_sequence[i]}\n\n"
                # print(i+1, offset)
                
                with open(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment/{error_exon}_translated_genomic_sequence_{i+1}_frame{offset}.fa",'w') as out_file:
                    output = f"{query_fasta_sequence}\n\n{sequence_set}"
                    out_file.write(output)

In [4]:
def run_mafft(annotated_genome_location,annotated_species_name,error_exon):
    location = f'{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment'
    list_of_files_to_run_mafft_on = os.listdir(location)
    for file in list_of_files_to_run_mafft_on:
        if file.endswith(".fa"):
            command = f'"mafft" --localpair --maxiterate 16 --reorder --distout "{location}/{file}" > "{location}/alignment_{file}.txt"'
            # print(command)
            subprocess.run(f'{command}', shell=True, stderr = subprocess.DEVNULL) 
            # os.system(f'{command}')
            command = f'"mafft" --localpair --clustalout --maxiterate 16 --reorder "{location}/{file}" > "{location}/alignment_clustal_{file}.txt"'
            subprocess.run(f'{command}', shell=True, stderr = subprocess.DEVNULL) 
            
            # os.system(f'{command}')
    return(location)

In [5]:
def process_mafft_output(mafft_run_folder, error_exon):
    list_of_files_in_mafft_run_folder = os.listdir(mafft_run_folder)
    score_output = []
    score = 99
    min_score_sequence = ''
    alignment_file = ''
    for file in list_of_files_in_mafft_run_folder:
        if file.endswith(".fa.hat2"):
            with io.open(f"{mafft_run_folder}/{file}", 'r') as dist_matrix_file:
                dist_matrix_list = dist_matrix_file.readlines()
            
            sequence_name = dist_matrix_list[-2].rstrip().split("=")[1]
            distance_score = float(dist_matrix_list[-1].rstrip())
            if len(score_output) < 5:
                score_output.append( [sequence_name,distance_score])
            else:
                for i in range(len(score_output)):
                    score_at_this_index = score_output[i][1]
                    if distance_score < score_at_this_index:
                        score_output[i] = [sequence_name,distance_score]
                        break
            if distance_score < score:
                score = distance_score
                min_score_sequence = sequence_name
                alignment_file = f'alignment_{file.replace(".hat2",".txt")}'
    # print(score_output)
    print(f"min = {min_score_sequence}, {score}" )
    # score_out_merged = '\n'.join(score_output)
    print(f"5 top scores:\n{score_output}")
    print(f"{mafft_run_folder}/{alignment_file}")
    
    alignment_file = SeqIO.parse(f"{mafft_run_folder}/{alignment_file}", 'fasta')
    # print (records.id)
    fasta_start_position = 0
    fasta_end_position = 0
    start_switch = 0
    end_switch = 0
    alignment_name = ''
    for records in alignment_file:
        
        
        
        if error_exon in records.id:
            gap_counter = 0
            base_counter = 0
            for current_position in range(len(records.seq)):
                sequence_length = len(records.seq) - records.seq.count('-')
                # print(f"fasta_end_position {fasta_end_position} fasta_start_position {fasta_start_position}")
                # print(f"current_position = {current_position}, {len(records.seq)}")
                # print(records.seq[current_position])
                # print("fasta_start_position",fasta_start_position)
                # print("start_switch",start_switch)
                
                # print(gap_counter, base_counter)
                # print(5,0.2*sequence_length)
                if start_switch == 1 and records.seq[current_position] == "-" and gap_counter > 3 and (len(records.seq[:current_position]) - records.seq[:current_position].count('-')) < (0.1*sequence_length):
                #  :
                    # print("\n\nhere\n\n")
                    start_switch = 0
                    gap_counter = 0

                if "-" not in records.seq[current_position] and start_switch == 0 :
                    fasta_start_position = current_position
                    start_switch = 1
                
                    
                
                    
                if end_switch == 1 and "-" not in records.seq[current_position] and (len(records.seq[current_position:]) - records.seq[current_position:].count('-')) > 0.1*sequence_length :
                    end_switch = 0
                    gap_counter = 0
                
                    
                if start_switch == 1 and records.seq[current_position] == "-" and end_switch == 0:
                    # print(f"base_counter {base_counter}")
                    # print(f"fasta_end_position {fasta_end_position}")
                    
                    # print(f"fasta_end_position {fasta_end_position}")
                    
                    fasta_end_position = current_position
                    end_switch = 1
                if "-" in records.seq[current_position]:
                    gap_counter += 1
                else:
                    gap_counter = 0
                    base_counter += 1
        else:
            alignment_name = records.id
            if fasta_end_position == 0:
                
                fasta_end_position = current_position
            end_switch = 1
            start_switch = 1

        if start_switch == 1 and end_switch == 1:
            print(fasta_start_position, fasta_end_position)
            gene_sequence = records.seq[fasta_start_position:fasta_end_position]
            print(f"{records.id}\n{gene_sequence}")
    return(gene_sequence, alignment_name)

# process_mafft_output(mafft_run_folder, error_exon)

In [6]:
def get_genome_file(genome_location,species):
    list_of_files_in_genome_folder = os.listdir(f"{genome_location}/{species}")
    for file in list_of_files_in_genome_folder:
        if file.endswith("_genomic.fna"):
            genome_file = file
    return(genome_file)  

def get_annotated_genome_name(annotated_genome_location, species):
    list_of_annotated_genomes = os.listdir(annotated_genome_location)
  
    # print(annotated_species)
    for annotated_species in list_of_annotated_genomes:
        if annotated_species.endswith(species):
            return(annotated_species)
             
    if annotated_species_name == '':
        print(f"Error with annotated species name")
        assert False

def check_and_make_folders(annotated_genome_location,annotated_species_name,error_exon):
    list_of_files_inside_annotated_species_folder = os.listdir(f"{annotated_genome_location}/{annotated_species_name}")

    if f"Period_gene_genomic_sequence_individual_exon_{query_species}" not in list_of_files_inside_annotated_species_folder:
        os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}")
    
    list_of_exon_directories = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/")
    
    if error_exon not in list_of_exon_directories:
        os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}")
        os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment")
    elif error_exon in list_of_exon_directories:
        list_of_folders_1 = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}")
        if "for_alignment" not in list_of_folders_1:
            os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment")
        list_of_files = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment")
        for file in list_of_files:
            os.remove(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_alignment/{file}")


In [7]:
def get_gene_sequence(genome_location, species, genome_file, scaffold,gene_start,gene_end,complement,annotated_genome_location,annotated_species_name):
    from Bio import SeqIO
    print("Getting Gene")
    list_of_files_inside_annotated_species_folder = os.listdir(f"{annotated_genome_location}/{annotated_species_name}")
    # print(list_of_files_inside_annotated_species_folder)
    # print(
    if f"Period_gene_genomic_sequence_individual_exon_{query_species}" not in list_of_files_inside_annotated_species_folder:
        os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}")

    list_of_files_inside_indiv_exon_folder = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}")
    if "temp" not in list_of_files_inside_indiv_exon_folder:
         os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/temp")

    # os.system(f'samtools faidx "{genome_location}/{species}/{genome_file}"')
    # subprocess.run("pwd")
    subprocess.run(f'samtools faidx "{genome_location}/{species}/{genome_file}"', shell = True, stderr = subprocess.DEVNULL)
    # os.system(f'samtools faidx "{genome_location}/{species}/{genome_file}" {scaffold}:{gene_start}-{gene_end} > "{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/temp/temp_genome.fa"')
    subprocess.run(f'samtools faidx "{genome_location}/{species}/{genome_file}" {scaffold}:{gene_start}-{gene_end} > "{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/temp/temp_genome.fa"', shell = True, stderr = subprocess.DEVNULL)
    genome = SeqIO.parse(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/temp/temp_genome.fa", "fasta")
    for entries in genome:
        gene_sequence = entries.seq
        if complement == "1":
            gene_sequence = gene_sequence.reverse_complement()
        break
    # print(gene_sequence)
    return (gene_sequence)

In [8]:
def mafft_process(previous_exon_coordinates,
                  next_exon_coordinates,
                  current_exon_coordinates,
                  query_species,
                  query_transcript,
                  query_location,
                  annotated_genome_location,
                 genome_location):
    query_exon = current_exon_coordinates[6].split("query")[-1][1:]
    error_exon = query_exon
    # print("AA")
    genome_file = get_genome_file(genome_location,species)
    
    upstream_exon_line, downstream_exon_line = previous_exon_coordinates.split(","),next_exon_coordinates.split(",")
    complement,scaffold = upstream_exon_line[4], upstream_exon_line[1]

    if complement == "0":
        gene_start = min(int(upstream_exon_line[2]),int(upstream_exon_line[3]))
        gene_end = max(int(downstream_exon_line[2]),int(downstream_exon_line[3]))
    
    if complement == "1":
        gene_start = min(int(downstream_exon_line[2]),int(downstream_exon_line[3]))
        gene_end = max(int(upstream_exon_line[2]),int(upstream_exon_line[3]))
    
    
    with open(f"{query_location}/{query_species}/{query_transcript}/query_{query_exon}.fa", 'r') as query_file:
        query_file_list = query_file.readlines()
        query_fasta_sequence = "".join(query_file_list)
        left_overhang = query_file_list[0].split("Frame")[1][1]
        right_overhang = query_file_list[0].split("rightoh")[1][1]
        original_query_name = query_file_list[0]
        original_query = query_file_list[1]
        
    query_length = len(query_fasta_sequence.split("\n")[1])
    
    annotated_species_name = get_annotated_genome_name(annotated_genome_location, species)
    # print(annotated_species_name)

    # print(annotated_genome_location)
    gene_sequence = get_gene_sequence(genome_location, species, genome_file, scaffold,gene_start,gene_end,complement,annotated_genome_location,annotated_species_name)
    # assert False
    check_and_make_folders(annotated_genome_location,annotated_species_name,error_exon)
    
    
    make_raw_files_for_alignment(gene_sequence,annotated_genome_location,annotated_species_name,error_exon,query_fasta_sequence,query_length)
    
    return(annotated_species_name, error_exon,species, genome_file,gene_sequence,left_overhang,right_overhang,scaffold, original_query_name,original_query )


In [None]:
family_group = "5.Coliadinae"
blast_output_location = f"/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/{family_group}/1.Blast_result"
species_list = os.listdir(blast_output_location)

if "desktop.ini" in species_list:
    species_list.remove("desktop.ini")
species_list = ["Eurema_hecabe","Phoebis_sennae","Zerene_cesonia","Leptidea_juvernica","Leptidea_reali","Leptidea_sinapis"]
for species in species_list:
    annotated_genome_location = f"/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/{family_group}/1.Blast_result"
    query_location = f"/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/{family_group}/1.Query"
    list_of_query_species = os.listdir(query_location)
    if "desktop.ini" in list_of_query_species:
        list_of_query_species.remove("desktop.ini")
#     list_of_query_species = ["Papilio_xuthus"]
    for query_species in list_of_query_species:
        list_of_query_transcripts = os.listdir(f"{query_location}/{query_species}")
        if "desktop.ini" in list_of_query_transcripts:
            list_of_query_transcripts.remove("desktop.ini")
        for query_transcript in list_of_query_transcripts:


            genome_location = "/mnt/f/Genomes_2023-12-26"



            output_coordinate_file = "Species," + "Scaffold," + "Start," + "Stop," + "Complement," + "Error," + "Gene,"+ "Query_start," + "Query_stop,"+ "Query_Length," +  "AG_GT," + "Spliceator_prediction\n"
            exons_to_check_list = ["Exon_2","Exon_3","Exon_4","Exon_5","Exon_6","Exon_7","Exon_8","Exon_9","Exon_10","Exon_11","Exon_12","Exon_13","Exon_14","Exon_15"]
#             exons_to_check_list = ["Exon_9"]

            list_of_files_in_species_folder = os.listdir(f"{blast_output_location}/{species}")
            coordinate_file_name = ''
        #     print(list_of_files_in_species_folder)
            for file_names in list_of_files_in_species_folder:

                if file_names.endswith("_coordinates_old.csv"):
                    coordinate_file_name = file_names
            if coordinate_file_name =='':
                print(f"Coordinate file error")
                assert False

            with io.open(f"{blast_output_location}/{species}/{coordinate_file_name}", 'r') as temp_file_open:
                coordinate_file_lines = temp_file_open.readlines()
            # print(coordinate_file_lines[0])
            for exons_to_check in exons_to_check_list:

                for i in range(1,len(coordinate_file_lines)):
                    coordinate_file_lines_split = coordinate_file_lines[i].split(",")
                    current_exon_coordinates = coordinate_file_lines[i].split(",")
                    if i == 1:
                        scaffold_first_exon = coordinate_file_lines[i].split(",")[1]
                        first_exon_start, first_exon_end = coordinate_file_lines[i].split(",")[2],coordinate_file_lines[i].split(",")[3]
                    # if coordinate_file_lines_split[5] == "Y":
                    if  coordinate_file_lines_split[6].endswith(exons_to_check):
                        if i == 1:
                            print(f'First Exon has errors\n{coordinate_file_lines[i]}')
                            assert False
                        else:
                            print(f"Scaffold = {scaffold_first_exon}, start = {first_exon_start}, end = {first_exon_end}")
                            print(coordinate_file_lines[i])
                            # process_current_exon = input("Error Found! Process?")
                            process_current_exon = 'y'
                            if process_current_exon.lower()[0] == "y":
                                if i>2:
                                    previous_exon_number = i-2
                                else:
                                    previous_exon_number = i-1
                                if i+2 <=int(exons_to_check_list[-1].split("_")[1]):
                                    next_exon_number = i+2
                                else:
                                    next_exon_number = i+1
                                if i >= int(exons_to_check_list[-1].split("_")[1]):
                                    next_exon_number = int(exons_to_check_list[-1].split("_")[1])
#                                     continue

                                '''
                                the above code ensures that missing exons do not cause issues
                                '''

                                previous_exon_coordinates = ''
                                next_exon_coordinates = ''
                                while True:
                                    print(previous_exon_number)
                                    if coordinate_file_lines[previous_exon_number].split(",")[5] == "N":
                                        previous_exon_coordinates = coordinate_file_lines[previous_exon_number]
                                        break
                                    # else:
                                    #     proceed_prompt = input(f"Previous exon coordinate\n{coordinate_file_lines[previous_exon_number]}\nProceed?")
                                    #     if proceed_prompt.lower()[0] == "y":
                                    #         previous_exon_coordinates = coordinate_file_lines[previous_exon_number]
                                    #         break
                                    previous_exon_number -= 1
                                while True:
                                    print(next_exon_number)
                                    try:
                                        if coordinate_file_lines[next_exon_number].split(",")[5] == "N":
                                            next_exon_coordinates = coordinate_file_lines[next_exon_number]
                                            break
                                    except:
                                        if coordinate_file_lines[next_exon_number-1].split(",")[5] == "N":
                                            next_exon_coordinates = coordinate_file_lines[next_exon_number-1]
                                            break
                                   
                                    next_exon_number += 1


                                print(previous_exon_coordinates)
                                print(next_exon_coordinates)
                                annotated_species_name, error_exon, species, genome_file, gene_sequence,left_overhang,right_overhang,scaffold,original_query_name, original_query = mafft_process(previous_exon_coordinates,
                                                                                                                                  next_exon_coordinates,
                                                                                                                                  current_exon_coordinates,
                                                                                                                                  query_species,
                                                                                                                                  query_transcript,
                                                                                                                                  query_location,
                                                                                                                                  annotated_genome_location,
                                                                                                                                     genome_location)

                                mafft_run_folder = run_mafft(annotated_genome_location,annotated_species_name,error_exon)

                                possible_gene_sequence, alignment_name = process_mafft_output(mafft_run_folder, error_exon)

                                print(f"Original query = {original_query}")
                                print(f"New query = {possible_gene_sequence}")
                                
                                list_of_folders_inside_exon_folder = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}")
                                if "for_blast" not in list_of_folders_inside_exon_folder:
                                    os.mkdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_blast")
                                else:
                                    list_of_files = os.listdir(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_blast")
                                    for file in list_of_files:
                                        os.remove(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_blast/{file}")


                                with open(f"{annotated_genome_location}/{annotated_species_name}/Period_gene_genomic_sequence_individual_exon_{query_species}/{error_exon}/for_blast/new_query.txt",'w') as query_file:
                                    query = f">Query_{error_exon}_{alignment_name}\n{possible_gene_sequence}"
                                    query_file.write(query)
                    

Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6805578,6806125,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_0_query_Exon_2,1,182,182

1
4
Colias_behrii,JARWMC010000003.1,6804607,6804703,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_1_query_Exon_1,1,32,32

Colias_behrii,JARWMC010000003.1,6806922,6807151,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_0_query_Exon_4,1,76,76

Getting Gene
min = set19_frame1, 0.099
5 top scores:
[['set19_frame1', 0.099]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_2/for_alignment/alignment_Exon_2_translated_genomic_sequence_19_frame1.fa.txt
4 187
Zerene_cesonia_XM_038355360.1_Frame_2_rightoh_0_query_Exon_2
ALESILHNILTEDKNLRTYRRSISFGQNIKKDIIPLLINVKDEKTIELLIKILVNLTIPVECLLSVETISNTDIGRHTIFEINSLLASTKSAFIDHRATKVIIEFLKKNSDVEQKSKLSSEQCTNISNTLLFLRNILHIPEDVNNISSNYNSPPHTIQNQILWN

min = set30_frame2, 0.076
5 top scores:
[['set30_frame2', 0.076], ['set26_frame2', 1.69], ['set44_frame2', 1.708], ['set17_frame0', 1.741], ['set45_frame0', 1.772]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_8/for_alignment/alignment_Exon_8_translated_genomic_sequence_30_frame2.fa.txt
0 33
Zerene_cesonia_XM_038355360.1_Frame_0_rightoh_2_query_Exon_8
DLVVTNHILLMFLDSVMKLPDYKGSGKLVDHIK
0 33
set30_frame2
DLVVTNHILLMFLDSVMKLPDYKGSAKLIDHIK
Original query = DLVVTNHILLMFLDSVMKLPDYKGSGKLVDHIK
New query = DLVVTNHILLMFLDSVMKLPDYKGSAKLIDHIK
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6809014,6809212,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_0_query_Exon_9,1,66,66

7
11
Colias_behrii,JARWMC010000003.1,6808344,6808535,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_0_query_Exon_7,1,64,64

Colias_behrii,JARWM

Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6812823,6813026,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_behrii,JARWMC010000003.1,6810753,6810921,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_behrii,JARWMC010000003.1,6812823,6813026,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set45_frame1, 0.782
5 top scores:
[['set2_frame2', 1.817], ['set40_frame0', 1.866], ['set15_frame1', 1.845], ['set29_frame1', 1.858], ['set45_frame1', 0.782]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_15/for_alignment/alignment_Exon_15_translated_genomic_sequence_45_frame1.fa.txt
11 78
set45_frame1
TIIQSEIP-ANKPDGQETTAKTSRTPEINKEECYVAAESTLLIHTDNEVKGEPSYFNISQAESEYCN
Original query = TIIQSEIQDMSKLVGKEPTANTL

Getting Gene
min = set39_frame2, 0.306
5 top scores:
[['set39_frame2', 0.306], ['set44_frame2', 1.815], ['set5_frame1', 1.8], ['set8_frame1', 1.759], ['set22_frame1', 1.844]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_39_frame2.fa.txt
0 64
Pieris_brassicae_XM_045665865.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
0 64
set39_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6808638,6808738,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Col

Getting Gene
min = set49_frame1, 1.016
5 top scores:
[['set49_frame1', 1.016], ['set1_frame2', 1.569], ['set5_frame2', 1.627], ['set34_frame2', 1.707], ['set15_frame2', 1.725]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_49_frame1.fa.txt
23 47
Pieris_brassicae_XM_045665865.1_Frame_1_rightoh_2_query_Exon_14
ETTGAGWLQVVQKSHEIKFTMDRE
23 47
set49_frame1
ERAVPSWLDVVQKSQEFKLTLELE
Original query = ETTGAGWLQVVQKSHEIKFTMDRE
New query = ERAVPSWLDVVQKSQEFKLTLELE
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6812823,6813026,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_behrii,JARWMC010000003.1,6810753,6810921,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_behrii,JARWMC010000003.1

min = set39_frame2, 0.339
5 top scores:
[['set39_frame2', 0.339], ['set18_frame0', 1.846], ['set5_frame1', 1.753], ['set8_frame1', 1.811], ['set44_frame2', 1.875]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_39_frame2.fa.txt
0 64
Maniola_jurtina_XM_045907399.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
0 64
set39_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6808638,6808738,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_behrii,JA

min = set49_frame1, 0.726
5 top scores:
[['set49_frame1', 0.726], ['set56_frame1', 1.559], ['set4_frame2', 1.766], ['set5_frame2', 1.774], ['set34_frame2', 1.774]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_49_frame1.fa.txt
13 47
Maniola_jurtina_XM_045907399.1_Frame_1_rightoh_2_query_Exon_14
PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
13 47
set49_frame1
PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Original query = PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
New query = PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6812823,6813026,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_behrii,JARWMC010000003.1,6810753,6810921,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias

min = set39_frame2, 0.0
5 top scores:
[['set39_frame2', 0.0], ['set18_frame0', 1.832], ['set5_frame1', 1.803], ['set8_frame1', 1.762], ['set34_frame1', 1.859]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_39_frame2.fa.txt
0 64
Colias_croceus_XM_045654792.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set39_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6808638,6808738,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_behrii,JARWMC01

Scaffold = JARWMC010000003.1, start = 6804607, end = 6804703
Colias_behrii,JARWMC010000003.1,6812385,6812489,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,34,34

12
15
Colias_behrii,JARWMC010000003.1,6810396,6810596,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_behrii,JARWMC010000003.1,6812823,6813026,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set49_frame1, 0.127
5 top scores:
[['set49_frame1', 0.127], ['set56_frame1', 1.654], ['set1_frame2', 1.736], ['set5_frame2', 1.756], ['set19_frame2', 1.784]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_behrii/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_49_frame1.fa.txt
13 47
Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNMACDEHAVPSWLDVVQKSQEFKLTLELE
13 47
set49_frame1
PGSSFN

Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6063957,6064148,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_0_query_Exon_7,1,64,64

5
9
Colias_croceus,NC_059539.1,6062827,6063119,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_5,1,97,97

Colias_croceus,NC_059539.1,6064592,6064790,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_0_query_Exon_9,1,66,66

Getting Gene
min = set27_frame2, 0.066
5 top scores:
[['set1_frame0', 1.84], ['set4_frame0', 1.772], ['set5_frame1', 1.786], ['set20_frame2', 1.81], ['set27_frame2', 0.066]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_27_frame2.fa.txt
0 64
Zerene_cesonia_XM_038355360.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKDILLDLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set27_frame2
VVTAIREFV

Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6074184,6074288,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,34,34

12
15
Colias_croceus,NC_059539.1,6065937,6066137,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_croceus,NC_059539.1,6074947,6075150,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set166_frame1, 0.122
5 top scores:
[['set166_frame1', 0.122], ['set44_frame2', 1.648], ['set190_frame2', 1.699], ['set14_frame2', 1.734], ['set179_frame2', 1.746]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_166_frame1.fa.txt
8 42
Zerene_cesonia_XM_038355360.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNIACDERSVPSWLDVVQKSQEFKLTLELE
8 42
set166_frame1
PGSSFNMACDEHAVPSWLDV

Getting Gene
min = set27_frame2, 0.306
5 top scores:
[['set1_frame0', 1.825], ['set4_frame0', 1.799], ['set5_frame1', 1.75], ['set20_frame2', 1.778], ['set27_frame2', 0.306]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_27_frame2.fa.txt
0 64
Pieris_brassicae_XM_045665865.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
0 64
set27_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6064225,6064325,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_croceu

Getting Gene
min = set166_frame1, 1.024
5 top scores:
[['set166_frame1', 1.024], ['set168_frame2', 1.555], ['set71_frame2', 1.587], ['set91_frame2', 1.629], ['set115_frame2', 1.643]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_166_frame1.fa.txt
18 42
Pieris_brassicae_XM_045665865.1_Frame_1_rightoh_2_query_Exon_14
ETTGAGWLQVVQKSHEIKFTMDRE
18 42
set166_frame1
EHAVPSWLDVVQKSQEFKLTLELE
Original query = ETTGAGWLQVVQKSHEIKFTMDRE
New query = EHAVPSWLDVVQKSQEFKLTLELE
Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6074947,6075150,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_croceus,NC_059539.1,6066302,6066467,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,1,54,54

Colias_croceus,NC_059539.1,6074947,607

min = set27_frame2, 0.339
5 top scores:
[['set1_frame0', 1.818], ['set4_frame0', 1.835], ['set5_frame1', 1.74], ['set20_frame2', 1.83], ['set27_frame2', 0.339]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_27_frame2.fa.txt
0 64
Maniola_jurtina_XM_045907399.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
0 64
set27_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6064225,6064325,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_croceus,NC_059539.1,60

Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6074184,6074288,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,34,34

12
15
Colias_croceus,NC_059539.1,6065937,6066137,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_croceus,NC_059539.1,6074947,6075150,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set166_frame1, 0.732
5 top scores:
[['set166_frame1', 0.732], ['set190_frame2', 1.616], ['set168_frame2', 1.689], ['set14_frame2', 1.72], ['set53_frame1', 1.729]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_166_frame1.fa.txt
8 42
Maniola_jurtina_XM_045907399.1_Frame_1_rightoh_2_query_Exon_14
PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
8 42
set166_frame1
PGSSFNMACDEHAVPSWLD

min = set27_frame2, 0.0
5 top scores:
[['set1_frame0', 1.811], ['set4_frame0', 1.773], ['set5_frame1', 1.778], ['set20_frame2', 1.781], ['set27_frame2', 0.0]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_27_frame2.fa.txt
0 64
Colias_croceus_XM_045654792.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set27_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6064225,6064325,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_croceus,NC_059539.1,606341

Scaffold = NC_059539.1, start = 6060936, end = 6061032
Colias_croceus,NC_059539.1,6074184,6074288,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,34,34

12
15
Colias_croceus,NC_059539.1,6065937,6066137,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_croceus,NC_059539.1,6074947,6075150,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set166_frame1, 0.0
5 top scores:
[['set166_frame1', 0.0], ['set44_frame2', 1.626], ['set10_frame0', 1.655], ['set190_frame2', 1.715], ['set79_frame1', 1.724]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_croceus/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_166_frame1.fa.txt
8 42
Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNMACDEHAVPSWLDVVQKSQEFKLTLELE
8 42
set166_frame1
PGSSFNMACDEHAVPSWLDVVQKSQ

Getting Gene
min = set20_frame1, 0.099
5 top scores:
[['set1_frame0', 1.837], ['set38_frame2', 1.847], ['set4_frame1', 1.799], ['set8_frame1', 1.802], ['set20_frame1', 0.099]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_20_frame1.fa.txt
0 64
Zerene_cesonia_XM_038355360.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKDILLDLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set20_frame1
VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSVHICQHDKDILLDLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,83183,83283,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_e

min = set9_frame0, 0.03
5 top scores:
[['set11_frame1', 1.693], ['set1_frame2', 1.759], ['set9_frame0', 0.03], ['set27_frame1', 1.796], ['set20_frame0', 1.701]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_9_frame0.fa.txt
3 37
Zerene_cesonia_XM_038355360.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNIACDERSVPSWLDVVQKSQEFKLTLELE
3 37
set9_frame0
PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Original query = PGSSFNIACDERSVPSWLDVVQKSQEFKLTLELE
New query = PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,85992,86192,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_eurytheme,CAJQZN010043793.1,85245,85416,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_eurytheme,C

Getting Gene
min = set20_frame1, 0.313
5 top scores:
[['set1_frame0', 1.803], ['set38_frame2', 1.833], ['set4_frame1', 1.787], ['set8_frame1', 1.778], ['set20_frame1', 0.313]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_20_frame1.fa.txt
0 64
Pieris_brassicae_XM_045665865.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
0 64
set20_frame1
VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,83183,83283,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Coli

min = set9_frame0, 1.016
5 top scores:
[['set1_frame2', 1.569], ['set28_frame2', 1.604], ['set30_frame1', 1.726], ['set27_frame1', 1.736], ['set9_frame0', 1.016]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_9_frame0.fa.txt
13 37
Pieris_brassicae_XM_045665865.1_Frame_1_rightoh_2_query_Exon_14
ETTGAGWLQVVQKSHEIKFTMDRE
13 37
set9_frame0
ERAVPSWLDVVQKSQEFKLTLELE
Original query = ETTGAGWLQVVQKSHEIKFTMDRE
New query = ERAVPSWLDVVQKSQEFKLTLELE
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,85992,86192,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_eurytheme,CAJQZN010043793.1,85245,85416,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_eurytheme,CAJQZN010043793.1,85992,86192,0,N

Getting Gene
min = set20_frame1, 0.355
5 top scores:
[['set1_frame0', 1.818], ['set12_frame0', 1.835], ['set4_frame1', 1.753], ['set8_frame1', 1.83], ['set20_frame1', 0.355]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_20_frame1.fa.txt
0 64
Maniola_jurtina_XM_045907399.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
0 64
set20_frame1
VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,83183,83283,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_

min = set9_frame0, 0.726
5 top scores:
[['set3_frame0', 1.716], ['set13_frame2', 1.72], ['set9_frame0', 0.726], ['set15_frame0', 1.787], ['set20_frame0', 1.623]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_9_frame0.fa.txt
3 37
Maniola_jurtina_XM_045907399.1_Frame_1_rightoh_2_query_Exon_14
PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
3 37
set9_frame0
PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Original query = PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
New query = PGSSFNIACDERAVPSWLDVVQKSQEFKLTLELE
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,85992,86192,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
Colias_eurytheme,CAJQZN010043793.1,85245,85416,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_eurythem

min = set20_frame1, 0.034
5 top scores:
[['set1_frame0', 1.808], ['set38_frame2', 1.828], ['set4_frame1', 1.798], ['set8_frame1', 1.781], ['set20_frame1', 0.034]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_20_frame1.fa.txt
0 64
Colias_croceus_XM_045654792.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set20_frame1
VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQYDKNILINLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,83183,83283,0,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_eurytheme,CAJQ

Scaffold = CAJQZN010043793.1, start = 79574, end = 79670
Colias_eurytheme,CAJQZN010043793.1,85503,85607,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,34,34

12
15
Colias_eurytheme,CAJQZN010043793.1,84886,85086,0,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_eurytheme,CAJQZN010043793.1,85992,86192,0,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

Getting Gene
min = set9_frame0, 0.127
5 top scores:
[['set1_frame2', 1.736], ['set7_frame0', 1.802], ['set9_frame0', 0.127], ['set24_frame2', 1.808], ['set20_frame0', 1.715]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_eurytheme/Period_gene_genomic_sequence_individual_exon_Colias_croceus/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_9_frame0.fa.txt
3 37
Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNMACDEHAVPSWLDVVQKSQEFKLTLELE
3 37
set9_frame0
PGSSFNIACDERAVPS

Getting Gene
min = set22_frame2, 0.079
5 top scores:
[['set22_frame2', 0.079], ['set27_frame0', 1.863], ['set36_frame0', 1.863], ['set5_frame1', 1.84], ['set13_frame2', 1.81]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_22_frame2.fa.txt
0 64
Zerene_cesonia_XM_038355360.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSVHICQHDKDILLDLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
0 64
set22_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSVHICQHDKDILLDLQMKMCETEELRSLLVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010025505.1,6871,6971,1,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_nastes,CAJQ

Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010037571.1,657,761,0,Y,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_14,1,32,34

12
15
16
Colias_nastes,CAJQZM010025505.1,5037,5237,1,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_1_query_Exon_12,1,66,66

Colias_nastes,CAJQZM010025505.1,3593,3776,1,N,Colias_croceus_XM_045654792.1_Frame_1_rightoh_0_query_Exon_16,1,61,61

Getting Gene
min = set19_frame1, 0.076
5 top scores:
[['set19_frame1', 0.076], ['set33_frame1', 1.637], ['set25_frame0', 1.686], ['set30_frame0', 1.718], ['set30_frame2', 1.727]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Zerene_cesonia/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_19_frame1.fa.txt
9 43
Zerene_cesonia_XM_038355360.1_Frame_1_rightoh_2_query_Exon_14
PGSSFNIACDERSVPSWLDVVQKSQEFKLTLELE
9 43
set19_frame1
PGSSFNIACEERAVPSWLDVVQKSQEFKL

Getting Gene
min = set22_frame2, 0.32
5 top scores:
[['set22_frame2', 0.32], ['set27_frame0', 1.839], ['set23_frame2', 1.849], ['set5_frame1', 1.788], ['set13_frame2', 1.778]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_22_frame2.fa.txt
0 64
Pieris_brassicae_XM_045665865.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
0 64
set22_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Original query = VVTAIREFVQAIEVYQKSNHISQKDKEVLVQLQMKMSETNELRSLFVLLLRHYNPKYHSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010025505.1,6871,6971,1,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_nastes,

Getting Gene
min = set19_frame1, 1.016
5 top scores:
[['set19_frame1', 1.016], ['set1_frame2', 1.569], ['set30_frame2', 1.605], ['set19_frame2', 1.726], ['set36_frame0', 1.665]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Pieris_brassicae/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_19_frame1.fa.txt
19 43
Pieris_brassicae_XM_045665865.1_Frame_1_rightoh_2_query_Exon_14
ETTGAGWLQVVQKSHEIKFTMDRE
19 43
set19_frame1
ERAVPSWLDVVQKSQEFKLTLELE
Original query = ETTGAGWLQVVQKSHEIKFTMDRE
New query = ERAVPSWLDVVQKSQEFKLTLELE
Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010025505.1,3919,4122,1,Y,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
16
Colias_nastes,CAJQZM010025505.1,4720,4894,1,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_nastes,CAJQZM010025505.1,3593,3776,1,N

min = set22_frame2, 0.353
5 top scores:
[['set22_frame2', 0.353], ['set23_frame2', 1.885], ['set36_frame0', 1.848], ['set5_frame1', 1.77], ['set13_frame2', 1.83]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_7/for_alignment/alignment_Exon_7_translated_genomic_sequence_22_frame2.fa.txt
0 64
Maniola_jurtina_XM_045907399.1_Frame_0_rightoh_0_query_Exon_7
VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
0 64
set22_frame2
VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Original query = VVTAIREFVQAIEVYKKSAHICNNDKDELDKLQVKMCETDELRSLLVLLLRYYNPKYQSKQYLQ
New query = VVTAIREFVQAIEVYKKSVHICQHDKNILINLQMKMCETEELRSLLVLLLRHYNPRYHSKQYLQ
Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010025505.1,6871,6971,1,N,Colias_croceus_XM_045654792.1_Frame_0_rightoh_2_query_Exon_8,1,33,33

6
10
Colias_nastes,CAJQZM010025505

Getting Gene
min = set19_frame1, 0.772
5 top scores:
[['set19_frame1', 0.772], ['set30_frame2', 1.708], ['set25_frame0', 1.666], ['set30_frame0', 1.726], ['set33_frame1', 1.782]]
/mnt/h/My Drive/Circadian Rhythm Genes Project/7.Timeless Exon Analysis/5.Coliadinae/1.Blast_result/Colias_nastes/Period_gene_genomic_sequence_individual_exon_Maniola_jurtina/Exon_14/for_alignment/alignment_Exon_14_translated_genomic_sequence_19_frame1.fa.txt
9 43
Maniola_jurtina_XM_045907399.1_Frame_1_rightoh_2_query_Exon_14
PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
9 43
set19_frame1
PGSSFNIACEERAVPSWLDVVQKSQEFKLTLELE
Original query = PGSSFTTTDDNVTKPSWLEVVQKSQEYKITLDLG
New query = PGSSFNIACEERAVPSWLDVVQKSQEFKLTLELE
Scaffold = CAJQZM010003197.1, start = 2118, end = 2214
Colias_nastes,CAJQZM010025505.1,3919,4122,1,Y,Colias_croceus_XM_045654792.1_Frame_1_rightoh_2_query_Exon_15,1,67,67

13
15
16
Colias_nastes,CAJQZM010025505.1,4720,4894,1,N,Colias_croceus_XM_045654792.1_Frame_2_rightoh_2_query_Exon_13,2,54,54

Colias_n