# In [None]:
# ===============================
# IMPORT LIBRARIES
# ===============================
from Bio.Seq import Seq
import matplotlib.pyplot as plt

# ===============================
# INPUT DNA SEQUENCES
# ===============================
sequence_A = Seq("ATGCGTCAGTCGCGATCGCTAGCGCCAGTCGATCGC")
sequence_B = Seq("CGCTAGCGCATCGCAGTCCGATCGCGTCAGTCGATC")

# ===============================
# 1️⃣ FIND LENGTH OF BOTH SEQUENCES
# ===============================
len_A = len(sequence_A)
len_B = len(sequence_B)

print("Length of Sequence A:", len_A)
print("Length of Sequence B:", len_B)

# ===============================
# 2️⃣ COUNT CODON (CGC)
# ===============================
codon = "CGC"

# Seq.count() reports non-overlapping matches at any offset; it does not
# restrict matches to a reading frame.
count_A = sequence_A.count(codon)
count_B = sequence_B.count(codon)

# Labels are built from `codon` so they cannot drift from the motif counted.
print(f"\nNumber of {codon} in Sequence A:", count_A)
print(f"Number of {codon} in Sequence B:", count_B)

# ===============================
# 3️⃣ FIND FIRST OCCURRENCE OF SUB-SEQUENCE (CAGTC)
# ===============================
subseq = "CAGTC"

# Seq.find() gives the 0-based index of the first match, or -1 when the
# sub-sequence is absent.
index_A = sequence_A.find(subseq)
index_B = sequence_B.find(subseq)

# Labels are built from `subseq` so they always name the motif searched for.
print(f"\nFirst index of {subseq} in Sequence A:", index_A)
print(f"First index of {subseq} in Sequence B:", index_B)

# ===============================
# 4️⃣ CREATE SEQUENCE C
# (First 15 nt of A + Last 10 nt of B)
# ===============================
sequence_C = sequence_A[:15] + sequence_B[-10:]

print("\nSequence C:", sequence_C)

# ===============================
# 5️⃣ REVERSE SEQUENCE C
# ===============================
# A step of -1 reverses the order of the bases only; this is not the
# reverse complement.
reverse_C = sequence_C[::-1]

print("Reversed Sequence C:", reverse_C)

# ===============================
# 6️⃣ NUCLEOTIDE FREQUENCY FUNCTION
# ===============================
def nucleotide_frequency(seq):
    """Count the occurrences of each of the bases A, C, G and T in ``seq``.

    Args:
        seq: Any object exposing ``count(sub)``, such as a ``str``.

    Returns:
        A dict with the keys "A", "C", "G" and "T" (in that order), each
        mapped to whatever ``seq.count`` reports for that letter. Other
        symbols in ``seq`` are not reported.
    """
    return {base: seq.count(base) for base in ("A", "C", "G", "T")}

# Build one base-count table per sequence.
freq_A, freq_B, freq_C = map(
    nucleotide_frequency, (sequence_A, sequence_B, sequence_C)
)

# Pair every table with its display name; the same pairs drive both the text
# report and the chart legend.
series = [
    ("Sequence A", freq_A),
    ("Sequence B", freq_B),
    ("Sequence C", freq_C),
]

print("\nNucleotide Frequency:")
for series_name, series_freq in series:
    print(series_name + ":", series_freq)

# ===============================
# 7️⃣ PLOT NUCLEOTIDE FREQUENCY
# ===============================
bases = ["A", "C", "G", "T"]

plt.figure(figsize=(8, 5))

bar_width = 0.25
x = range(len(bases))

# Grouped bar chart: each series is shifted right by one bar width per slot
# so the three bars for a base sit side by side.
for slot, (series_name, series_freq) in enumerate(series):
    positions = [i + slot * bar_width for i in x]
    heights = [series_freq[b] for b in bases]
    plt.bar(positions, heights, width=bar_width, label=series_name)

# Put each tick under the middle (second) bar of its group.
plt.xticks([i + bar_width for i in x], bases)
plt.xlabel("Nucleotide Base")
plt.ylabel("Frequency")
plt.title("Nucleotide Base Frequency")
plt.legend()

plt.show()
