In [3]:
def check_gene_expression(expression):
    """
    Map a numeric gene expression value onto a named expression band.

    Parameters:
    expression (float): The numeric gene expression value.

    Returns:
    str: "High" (>= 1000), "Moderate" (>= 500), "Low" (>= 100),
    or "Undetected" for anything that meets none of those floors.
    """
    # Bands are listed from the highest floor down, so the first floor the
    # value reaches is the correct band and no upper-bound check is needed.
    bands = (
        (1000, "High"),
        (500, "Moderate"),
        (100, "Low"),
    )
    for floor, label in bands:
        if expression >= floor:
            return label

    # Nothing matched: the value is below the lowest floor.
    return "Undetected"

# Demo: classify one sample value from each expression band
expression_values = [1200, 800, 450, 80]

# map() is lazy, so each value is classified right before its line is printed
classifications = map(check_gene_expression, expression_values)
for value, classification in zip(expression_values, classifications):
    print(f"Expression Value: {value} - Classification: {classification}")

Expression Value: 1200 - Classification: High
Expression Value: 800 - Classification: Moderate
Expression Value: 450 - Classification: Low
Expression Value: 80 - Classification: Undetected


In [4]:
# Expression measurements to average
gene_expression_values = [1500, 2000, 2500, 3000, 3500]

# Running total and number of values seen; both stay 0 if the list is empty
total_sum, count = 0, 0

# Single pass with a for loop: enumerate(start=1) keeps count equal to the
# number of values consumed so far while the total is accumulated
for count, value in enumerate(gene_expression_values, start=1):
    total_sum += value

# Mean of the values, falling back to 0 when there was nothing to average
if count > 0:
    average_expression = total_sum / count
else:
    average_expression = 0

# Report the mean with two decimal places
print(f"The average gene expression value is: {average_expression:.2f}")

The average gene expression value is: 2500.00


In [5]:
# Expression measurements to scan
gene_expression_values = [1, 1, 2, 3, 5, 8, 13, 21]

# Values strictly greater than this cut-off are counted
threshold = 10

# Number of hits so far and the position of the next element to inspect
count, index = 0, 0

# Walk the list by position with a while loop
while index < len(gene_expression_values):
    expression = gene_expression_values[index]
    index += 1  # advance first so the loop always makes progress
    if expression > threshold:
        count += 1

# Report how many values exceeded the cut-off
print(f"The number of genes with expression values above {threshold} is: {count}")

The number of genes with expression values above 10 is: 2


In [7]:
def count_gene_occurrences(gene_list):
    """
    Tally how many times each gene name appears in a list.

    Parameters:
    gene_list (list): Gene names; a repeated name is counted once per appearance.

    Returns:
    dict: Maps each distinct gene name to the number of times it appeared.
    """
    tally = {}

    for name in gene_list:
        # .get() supplies 0 the first time a name is seen, so new and
        # already-known names share a single update path.
        tally[name] = tally.get(name, 0) + 1

    return tally

# Sample input with repeated names: GeneA twice, GeneB three times, GeneC once
test_genes = [
    'GeneA', 'GeneB', 'GeneA',
    'GeneC', 'GeneB', 'GeneB',
]

# Tally the sample and show the resulting name -> count mapping
result = count_gene_occurrences(test_genes)
print(result)

{'GeneA': 2, 'GeneB': 3, 'GeneC': 1}


In [9]:
def compute_gc_content(dna_sequence):
    """
    Compute what percentage of a DNA sequence is made up of G and C.

    Parameters:
    dna_sequence (str): The DNA sequence to analyze; letter case is ignored.

    Returns:
    float: G plus C occurrences divided by the full sequence length, times 100.
    An empty sequence yields 0.0.
    """
    # Normalize case once so lowercase 'g'/'c' are counted as well
    bases = dna_sequence.upper()

    # Total occurrences of the two bases of interest
    gc_total = sum(bases.count(nucleotide) for nucleotide in ("G", "C"))

    # Every character counts toward the denominator
    size = len(bases)
    if size == 0:
        # Nothing to divide by: report 0% instead of raising
        return 0.0

    return gc_total / size * 100

# Demo: 5 of the 9 bases in this sequence are G or C
dna_seq = "ATGCGTACG"
gc_percentage = compute_gc_content(dna_seq)

# Show the percentage rounded to two decimal places
print(f"GC Content: {gc_percentage:.2f}%")

GC Content: 55.56%


In [10]:
def compute_gc_content(dna_sequence):
    """
    Return the share of G and C bases in a DNA sequence, as a percentage.

    Parameters:
    dna_sequence (str): The DNA sequence to analyze; upper- and lowercase
    letters are treated alike.

    Returns:
    float: (G count + C count) / sequence length * 100, or 0.0 when the
    sequence is empty.
    """
    # Work on an uppercase copy so the counts are case-insensitive
    sequence = dna_sequence.upper()
    gc_bases = sequence.count('G') + sequence.count('C')
    n_bases = len(sequence)

    # The conditional guards the division for an empty sequence
    return gc_bases / n_bases * 100 if n_bases != 0 else 0.0

# Sequence under test, kept in a variable so it can be echoed in the output
dna_seq = "ATGCGTACG"

# Percentage of G and C bases in that sequence
gc_percentage = compute_gc_content(dna_seq)

# Report the sequence together with its GC content (two decimal places)
print(f"GC Content for the DNA sequence '{dna_seq}': {gc_percentage:.2f}%")

GC Content for the DNA sequence 'ATGCGTACG': 55.56%
