In [9]:
import pandas as pd

# Create a Series
data = [1, 2, 3, 4, 5]
s = pd.Series(data, index=['a','b','c','d','e'])

# 1. Accessing elements by index
element_at_index_2 = s[0]

# 2. Accessing elements by label
element_with_label_3 = s.loc['b']

# 3. Accessing elements by position
element_at_position_1 = s.iloc[3]

# 4. Slicing a Series
subset_s = s[1:4]

# 5. Checking the length of a Series
length_of_s = len(s)

# 6. Checking if a value is present in the Series
is_value_present = 4 in s

# 7. Adding two Series
s1 = pd.Series([1, 2, 3])
s2 = pd.Series([4, 5, 6])
sum_of_series = s1 + s2

# 8. Element-wise multiplication
product_of_series = s * 2

# 9. Applying a function to each element
squared_values = s.apply(lambda x: x**2)

# 10. Finding unique values
unique_values = s.unique()

# 11. Counting occurrences of each unique value
value_counts = s.value_counts()

# 12. Checking for null values
has_null_values = s.isnull().any()

# 13. Filling null values
s_with_null = pd.Series([1, 2, None, 4, 5])
filled_s = s_with_null.fillna(0)

# 14. Removing null values
s_without_null = s_with_null.dropna()

# 15. Sorting a Series
sorted_s = s.sort_values(ascending=False)

# 16. Finding the minimum and maximum values
min_value = s.min()
max_value = s.max()

# 17. Calculating the mean and median
mean_value = s.mean()
median_value = s.median()

# 18. Applying cumulative operations
cumulative_sum = s.cumsum()
cumulative_product = s.cumprod()

# 19. Converting the Series to a list or NumPy array
list_from_series = s.tolist()
array_from_series = s.to_numpy()

# 20. Describing the Series
description = s.describe()

# Display results
print("Original Series:", s)
print("Element at index 2:", element_at_index_2)
print("Element with label 3:", element_with_label_3)
print("Element at position 1:", element_at_position_1)
print("Subset of Series:", subset_s)
print("Length of Series:", length_of_s)
print("Is 4 present in Series:", is_value_present)
print("Sum of two Series:", sum_of_series)
print("Product of Series by 2:", product_of_series)
print("Squared values of Series:", squared_values)
print("Unique values in Series:", unique_values)
print("Value counts in Series:", value_counts)
print("Series with null values:", s_with_null)
print("Filled Series:", filled_s)
print("Series without null values:", s_without_null)
print("Sorted Series:", sorted_s)
print("Minimum value:", min_value)
print("Maximum value:", max_value)
print("Mean value:", mean_value)
print("Median value:", median_value)
print("Cumulative sum:", cumulative_sum)
print("Cumulative product:", cumulative_product)
print("List from Series:", list_from_series)
print("Array from Series:", array_from_series)
print("Series description:", description)


Original Series: a    1
b    2
c    3
d    4
e    5
dtype: int64
Element at index 2: 1
Element with label 3: 2
Element at position 1: 4
Subset of Series: b    2
c    3
d    4
dtype: int64
Length of Series: 5
Is 4 present in Series: False
Sum of two Series: 0    5
1    7
2    9
dtype: int64
Product of Series by 2: a     2
b     4
c     6
d     8
e    10
dtype: int64
Squared values of Series: a     1
b     4
c     9
d    16
e    25
dtype: int64
Unique values in Series: [1 2 3 4 5]
Value counts in Series: 1    1
2    1
3    1
4    1
5    1
Name: count, dtype: int64
Series with null values: 0    1.0
1    2.0
2    NaN
3    4.0
4    5.0
dtype: float64
Filled Series: 0    1.0
1    2.0
2    0.0
3    4.0
4    5.0
dtype: float64
Series without null values: 0    1.0
1    2.0
3    4.0
4    5.0
dtype: float64
Sorted Series: e    5
d    4
c    3
b    2
a    1
dtype: int64
Minimum value: 1
Maximum value: 5
Mean value: 3.0
Median value: 3.0
Cumulative sum: a     1
b     3
c     6
d    10
e    15
dtype

In [10]:
import pandas as pd

# Create a DataFrame
data = {'Name': ['Alice', 'Bob', 'Charlie'],
        'Age': [25, 30, 35],
        'City': ['New York', 'San Francisco', 'Los Angeles']}
df = pd.DataFrame(data)

# 1. Display the first n rows of a DataFrame
head_df = df.head(2)

# 2. Display basic statistics of a DataFrame
describe_df = df.describe()

# 3. Select specific columns from a DataFrame
selected_columns = df[['Name', 'City']]

# 4. Filter rows based on a condition
filtered_df = df[df['Age'] > 30]

# 5. Sort DataFrame by a specific column
sorted_df = df.sort_values(by='Age', ascending=False)

# 6. Group data by a column and perform aggregation
grouped_df = df.groupby('City')['Age'].mean()

# 7. Fill missing values in a DataFrame
filled_df = df.fillna(0)

# 8. Drop columns or rows from a DataFrame
dropped_df = df.drop(['Age'], axis=1)

# 9. Merge two DataFrames
df1 = pd.DataFrame({'A': [1, 2], 'B': [3, 4]})
df2 = pd.DataFrame({'A': [5, 6], 'B': [7, 8]})
merged_df = pd.merge(df1, df2, on='A')

# 10. Pivot a DataFrame
pivot_df = df.pivot(index='Name', columns='City', values='Age')

# 11. Apply a function to each element in a DataFrame
apply_func_df = df['Age'].apply(lambda x: x + 2)

# 12. Rename columns in a DataFrame
renamed_df = df.rename(columns={'Name': 'Full Name', 'Age': 'Years'})

# 13. Remove duplicate rows from a DataFrame
deduplicated_df = df.drop_duplicates()

# 14. Save DataFrame to a CSV file
df.to_csv('output.csv', index=False)

# 15. Check for null values in a DataFrame
null_check = df.isnull().sum()

# 16. Calculate the correlation matrix
correlation_matrix = df.corr()

# 17. Resample time series data
time_series_df = pd.read_csv('time_series_data.csv')
resampled_df = time_series_df.resample('M').mean()

# 18. Apply a rolling window to time series data
rolling_window_df = time_series_df['Value'].rolling(window=3).mean()

# 19. Apply a custom function to each row
def custom_function(row):
    return row['Age'] * 2

custom_applied_df = df.apply(custom_function, axis=1)

# 20. Concatenate DataFrames along rows or columns
df3 = pd.DataFrame({'Name': ['David'], 'Age': [28], 'City': ['Chicago']})
concatenated_rows = pd.concat([df, df3])
concatenated_columns = pd.concat([df, df3], axis=1)

# Display results
print("Original DataFrame:")
print(df)
print("\nFirst 2 rows of DataFrame:")
print(head_df)
print("\nBasic statistics of DataFrame:")
print(describe_df)
print("\nSelected columns from DataFrame:")
print(selected_columns)
print("\nFiltered rows based on condition:")
print(filtered_df)
print("\nSorted DataFrame:")
print(sorted_df)
print("\nGrouped DataFrame:")
print(grouped_df)
print("\nFilled DataFrame:")
print(filled_df)
print("\nDataFrame after dropping columns:")
print(dropped_df)
print("\nMerged DataFrames:")
print(merged_df)
print("\nPivoted DataFrame:")
print(pivot_df)
print("\nDataFrame with applied function:")
print(apply_func_df)
print("\nDataFrame with renamed columns:")
print(renamed_df)
print("\nDeduplicated DataFrame:")
print(deduplicated_df)
print("\nDataFrame with null value check:")
print(null_check)
print("\nCorrelation matrix of DataFrame:")
print(correlation_matrix)
print("\nResampled DataFrame:")
print(resampled_df)
print("\nDataFrame with rolling window applied:")
print(rolling_window_df)
print("\nDataFrame with custom function applied to each row:")
print(custom_applied_df)
print("\nConcatenated DataFrame along rows:")
print(concatenated_rows)
print("\nConcatenated DataFrame along columns:")
print(concatenated_columns)



ValueError: could not convert string to float: 'Alice'