Download as txt, pdf, or txt
Download as txt, pdf, or txt
You are on page 1 of 1

import pandas as pd

# Walkthrough of common data-flow transformations (character map, multicast,
# conditional split, aggregation, sort, derived column) expressed with pandas.

# Load the dataset from the .csv file.
data = pd.read_csv('your_dataset.csv')

# Character Map: convert the text in a column to lowercase.
data['text_column'] = data['text_column'].str.lower()

# Multicast: duplicate the data for parallel processing. This is not directly
# available in pandas, but you can create multiple copies of the DataFrame.
data_copy1 = data.copy()
data_copy2 = data.copy()

# Conditional Split: split the data based on a condition.
# Rows whose 'sales' value is missing (NaN) satisfy neither comparison, so they
# end up in neither subset.
high_sales = data[data['sales'] > 1000]  # Example condition
low_sales = data[data['sales'] <= 1000]  # Example condition

# Aggregation: calculate total sales by product category. The result is a
# Series indexed by category.
sales_by_category = data.groupby('category')['sales'].sum()

# Sort: sort the data by a column. sort_values returns a new DataFrame; `data`
# itself keeps its original row order.
# NOTE(review): 'date_column' is not parsed as a date when loaded above, so this
# presumably sorts the raw CSV values -- confirm that is the intended ordering.
sorted_data = data.sort_values(by='date_column')

# Derived Column: create a new column based on existing columns.
# It is added after the copies, splits and sorted frame were taken, so only
# `data` (written to derived_data.csv below) carries it.
data['discounted_price'] = data['price'] * 0.9  # Example calculation for discount

# Output transformed data.
# You can save these transformed datasets to new .csv files or use them further
# in your analysis.
high_sales.to_csv('high_sales.csv', index=False)
low_sales.to_csv('low_sales.csv', index=False)
# The category labels live in the index, so the index is kept for this file.
sales_by_category.to_csv('sales_by_category.csv')
sorted_data.to_csv('sorted_data.csv', index=False)
data.to_csv('derived_data.csv', index=False)

You might also like