0% found this document useful (0 votes)

10 views3 pages

Code Python

Uploaded by

peopleslively

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

10 views3 pages

Code Python

Uploaded by

peopleslively

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 3

import pandas as pd

import numpy as np

# Read the CSV file

def read_and_process_bank_data(csv_path='/content/Book1 (1).csv'):
    """Load the bank-statement CSV and return a cleaned DataFrame.

    Args:
        csv_path: Path (or file-like object) handed to ``pd.read_csv``.
            Defaults to the location the script originally hard-coded.

    Returns:
        A DataFrame whose column names are whitespace-stripped, whose rows
        all have a non-null ``Category``, and whose ``Debit`` / ``Credit`` /
        ``Balance`` columns (when present) are numeric; values that cannot
        be parsed become NaN.

    Raises:
        FileNotFoundError: if ``csv_path`` does not exist.
        KeyError: if any of ``Date``, ``Description`` or ``Category`` is
            missing from the file.
    """
    # Read the CSV file
    df = pd.read_csv(csv_path)
    print("Column names:", list(df.columns))

    # Clean column names by stripping whitespace early, so the lookups
    # below work even when the header cells carry padding.
    df.columns = df.columns.str.strip()

    # Clean the data by removing rows where all key columns are NaN
    df = df.dropna(subset=['Date', 'Description', 'Category'], how='all')

    # Remove rows where Category is NaN (these are header rows or empty rows)
    df = df[df['Category'].notna()]

    # Convert amount columns to numeric, handling commas and quotes.
    # regex=False keeps both replacements literal on every pandas version.
    for col in ['Debit', 'Credit', 'Balance']:
        if col in df.columns:
            cleaned = (
                df[col]
                .astype(str)
                .str.replace(',', '', regex=False)
                .str.replace('"', '', regex=False)
            )
            df[col] = pd.to_numeric(cleaned, errors='coerce')

    return df
def _safe_category_name(category):
    """Return *category* as a token that is safe to embed in a filename.

    Characters other than letters, digits, spaces, hyphens and underscores
    become underscores; surrounding whitespace is trimmed and any remaining
    spaces are turned into underscores.
    """
    cleaned = "".join(
        c if c.isalnum() or c in (' ', '-', '_') else '_'
        for c in str(category)
    )
    return cleaned.strip().replace(' ', '_')


def group_by_category_and_save():
    """Summarise the bank transactions per category and write the reports.

    Loads the data through ``read_and_process_bank_data()``, builds one
    summary row per category (debit/credit count, sum and mean, transaction
    count, net amount), prints the summary, and writes:

    * ``bank_transactions_grouped_by_category.csv`` - the summary table,
    * ``category_<name>.csv`` - one file per category,
    * ``detailed_transactions_by_category.csv`` - all transactions ordered
      by category,
    * ``all_categories.txt`` - every category's rows as plain text.

    Returns:
        The summary DataFrame sorted by ``Total_Transactions`` (descending),
        or ``None`` when the input file is missing or any other error
        occurs (the error is printed rather than raised).
    """
    try:
        # Read and process the data
        df = read_and_process_bank_data()

        print("Original data shape:", df.shape)
        print("Categories found:", df['Category'].unique())

        # Group by category and calculate summary statistics
        category_summary = df.groupby('Category').agg({
            'Debit': ['count', 'sum', 'mean'],
            'Credit': ['count', 'sum', 'mean'],
            'Description': 'count',  # Total number of transactions per category
        }).round(2)

        # Flatten the (column, statistic) MultiIndex into "column_statistic"
        category_summary.columns = [
            '_'.join(col).strip() for col in category_summary.columns
        ]

        # Rename columns for clarity
        category_summary = category_summary.rename(columns={
            'Debit_count': 'Debit_Transaction_Count',
            'Debit_sum': 'Total_Debit_Amount',
            'Debit_mean': 'Average_Debit_Amount',
            'Credit_count': 'Credit_Transaction_Count',
            'Credit_sum': 'Total_Credit_Amount',
            'Credit_mean': 'Average_Credit_Amount',
            'Description_count': 'Total_Transactions',
        })

        # Calculate net amount (Credit - Debit) for each category
        category_summary['Net_Amount'] = (
            category_summary['Total_Credit_Amount'].fillna(0)
            - category_summary['Total_Debit_Amount'].fillna(0)
        ).round(2)

        # Reset index to make Category a column
        category_summary = category_summary.reset_index()

        # Sort by total transaction count (descending)
        category_summary = category_summary.sort_values(
            'Total_Transactions', ascending=False
        )

        # Save to CSV. The write was previously commented out while the
        # message below still reported success.
        output_filename = 'bank_transactions_grouped_by_category.csv'
        category_summary.to_csv(output_filename, index=False)

        print(f"\nData successfully grouped by category and saved to '{output_filename}'")
        print(f"\nSummary of categories:")
        print("=" * 80)

        # Display summary
        for _, row in category_summary.iterrows():
            print(f"Category: {row['Category']}")
            print(f" Total Transactions: {row['Total_Transactions']}")
            print(f" Total Debit: ₹{row['Total_Debit_Amount']:,.2f}" if not
                  pd.isna(row['Total_Debit_Amount']) else " Total Debit: ₹0.00")
            print(f" Total Credit: ₹{row['Total_Credit_Amount']:,.2f}" if not
                  pd.isna(row['Total_Credit_Amount']) else " Total Credit: ₹0.00")
            print(f" Net Amount: ₹{row['Net_Amount']:,.2f}")
            print("-" * 40)

        categories = df['Category'].dropna().unique()

        # Save one CSV per category
        for category in categories:
            category_df = df[df['Category'] == category]
            filename = f'category_{_safe_category_name(category)}.csv'
            category_df.to_csv(filename, index=False)
            print(f" Saved: {filename}")

        # Save detailed transactions ordered by category. Only columns that
        # actually exist are kept, so a file without e.g. 'Name' or
        # 'Bank Name' no longer aborts the whole run with a KeyError.
        detailed_filename = 'detailed_transactions_by_category.csv'
        detail_columns = [
            col
            for col in ('Date', 'Description', 'Debit', 'Credit', 'Balance',
                        'Name', 'Bank Name')
            if col in df.columns
        ]
        detailed_by_category = (
            df.sort_values('Category', kind='stable')[['Category'] + detail_columns]
            .reset_index(drop=True)
        )
        detailed_by_category.to_csv(detailed_filename, index=False)

        print(f"\nDetailed transactions by category saved to '{detailed_filename}'")

        # Combine all categories into a single text file
        combined_txt_filename = 'all_categories.txt'
        with open(combined_txt_filename, 'w', encoding='utf-8') as combined_file:
            for category in categories:
                category_df = df[df['Category'] == category]

                # Write header
                combined_file.write(f"{'=' * 80}\n")
                combined_file.write(f"CATEGORY: {category}\n")
                combined_file.write(f"{'=' * 80}\n\n")

                # Write DataFrame as text
                combined_file.write(category_df.to_string(index=False))
                combined_file.write("\n\n")

        print(f"\nCombined category transactions written to '{combined_txt_filename}'")

        return category_summary

    except FileNotFoundError as err:
        # Report the path that was actually missing.
        print(f"Error: '{err.filename}' file not found. Please make sure the file is in "
              "the same directory as this script.")
        return None
    except Exception as e:
        # Top-level boundary of the script: report and signal failure to the caller.
        print(f"An error occurred: {str(e)}")
        return None

# Execute the function

if __name__ == "__main__":
    # Run the report; a None result means an error was already printed.
    result = group_by_category_and_save()

    if result is not None:
        print("\n" + "=" * 80)
        print("EXECUTION COMPLETED SUCCESSFULLY")
        print("=" * 80)
        print("Files created:")
        print("1. bank_transactions_grouped_by_category.csv - Summary by category")
        print("2. detailed_transactions_by_category.csv - All transactions grouped by category")
        # Create separate CSV for each category
        # NOTE(review): the original indentation was lost, so placing this
        # message inside the success branch is an assumption - confirm.
        print("\nCreating separate CSV files for each category...")

A Project Report On Bank Management System
No ratings yet
A Project Report On Bank Management System
20 pages
Online Bank Portal PROJECT
No ratings yet
Online Bank Portal PROJECT
29 pages
Analyzing Supermarket Sales Data
No ratings yet
Analyzing Supermarket Sales Data
6 pages
Excel to Pandas: Data Analysis Guide
No ratings yet
Excel to Pandas: Data Analysis Guide
9 pages
Daily Transactions Problem Statement
No ratings yet
Daily Transactions Problem Statement
27 pages
Finance Report
No ratings yet
Finance Report
5 pages
Pandas Trampas
No ratings yet
Pandas Trampas
9 pages
Python - Pandas - Numpy Interview Q&A
No ratings yet
Python - Pandas - Numpy Interview Q&A
12 pages
Project Ip
No ratings yet
Project Ip
20 pages
Pandas Introduction: What Is Python Pandas Used For?
No ratings yet
Pandas Introduction: What Is Python Pandas Used For?
28 pages
Pandas Data Manipulation Extended CheatSheet 1731972219
No ratings yet
Pandas Data Manipulation Extended CheatSheet 1731972219
9 pages
GR12 Record Programs 6TH Onwards
No ratings yet
GR12 Record Programs 6TH Onwards
18 pages
DHP Journal
No ratings yet
DHP Journal
29 pages
Prac 1
No ratings yet
Prac 1
5 pages
Oddstudents
No ratings yet
Oddstudents
35 pages
Lab 1 ML
No ratings yet
Lab 1 ML
2 pages
ProductionMGmt XII IP ProjectReprotFinal
No ratings yet
ProductionMGmt XII IP ProjectReprotFinal
16 pages
Expense Categorization
No ratings yet
Expense Categorization
15 pages
Paridhi Batla IP Project
No ratings yet
Paridhi Batla IP Project
44 pages
Data Wrangling & Data Manipulation With Pandas
No ratings yet
Data Wrangling & Data Manipulation With Pandas
6 pages
Cleaning Data in Python
No ratings yet
Cleaning Data in Python
8 pages
File Code
No ratings yet
File Code
13 pages
Ippython Pushpa
No ratings yet
Ippython Pushpa
9 pages
Class 12 IP Practical Questions
No ratings yet
Class 12 IP Practical Questions
7 pages
Lab Record IP
No ratings yet
Lab Record IP
13 pages
IP Practical PRGM
No ratings yet
IP Practical PRGM
41 pages
Inbound 2665441404356826662
No ratings yet
Inbound 2665441404356826662
13 pages
Supermarket Sales Insights
No ratings yet
Supermarket Sales Insights
8 pages
Ip Projrct Ii
No ratings yet
Ip Projrct Ii
31 pages
Ip HW
No ratings yet
Ip HW
15 pages
Library Management System Code
No ratings yet
Library Management System Code
7 pages
Pandas Operations Guide
No ratings yet
Pandas Operations Guide
6 pages
Python Interviews
No ratings yet
Python Interviews
154 pages
Practical File IP
No ratings yet
Practical File IP
27 pages
Prac 1
No ratings yet
Prac 1
5 pages
Using Groupby and Pivot
No ratings yet
Using Groupby and Pivot
7 pages
Python 2.1.3
No ratings yet
Python 2.1.3
6 pages
Practice Questions2
No ratings yet
Practice Questions2
2 pages
EDA With Pandas
No ratings yet
EDA With Pandas
8 pages
Learn Pandas
No ratings yet
Learn Pandas
37 pages
Pandas Tutorial
No ratings yet
Pandas Tutorial
9 pages
Sales Management Project Report
No ratings yet
Sales Management Project Report
18 pages
Pandas Fuction Notes
No ratings yet
Pandas Fuction Notes
3 pages
Problem Statement Major Project
No ratings yet
Problem Statement Major Project
8 pages
Task 1 Vijaya Lakshman PDF
No ratings yet
Task 1 Vijaya Lakshman PDF
10 pages
Fraud 2
No ratings yet
Fraud 2
20 pages
Bank Churn Prediction Guide
No ratings yet
Bank Churn Prediction Guide
15 pages
Vraj Patel
No ratings yet
Vraj Patel
19 pages
Module 3
No ratings yet
Module 3
5 pages
Lab 1 ML Lab
No ratings yet
Lab 1 ML Lab
15 pages
Pandas Research
No ratings yet
Pandas Research
14 pages
Sample Project 1
No ratings yet
Sample Project 1
14 pages
Even Students
No ratings yet
Even Students
36 pages
New Green Field School
No ratings yet
New Green Field School
33 pages
IP Project I
No ratings yet
IP Project I
56 pages
Pandas Syntax Revision For ML
No ratings yet
Pandas Syntax Revision For ML
10 pages
Pandas Library: Data Manipulation & Analysis Guide
No ratings yet
Pandas Library: Data Manipulation & Analysis Guide
9 pages
NumPy and Pandas Step
No ratings yet
NumPy and Pandas Step
9 pages
Textile Garment Division Case Study
No ratings yet
Textile Garment Division Case Study
13 pages
Design of Ejectors
86% (7)
Design of Ejectors
238 pages
Experiment 9 Young S Modulus
100% (2)
Experiment 9 Young S Modulus
4 pages
Brasília STAR Arrival Chart RNAV 1A
No ratings yet
Brasília STAR Arrival Chart RNAV 1A
2 pages
Transformer Testing Guide
No ratings yet
Transformer Testing Guide
8 pages
SIPROTEC 5 Over-Voltage Protection Guide
No ratings yet
SIPROTEC 5 Over-Voltage Protection Guide
3 pages
14 Building Works Dismantaling Demolishing
No ratings yet
14 Building Works Dismantaling Demolishing
5 pages
Python Basics: Practical Programming Tasks
No ratings yet
Python Basics: Practical Programming Tasks
14 pages
6500 Loop Commissioning
No ratings yet
6500 Loop Commissioning
40 pages
Buck Converter
No ratings yet
Buck Converter
7 pages
Swimming Pool BOQ
100% (6)
Swimming Pool BOQ
5 pages
Tensile Membrane Structure Solutions
No ratings yet
Tensile Membrane Structure Solutions
6 pages
Permeation Grouting in Sandy Soil Study
No ratings yet
Permeation Grouting in Sandy Soil Study
6 pages
Behringer Industrial Pipe Clamps 2016 PDF
No ratings yet
Behringer Industrial Pipe Clamps 2016 PDF
38 pages
Correl-1-Drills-Hydrau-Fluids E01 E02
No ratings yet
Correl-1-Drills-Hydrau-Fluids E01 E02
5 pages
Atlas Honda Casestudy
0% (1)
Atlas Honda Casestudy
20 pages
Strategy Pricing Manager JD - v0.1
No ratings yet
Strategy Pricing Manager JD - v0.1
3 pages
Yelp Case
No ratings yet
Yelp Case
8 pages
SAP Plant Maintenance Training Overview
No ratings yet
SAP Plant Maintenance Training Overview
4 pages
Factors Affecting Students Buying Behavior of Smartphone
100% (1)
Factors Affecting Students Buying Behavior of Smartphone
9 pages
Proslect Filter Grille PSFGW
No ratings yet
Proslect Filter Grille PSFGW
2 pages
Google Search Techniques Guide
No ratings yet
Google Search Techniques Guide
3 pages
Student Contests and Vacation Experiences
No ratings yet
Student Contests and Vacation Experiences
8 pages
Fibran GEO - Katalog PDF
No ratings yet
Fibran GEO - Katalog PDF
20 pages
DASA 2016: SAT Cutoffs for Indian Institutes
No ratings yet
DASA 2016: SAT Cutoffs for Indian Institutes
8 pages
Group 9 - Fdas
No ratings yet
Group 9 - Fdas
52 pages
Data Processing and Management
No ratings yet
Data Processing and Management
28 pages
Simple Machines Test
No ratings yet
Simple Machines Test
7 pages
Exploring Cloud Incidents - Short Paper
No ratings yet
Exploring Cloud Incidents - Short Paper
14 pages
3-1 Circuito Hidraulico
No ratings yet
3-1 Circuito Hidraulico
1 page

Code Python

Uploaded by

Code Python

Uploaded by

import pandas as pd

# Read the CSV file

# Clean column names by stripping whitespace **early**

# Convert Amount columns to numeric, handling commas and quotes

print("Original data shape:", [Link])

# Group by category and calculate summary statistics

# Flatten column names

# Rename columns for clarity

# Calculate net amount (Credit - Debit) for each category

# Reset index to make Category a column

# Sort by total transaction count (descending)

print(f"\nData successfully grouped by category and saved to

# Create detailed transactions by category

# Save detailed transactions by category

# Clean the category name to make it a safe filename

print(f"\nDetailed transactions by category saved to

# Write DataFrame as text

print(f"\nCombined category transactions written to

# Execute the function

if result is not None:

You might also like

# Clean column names by stripping whitespace early