0% found this document useful (0 votes)

5 views5 pages

Version 2 of Employee_contract

The document is a Python script that automates the generation of employee agreements using data from an Excel file and a Word template. It includes functions for cleaning data, creating employee-specific directories, generating DOCX files, converting them to PDF, and handling user input for selecting which employee data to process. The script ensures that all required data is populated before generating the agreements and provides error handling for file operations.

Uploaded by

govardhanyadav.cfa.2026

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

5 views5 pages

Version 2 of Employee_contract

Uploaded by

govardhanyadav.cfa.2026

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 5

import os

import pandas as pd
from docxtpl import DocxTemplate
import re
from datetime import datetime
import subprocess
import glob

# Input and output locations - adjust these to match your files in /content

EXCEL_PATH = "/content/Employee_Data (Employee Agreement).xlsx"
TEMPLATE_PATH = "/content/Utsuk_Employee agreement.docx"
BASE_OUTPUT_DIR = "/content/drive/MyDrive/Employee_Contracts/Generated_Contracts"

# Excel column header -> key used in the template rendering context

COLUMN_TO_PLACEHOLDER = {
    # Agreement date and employee identity
    "Date": "date",
    "Month": "month",
    "Year": "year",
    "Full Name": "employee_name",
    "House Address": "house_address",
    "PAN": "PAN_card_number",
    # Effective date and role
    "Effective Date": "effective_date",
    "Effective Month": "effective_month",
    "Effective Year": "effective_year",
    "Designation": "designation",
    # Pay summary
    "Annual Pay (No.)": "annual_pay_in_numbers",
    "Annual Pay (words)": "annual_pay_in_words",
    # Pay components (monthly / annual pairs)
    "Basic (Monthly)": "Basic_monthly",
    "Basic (Annual)": "Basic",
    "HRA (Monthly)": "HRA_monthly",
    "HRA (Annual)": "HRA",
    "Bonus (Monthly)": "Bonus_monthly",
    "Bonus (Annual)": "Bonus",
    "Special Allowance (Monthly)": "SA_monthly",
    "Special Allowance (Annual)": "SA",
    "PF (Monthly)": "PF_monthly",
    "PF (Annual)": "PF",
    "CTC (Monthly)": "CTC_monthly",
    "CTC (Annual)": "CTC",
    # Contact
    "Personal Email": "employee_personal_email_id",
}

def get_safe_employee_name(full_name):
    """Convert an employee name into a string that is safe to use as a folder name.

    Every character that is not a word character, whitespace or a hyphen is
    dropped, surrounding whitespace is trimmed, and each remaining run of
    whitespace (spaces, tabs, newlines) becomes a single underscore.

    Args:
        full_name: The employee's name. Non-string values are converted
            with ``str`` before sanitising.

    Returns:
        The sanitised, non-empty folder name.

    Raises:
        ValueError: If no usable characters remain after sanitising.
    """
    stripped = re.sub(r'[^\w\s-]', '', str(full_name)).strip()
    # Collapse any whitespace run, not just single spaces, so tabs and
    # newlines cannot end up inside the folder name.
    safe_name = re.sub(r'\s+', '_', stripped)
    if not safe_name:
        # An empty name would make the joined path equal to the parent
        # directory itself, so refuse it instead of returning ''.
        raise ValueError(
            f"Cannot derive a folder name from employee name {full_name!r}"
        )
    return safe_name

def clean_employee_folder(folder_path):
    """Remove old DOCX and PDF files from the employee folder.

    Only files directly inside ``folder_path`` whose names match ``*.docx``
    or ``*.pdf`` are removed. A failure to remove one file is reported and
    does not stop the remaining files from being processed.

    Args:
        folder_path: Directory to clean.
    """
    # Escape the directory so glob metacharacters in the path ([, ], *, ?)
    # are matched literally; only the extension pattern is a wildcard.
    escaped_dir = glob.escape(folder_path)
    for ext in ('*.docx', '*.pdf'):
        for file_path in glob.glob(os.path.join(escaped_dir, ext)):
            try:
                os.remove(file_path)
                print(f"Removed old file: {os.path.basename(file_path)}")
            except OSError as e:
                print(f"Error removing old file {file_path}: {str(e)}")

def setup_employee_folder(employee_name):
    """Return the employee's output folder, creating it or clearing old files.

    The folder is BASE_OUTPUT_DIR joined with the sanitised employee name.
    A missing folder is created; an existing one has its old DOCX/PDF files
    removed via clean_employee_folder.
    """
    target_dir = os.path.join(BASE_OUTPUT_DIR, get_safe_employee_name(employee_name))

    if not os.path.exists(target_dir):
        print(f"\nCreating new folder for {employee_name}")
        os.makedirs(target_dir)
        return target_dir

    print(f"\nExisting folder found for {employee_name}")
    print("Cleaning old files...")
    clean_employee_folder(target_dir)
    return target_dir

def docx_to_pdf(docx_path, pdf_path):
    """Convert a DOCX file to PDF by running the unoconv command.

    A non-zero exit status is reported and the CalledProcessError is
    re-raised to the caller.
    """
    command = ['unoconv', '-f', 'pdf', '-o', pdf_path, docx_path]
    try:
        subprocess.run(command, check=True)
    except subprocess.CalledProcessError as conversion_error:
        print(f"Error converting to PDF: {conversion_error}")
        raise
    else:
        print(f"Converted {docx_path} to {pdf_path}")

def check_files_exist():
    """Raise FileNotFoundError if the Excel workbook or the template is missing."""
    required_inputs = (
        ("Excel file", EXCEL_PATH),
        ("Template file", TEMPLATE_PATH),
    )
    # Checked in order, so a missing Excel file is reported first.
    for label, path in required_inputs:
        if not os.path.exists(path):
            raise FileNotFoundError(f"{label} not found at {path}")

def clean_currency(value):
    """Format a currency value as a whole number with thousands separators.

    Args:
        value: A number, a string containing a number (optionally with
            currency symbols, text or grouping commas), or a missing value.

    Returns:
        ``""`` for missing values (as judged by ``pd.isna``). For numbers and
        for strings containing a number, the integer part formatted with
        commas, e.g. ``"50,000"``; any fractional part is truncated and a
        leading minus sign in a string is not preserved. Strings without any
        digits are returned stripped and otherwise unchanged. Any other type
        is returned as its stripped ``str`` form.
    """
    if pd.isna(value):
        return ""
    if isinstance(value, (int, float)):
        return f"{int(value):,}"
    if isinstance(value, str):
        # Pick out the first number instead of deleting every non-digit
        # character: deleting would keep the dot of a prefix such as "Rs."
        # and turn "Rs. 50,000" into ".50000", which formats as "0".
        match = re.search(r'\d[\d,]*(?:\.\d+)?|\.\d+', value)
        if match is None:
            # No digits at all (e.g. "N/A"): pass the text through rather
            # than failing on float('').
            return value.strip()
        numeric_value = float(match.group().replace(',', ''))
        return f"{int(numeric_value):,}"
    return str(value).strip()

def clean_numeric(value):
    """Render a numeric cell as text, dropping any fractional part.

    Missing values become an empty string, ints and floats are truncated to
    an integer and stringified, and anything else is returned as its
    stripped string form.
    """
    if pd.isna(value):
        return ""
    is_number = isinstance(value, (int, float))
    return str(int(value)) if is_number else str(value).strip()

def clean_data(value, is_currency=False, is_numeric=False):
    """Sanitise one cell value for use in the template.

    Currency cleaning takes precedence over numeric cleaning when both
    flags are set. With neither flag, missing values become an empty
    string and everything else is stringified and stripped.
    """
    if not (is_currency or is_numeric):
        return "" if pd.isna(value) else str(value).strip()
    cleaner = clean_currency if is_currency else clean_numeric
    return cleaner(value)

def get_fully_populated_rows(df):
    """List the row numbers whose required columns are all non-missing.

    Every key of COLUMN_TO_PLACEHOLDER is treated as required. Each
    surviving index label is offset by 2 before being returned.
    """
    # NOTE(review): the +2 presumably maps a 0-based index to the Excel row
    # number (header in row 1) - confirm the frame uses a default index.
    excel_row_offset = 2
    complete_rows = df.dropna(subset=list(COLUMN_TO_PLACEHOLDER))
    return [label + excel_row_offset for label in complete_rows.index.tolist()]

def get_user_row_selection(populated_rows):
    """Prompt until the user enters a valid selection of Excel rows.

    Accepted input is a comma-separated list of single row numbers and/or
    ``start-end`` ranges. Both ends of a range must be available rows; rows
    inside the range that are not available are skipped. Invalid input is
    reported and the prompt is repeated.

    Args:
        populated_rows: Row numbers the user is allowed to choose from.

    Returns:
        Sorted list of the selected row numbers, each reduced by 2.
    """
    # Set membership keeps the range filtering cheap for long sheets.
    available = set(populated_rows)

    while True:
        print(f"\nAvailable Excel row numbers with complete data: {populated_rows}")
        print("Enter Excel row numbers to process. You can:")
        print("1. Enter a single row number")
        print("2. Enter a range (e.g., '2-5')")
        print("3. Enter multiple rows separated by commas (e.g., '2,3,5')")

        user_input = input("\nEnter your selection: ").strip()

        try:
            selected_rows = set()
            for part in user_input.split(','):
                part = part.strip()
                if not part:
                    # Tolerate stray or trailing commas such as "2,3,".
                    continue
                if '-' in part:
                    bounds = part.split('-')
                    if len(bounds) != 2:
                        raise ValueError(f"'{part}' is not a valid range")
                    start, end = map(int, bounds)
                    if start not in available or end not in available:
                        raise ValueError(f"Row {start} or {end} is not available")
                    if start > end:
                        # A reversed range would otherwise select nothing
                        # without telling the user.
                        raise ValueError(
                            f"Range start {start} is greater than end {end}"
                        )
                    selected_rows.update(
                        i for i in range(start, end + 1) if i in available
                    )
                else:
                    row_num = int(part)
                    if row_num not in available:
                        raise ValueError(f"Row {row_num} is not available")
                    selected_rows.add(row_num)

            if not selected_rows:
                raise ValueError("No rows were selected")

            return sorted(row_num - 2 for row_num in selected_rows)

        except ValueError as e:
            print(f"Invalid input: {e}. Please try again.")

def create_context(employee_data):
    """Build the template context for one employee.

    For every Excel column in COLUMN_TO_PLACEHOLDER that is present in
    employee_data, the cleaned value is stored under the mapped template
    key. Pay columns are cleaned as currency; the day and year columns are
    cleaned as plain integers.
    """
    currency_columns = [
        'Annual Pay (No.)',
        'Basic (Monthly)', 'Basic (Annual)',
        'HRA (Monthly)', 'HRA (Annual)',
        'Bonus (Monthly)', 'Bonus (Annual)',
        'Special Allowance (Monthly)', 'Special Allowance (Annual)',
        'PF (Monthly)', 'PF (Annual)',
        'CTC (Monthly)', 'CTC (Annual)',
    ]
    numeric_columns = ['Date', 'Effective Date', 'Year', 'Effective Year']

    return {
        template_key: clean_data(
            employee_data[excel_col],
            excel_col in currency_columns,
            excel_col in numeric_columns,
        )
        for excel_col, template_key in COLUMN_TO_PLACEHOLDER.items()
        if excel_col in employee_data
    }

def generate_filename(timestamp):
    """Return the agreement base filename with the given timestamp appended."""
    prefix = "Employment_Agreement"
    return "{}_{}".format(prefix, timestamp)

def process_employees(df, selected_indices):
    """Generate the agreement DOCX (and PDF) for each selected row.

    A failure while processing one row is reported and does not stop the
    remaining rows. If PDF conversion fails, the DOCX is kept and the row is
    recorded with ``None`` as its PDF path.

    Args:
        df: DataFrame holding the employee data.
        selected_indices: Positional row indices (as used by ``df.iloc``)
            to process.

    Returns:
        List of ``(employee_name, docx_path, pdf_path)`` tuples for every
        row whose DOCX was saved. Rows completed before an unexpected
        error are still returned.
    """
    generated_files = []
    try:
        for index in selected_indices:
            try:
                employee_data = df.iloc[index].to_dict()
                context = create_context(employee_data)
                employee_name = employee_data['Full Name']

                # Render before touching the employee folder: setting up the
                # folder deletes existing DOCX/PDF files, so a template or
                # data error must not cost the previously generated agreement.
                doc = DocxTemplate(TEMPLATE_PATH)
                doc.render(context)

                # Get employee folder (created, or cleaned of old files)
                employee_dir = setup_employee_folder(employee_name)

                # Generate filenames (without timestamp for consistency)
                base_filename = "Employment_Agreement"
                docx_path = os.path.join(employee_dir, f"{base_filename}.docx")
                pdf_path = os.path.join(employee_dir, f"{base_filename}.pdf")

                doc.save(docx_path)
                print(f"Created new DOCX for {employee_name}")

                # Convert to PDF; a conversion failure still keeps the DOCX
                try:
                    docx_to_pdf(docx_path, pdf_path)
                except Exception as pdf_error:
                    print(f"Error converting to PDF for {employee_name}: {str(pdf_error)}")
                    generated_files.append((employee_name, docx_path, None))
                    print(f"Only DOCX was saved for {employee_name}")
                else:
                    generated_files.append((employee_name, docx_path, pdf_path))
                    print(f"Created new PDF for {employee_name}")

            except Exception as e:
                print(f"Error processing Excel row {index + 2}: {str(e)}")
    except Exception as e:
        # Reached only for failures outside the per-row handler (e.g. a
        # non-iterable selection); keep whatever was already generated.
        print(f"Error in process_employees: {str(e)}")
    return generated_files

def main():
    """Run the whole workflow: validate inputs, pick rows, generate files.

    Any exception raised along the way is caught and reported rather than
    propagated.
    """
    try:
        # Make sure the output root exists, then verify the input files
        os.makedirs(BASE_OUTPUT_DIR, exist_ok=True)
        check_files_exist()

        print("Loading Excel data...")
        df = pd.read_excel(EXCEL_PATH)

        # Only rows with every required column filled in can be selected
        populated_rows = get_fully_populated_rows(df)
        if not populated_rows:
            print("No fully populated rows found in the Excel file.")
            return

        selected_indices = get_user_row_selection(populated_rows)

        print("\nProcessing selected rows...")
        results = process_employees(df, selected_indices)

        if results:
            print("\nGenerated files summary:")
            for employee_name, docx_path, pdf_path in results:
                pdf_line = (
                    f"- {os.path.basename(pdf_path)}"
                    if pdf_path
                    else "- PDF conversion failed"
                )
                print(f"\nEmployee: {employee_name}")
                print(f"Location: {os.path.dirname(docx_path)}")
                print("Files generated:")
                print(f"- {os.path.basename(docx_path)}")
                print(pdf_line)

        print("\nProcess completed!")

    except Exception as e:
        print(f"An error occurred: {str(e)}")


# Run the workflow only when executed as a script, not on import.
if __name__ == "__main__":
    main()

Aastha IP Employee Project
No ratings yet
Aastha IP Employee Project
32 pages
Source Code55
No ratings yet
Source Code55
18 pages
Kunj 3
No ratings yet
Kunj 3
34 pages
Search Operations in Binary File
No ratings yet
Search Operations in Binary File
1 page
IP Employee Project
No ratings yet
IP Employee Project
32 pages
EMPLOYEE RECORD STORING SYSTEM
No ratings yet
EMPLOYEE RECORD STORING SYSTEM
20 pages
a5
No ratings yet
a5
28 pages
Parth IP Employee Management Project (1)
No ratings yet
Parth IP Employee Management Project (1)
32 pages
hope IP Employee Project
No ratings yet
hope IP Employee Project
34 pages
ip
No ratings yet
ip
35 pages
IP project file 2
No ratings yet
IP project file 2
34 pages
FDS RECORD-1-4
No ratings yet
FDS RECORD-1-4
18 pages
New Final Ip Project
No ratings yet
New Final Ip Project
33 pages
employee management-Ghanim,Rudra
No ratings yet
employee management-Ghanim,Rudra
25 pages
Emp Project
No ratings yet
Emp Project
40 pages
Ip Project File
No ratings yet
Ip Project File
46 pages
Pay. Roll
No ratings yet
Pay. Roll
11 pages
Viksit Ip Project File
No ratings yet
Viksit Ip Project File
33 pages
version 4 of contract_automation
No ratings yet
version 4 of contract_automation
7 pages
Unit 4
No ratings yet
Unit 4
25 pages
Kunj Project 1
No ratings yet
Kunj Project 1
34 pages
Kunj Project 1
No ratings yet
Kunj Project 1
34 pages
20 Pandas Codes to Master Data Analysis
No ratings yet
20 Pandas Codes to Master Data Analysis
3 pages
Raghavippracticalfile_organized(0)
No ratings yet
Raghavippracticalfile_organized(0)
12 pages
Python Assignment-2
No ratings yet
Python Assignment-2
3 pages
Ali Bhai's IP Project
No ratings yet
Ali Bhai's IP Project
31 pages
Apr 2023
No ratings yet
Apr 2023
32 pages
New Microsoft Word Document
No ratings yet
New Microsoft Word Document
11 pages
Informatics Practices: Data Handling Experiment
No ratings yet
Informatics Practices: Data Handling Experiment
5 pages
NEEL (1)_edited
No ratings yet
NEEL (1)_edited
12 pages
NEEL (1) Edited Edited
No ratings yet
NEEL (1) Edited Edited
12 pages
Neel
No ratings yet
Neel
12 pages
NEEL (1)
No ratings yet
NEEL (1)
12 pages
IP PROJECT Old
No ratings yet
IP PROJECT Old
18 pages
Employee Payroll System Description verru anna
No ratings yet
Employee Payroll System Description verru anna
10 pages
Practical Questions
No ratings yet
Practical Questions
7 pages
Employee Management System
No ratings yet
Employee Management System
33 pages
Monthly Basic Salary
No ratings yet
Monthly Basic Salary
16 pages
Employee Management System
No ratings yet
Employee Management System
32 pages
Employ Management System
No ratings yet
Employ Management System
29 pages
Source Code
No ratings yet
Source Code
49 pages
202101445_lab01
No ratings yet
202101445_lab01
6 pages
Project - Employee Management System
No ratings yet
Project - Employee Management System
23 pages
Program
No ratings yet
Program
11 pages
Kartikey
No ratings yet
Kartikey
19 pages
EMPLOYEE MANAGEMENT SYSTEM
No ratings yet
EMPLOYEE MANAGEMENT SYSTEM
18 pages
Python
No ratings yet
Python
5 pages
211423205137 EX 6B
No ratings yet
211423205137 EX 6B
3 pages
Stefan Thurner, Rudolf Hanel, Peter Klimek - Introduction to the Theory of Complex Systems-Oxford University Press (2018)
100% (1)
Stefan Thurner, Rudolf Hanel, Peter Klimek - Introduction to the Theory of Complex Systems-Oxford University Press (2018)
446 pages
Payroll Management System
No ratings yet
Payroll Management System
10 pages
Absenteeism_module
No ratings yet
Absenteeism_module
2 pages
EmployeeMgmt XII IP ProjectReprot 2022 23
No ratings yet
EmployeeMgmt XII IP ProjectReprot 2022 23
16 pages
Document
No ratings yet
Document
1 page
Employee Data Analysis IP Sample Project
No ratings yet
Employee Data Analysis IP Sample Project
11 pages
Binary File Project
No ratings yet
Binary File Project
7 pages
Project On Payroll System
No ratings yet
Project On Payroll System
10 pages
What Can You Do With Dataframes Using Pandas?: Pandas Is A High-Level Data Manipulation Tool Developed by Wes Mckinney
No ratings yet
What Can You Do With Dataframes Using Pandas?: Pandas Is A High-Level Data Manipulation Tool Developed by Wes Mckinney
10 pages
Untitled 1
No ratings yet
Untitled 1
5 pages
Practice Question For Python
No ratings yet
Practice Question For Python
4 pages
Investing In Battery Technology
No ratings yet
Investing In Battery Technology
35 pages
lib_burst_generated
No ratings yet
lib_burst_generated
109 pages
_OceanofPDF.com_The_Economic_Times_Wealth_-_Vol_15_No_19_May_1218_2025_-_The_Economic_Times_Wealth
No ratings yet
_OceanofPDF.com_The_Economic_Times_Wealth_-_Vol_15_No_19_May_1218_2025_-_The_Economic_Times_Wealth
24 pages
career
No ratings yet
career
13 pages
Ethical Hacking Journal
No ratings yet
Ethical Hacking Journal
23 pages
The Web Design Book Vol 5 - 2015 UK
100% (1)
The Web Design Book Vol 5 - 2015 UK
196 pages
Software Design Document Sample
No ratings yet
Software Design Document Sample
22 pages
Gaudi2 Whitepaper
No ratings yet
Gaudi2 Whitepaper
34 pages
dbms explaination
No ratings yet
dbms explaination
4 pages
ICT Notes Class 12
No ratings yet
ICT Notes Class 12
24 pages
Browser SSO Guide 2020.1.0
No ratings yet
Browser SSO Guide 2020.1.0
28 pages
Devops
No ratings yet
Devops
20 pages
Ms Excel Lesson 2 Home Toolbar
No ratings yet
Ms Excel Lesson 2 Home Toolbar
4 pages
Hacking Tools Cheat Sheet v1.0 PDF
100% (1)
Hacking Tools Cheat Sheet v1.0 PDF
2 pages
Kilimall Ecommerce
No ratings yet
Kilimall Ecommerce
13 pages
State Identity and Behaviour of Objects
No ratings yet
State Identity and Behaviour of Objects
13 pages
Cybersource Device Fingerprinting Guide: December 2019
No ratings yet
Cybersource Device Fingerprinting Guide: December 2019
71 pages
Error After Web Dispatcher Migration to SAP RISE
No ratings yet
Error After Web Dispatcher Migration to SAP RISE
3 pages
Manual: Christian Knufinke Software
No ratings yet
Manual: Christian Knufinke Software
34 pages
Online Ordering System Project PDF
No ratings yet
Online Ordering System Project PDF
24 pages
Oracle Auditing EBSR12.2
No ratings yet
Oracle Auditing EBSR12.2
4 pages
OSY PR Exam Question Bank
No ratings yet
OSY PR Exam Question Bank
3 pages
Process Management: Robin Mathur Department of Computer Science & Engineering, Lpu
No ratings yet
Process Management: Robin Mathur Department of Computer Science & Engineering, Lpu
25 pages
Examples Documentation VPM FAQ Built in V: Advanced Topics
No ratings yet
Examples Documentation VPM FAQ Built in V: Advanced Topics
22 pages
DevOps Resume 14
No ratings yet
DevOps Resume 14
3 pages
PITRAM Software
No ratings yet
PITRAM Software
22 pages
Management and Technical Assistance Support To Moldova Flood Protection Project
No ratings yet
Management and Technical Assistance Support To Moldova Flood Protection Project
21 pages
College Website Creation: Mini Project Report
No ratings yet
College Website Creation: Mini Project Report
36 pages
Dinesh Singh: Professional Summary
No ratings yet
Dinesh Singh: Professional Summary
5 pages
Data Egineering Simplified Cheat Sheet 2023 06 03
No ratings yet
Data Egineering Simplified Cheat Sheet 2023 06 03
2 pages
Windows Lifecycle Fact Sheet - Windows Help PDF
No ratings yet
Windows Lifecycle Fact Sheet - Windows Help PDF
8 pages
Basics
No ratings yet
Basics
11 pages
Tugas Bahasa Inggris
No ratings yet
Tugas Bahasa Inggris
6 pages
Case Analysis # 2
0% (1)
Case Analysis # 2
2 pages
Profound Python Data Science
From Everand
Profound Python Data Science
Onder Teker
No ratings yet
The Essential R Reference
From Everand
The Essential R Reference
Mark Gardener
No ratings yet

Version 2 of Employee_contract

Uploaded by

Version 2 of Employee_contract

Uploaded by

import os

# File paths - modify these to match your file names in /content

# Constants remain the same

def docx_to_pdf(docx_path, pdf_path):

def clean_data(value, is_currency=False, is_numeric=False):

user_input = input("\nEnter your selection: ").strip()

return sorted([row_num - 2 for row_num in selected_indices])

for excel_col, template_key in COLUMN_TO_PLACEHOLDER.items():

def process_employees(df, selected_indices):

# Get employee name and setup/clean folder

# Generate filenames (without timestamp for consistency)

# Generate and save DOCX

# Check if files exist

# Load Excel data

# Get fully populated rows

# Get user selection for rows

# Process selected employees

You might also like