from openpyxl import Workbook
from openpyxl.utils.dataframe import dataframe_to_rows
from pandas import DataFrame
# Build an in-memory workbook and fill its active sheet from a small sample
# table that contains repeated rows.
workbook = Workbook()
sheet = workbook.active
data = {
    "Name": ["Alice", "Bob", "Alice", "Charlie", "Bob", "Alice"],
    "Age": [25, 30, 25, 35, 30, 25],
    "City": ["New York", "Paris", "London", "Tokyo", "Paris", "New York"],
}
df = DataFrame(data)
for record in dataframe_to_rows(df, index=False, header=True):
    sheet.append(record)

# Snapshot every row currently on the sheet (header row included) as a tuple
# of plain cell values.
rows = list(sheet.values)

# Row tuples are hashable, so using them as dict keys gives an
# order-preserving de-duplication: the first occurrence of each row is kept
# and later repeats are dropped. Rows are compared as a whole, not per column.
rows_without_duplicates = list(dict.fromkeys(rows))

# Clear the sheet, then write the unique rows back in their original order.
# NOTE(review): this relies on append() resuming at the top of the sheet once
# every row has been deleted -- confirm for the installed openpyxl version.
sheet.delete_rows(idx=1, amount=sheet.max_row)
for unique_row in rows_without_duplicates:
    sheet.append(unique_row)

workbook.save("[Exam 01]remove_duplicates_by_row.xlsx")