【以下回答由 GPT 生成】
import pandas as pd
# 读取原始表格数据
df = pd.read_csv("data.csv")
# 创建新的空dataframe用于存放转换后的数据
new_df = pd.DataFrame(columns=["gender", "name", "email_domain", "work_age", "email", "total_profession"])
# 循环遍历每一行数据进行处理
for index, row in df.iterrows():
# 获取每一行中的数据
gender = row["gender"]
name = row["name"]
birthday = pd.to_datetime(row["birthday"])
startwork = pd.to_datetime(row["startwork"])
income = row["Income"]
# 计算工龄
work_age = startwork.year - birthday.year
# 提取邮箱域名
email_domain = ""
if "@" in name:
email_domain = name.split("@")[1]
# 提取邮箱
email = ""
if "@" in name:
email = name
# 判断专业
profession = ""
if work_age >= 10:
profession = "化学"
elif work_age >= 5:
profession = "美术"
elif work_age >= 2:
profession = "统计学"
else:
profession = "政治学"
# 将处理后的数据插入新的dataframe中
new_df.loc[index] = [gender, name, email_domain, work_age, email, profession]
# 打印转换后的数据
print(new_df)
【相关推荐】