# add_group_project_name.py (609 bytes) - committed by MaoXianxin
"""Add 'group_name' and 'project_name' columns to a CSV of project paths.

The script reads the 'project path' and 'visits' columns of a CSV file,
derives the two name columns from the '/'-separated path, drops every row
that has a missing value, and writes the result back to the same file.
"""
import pandas as pd

# CSV file that is read and then overwritten in place.
DEFAULT_CSV_PATH = 'test.csv'
# The same encoding is used for reading and writing: ISO-8859-1 maps every
# byte to exactly one character, so text columns are written back byte-for-byte
# instead of being re-encoded (and garbled further) on every run.
CSV_ENCODING = 'ISO-8859-1'
PATH_COLUMN = 'project path'
VISITS_COLUMN = 'visits'
# Zero-based positions of the names within path.split('/').  For example
# 'https://host/group/project' splits into
# ['https:', '', 'host', 'group', 'project'].
GROUP_SEGMENT = 3
PROJECT_SEGMENT = 4


def add_group_project_names(frame):
    """Return a copy of *frame* with 'group_name' and 'project_name' added.

    Args:
        frame: DataFrame containing a 'project path' column of strings
            (missing values allowed).

    Returns:
        A new DataFrame; the input is not modified.  Rows whose path is
        missing or has too few '/'-separated segments get a missing value
        in the affected column(s) instead of raising.
    """
    segments = frame[PATH_COLUMN].str.split('/')
    result = frame.copy()
    # .str.get yields NaN for missing paths and out-of-range positions, so
    # malformed rows can be filtered out later with dropna().
    result['group_name'] = segments.str.get(GROUP_SEGMENT)
    result['project_name'] = segments.str.get(PROJECT_SEGMENT)
    return result


def main(csv_path=DEFAULT_CSV_PATH):
    """Rewrite *csv_path* in place with the group and project name columns.

    Prints the row count before and after incomplete rows are dropped.

    Args:
        csv_path: CSV file to read and overwrite; must contain the
            'project path' and 'visits' columns.

    Returns:
        The DataFrame that was written to *csv_path*.
    """
    frame = pd.read_csv(
        csv_path,
        encoding=CSV_ENCODING,
        dtype=str,
        usecols=[PATH_COLUMN, VISITS_COLUMN],
    )
    print(len(frame))

    complete_rows = add_group_project_names(frame).dropna(how='any')
    complete_rows.to_csv(
        csv_path,
        columns=[PATH_COLUMN, VISITS_COLUMN, 'group_name', 'project_name'],
        index=False,
        encoding=CSV_ENCODING,
    )
    print(len(complete_rows))
    return complete_rows


if __name__ == '__main__':
    main()