diff --git a/replace_archive.py b/replace_archive.py deleted file mode 100644 index 98bf681d6d6d5f234053680295581c49869f3ace..0000000000000000000000000000000000000000 --- a/replace_archive.py +++ /dev/null @@ -1,18 +0,0 @@ -import pandas as pd - -csv = pd.read_csv('test.csv') -print(len(csv)) - -replace_archive_row = [] -for i in range(len(csv)): - if 'archive' in csv['project path'][i]: - replace_archive_row.append(i) - -for index in replace_archive_row: - for index_, item in enumerate(csv['project path'][index].split('/')): - if 'archive' in item: - csv['project path'][index] = '/'.join(csv['project path'][index].split('/')[0:index_]) - break - -csv.to_csv('test.csv', columns=['project path', 'visits'], index=False) -print(len(csv)) \ No newline at end of file diff --git a/replace_blob.py b/replace_blob.py deleted file mode 100644 index 3f9127a104f75a94b099a058d878fedcdfabffb2..0000000000000000000000000000000000000000 --- a/replace_blob.py +++ /dev/null @@ -1,19 +0,0 @@ -import pandas as pd - -csv = pd.read_csv('test.csv') -print(len(csv)) - -replace_blob_row = [] -for i in range(len(csv)): - if 'blob' in csv['project path'][i]: - replace_blob_row.append(i) - - -for index in replace_blob_row: - for index_, item in enumerate(csv['project path'][index].split('/')): - if item == 'blob': - csv['project path'][index] = '/'.join(csv['project path'][index].split('/')[0:index_]) - break - -csv.to_csv('test.csv', columns=['project path', 'visits'], index=False) -print(len(csv)) \ No newline at end of file diff --git a/replace_issues.py b/replace_issues.py deleted file mode 100644 index 6e1f87309eacd9c344a5138fd4403adcf41b4a66..0000000000000000000000000000000000000000 --- a/replace_issues.py +++ /dev/null @@ -1,18 +0,0 @@ -import pandas as pd - -csv = pd.read_csv('test.csv') -print(len(csv)) - -replace_tree_row = [] -for i in range(len(csv)): - if 'issues' in csv['project path'][i]: - replace_tree_row.append(i) - -for index in replace_tree_row: - for index_, item in enumerate(csv['project path'][index].split('/')): - if 'issues' in item: - csv['project path'][index] = '/'.join(csv['project path'][index].split('/')[0:index_]) - break - -csv.to_csv('test.csv', columns=['project path', 'visits'], index=False) -print(len(csv)) \ No newline at end of file diff --git a/replace_release.py b/replace_release.py deleted file mode 100644 index 7788defe89b63d8778492cf156fcbdd870822d58..0000000000000000000000000000000000000000 --- a/replace_release.py +++ /dev/null @@ -1,19 +0,0 @@ -import pandas as pd - -csv = pd.read_csv('test.csv') -print(len(csv)) - -replace_release_row = [] -for i in range(len(csv)): - if 'release' in csv['project path'][i]: - replace_release_row.append(i) - -for index in replace_release_row: - for index_, item in enumerate(csv['project path'][index].split('/')): - if item == 'releases': - csv['project path'][index] = '/'.join(csv['project path'][index].split('/')[0:index_]) - break - - -csv.to_csv('test.csv', columns=['project path', 'visits'], index=False) -print(len(csv)) \ No newline at end of file diff --git a/replace_tree.py b/replace_tree.py deleted file mode 100644 index e9c1ae1fe1a649a25ab6dec2be23b08e6f6693ed..0000000000000000000000000000000000000000 --- a/replace_tree.py +++ /dev/null @@ -1,18 +0,0 @@ -import pandas as pd - -csv = pd.read_csv('test.csv') -print(len(csv)) - -replace_tree_row = [] -for i in range(len(csv)): - if 'tree' in csv['project path'][i]: - replace_tree_row.append(i) - -for index in replace_tree_row: - for index_, item in enumerate(csv['project path'][index].split('/')): - if item == 'tree': - csv['project path'][index] = '/'.join(csv['project path'][index].split('/')[0:index_]) - break - -csv.to_csv('test.csv', columns=['project path', 'visits'], index=False) -print(len(csv)) \ No newline at end of file diff --git a/run_githublink.sh b/run_githublink.sh index 4d5c8b0e40b6f0dde080d905288dbdc26e3bff6a..083fdff9b408b249c517214f39ab9fa524c1e55e 100755 --- a/run_githublink.sh +++ b/run_githublink.sh @@ -3,19 +3,11 @@ python delete_none_value.py python delete_not_githublink.py python delete_grouplink.py +python replace_wiki.py +python drop_duplicates.py python replace_#.py python replace_%.py python replace_?.py python replace_.git.py python drop_duplicates.py -# python delete_login_settings.py -python replace_wiki.py -python drop_duplicates.py -# python replace_issues.py -# python replace_release.py -# python replace_blob.py -# python replace_tree.py -# python replace_archive.py -python delete_grouplink.py -# python add_group_project_name.py -python drop_duplicates.py \ No newline at end of file +python delete_grouplink.py \ No newline at end of file