Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
CSDN 技术社区
1024 Report
提交
1e93b039
1
1024 Report
项目概览
CSDN 技术社区
/
1024 Report
通知
84
Star
6
Fork
1
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
1
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
1
1024 Report
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
1
Issue
1
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
前往新版Gitcode,体验更适合开发者的 AI 搜索 >>
提交
1e93b039
编写于
10月 13, 2022
作者:
F
feilong
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
refactor data dir
上级
6f0bde03
变更
18
隐藏空白更改
内联
并排
Showing 18 changed files with 19 additions and 18 deletions
+19
-18
data/CSDN/Processor.jpg
data/CSDN/Processor.jpg
+0
-0
data/CSDN/repo-commit-rank.csv
data/CSDN/repo-commit-rank.csv
+0
-0
data/CSDN/repo-csdn-trends.xlsx
data/CSDN/repo-csdn-trends.xlsx
+0
-0
data/CSDN/repository_commit_events_20200930_analysis_new-demo.csv
...N/repository_commit_events_20200930_analysis_new-demo.csv
+0
-0
data/GitHub-Repos.xlsx
data/GitHub-Repos.xlsx
+0
-0
data/GitHub/UserInfo.xlsx
data/GitHub/UserInfo.xlsx
+0
-0
data/OSS数据需求.xlsx
data/OSS数据需求.xlsx
+0
-0
data/PingCAP/近24个月的活跃数据总数.csv
data/PingCAP/近24个月的活跃数据总数.csv
+0
-0
data/PingCAP/项目受欢迎度变化.csv
data/PingCAP/项目受欢迎度变化.csv
+0
-0
data/PingCAP/项目活跃度变化.csv
data/PingCAP/项目活跃度变化.csv
+0
-0
data/RepoType-OSChina.xlsx
data/RepoType-OSChina.xlsx
+0
-0
data/RepoType.xlsx
data/RepoType.xlsx
+0
-0
data/dataset/cncf-interactive-landscape.csv
data/dataset/cncf-interactive-landscape.csv
+0
-0
data/dataset/interactive_landscape.csv
data/dataset/interactive_landscape.csv
+0
-0
data/dataset/linuxfoundation-interactive-landscape.csv
data/dataset/linuxfoundation-interactive-landscape.csv
+0
-0
data/dataset/repo-list.json
data/dataset/repo-list.json
+0
-0
src/main.py
src/main.py
+6
-6
src/repoinfo.py
src/repoinfo.py
+13
-12
未找到文件。
CSDN/Processor.jpg
→
data/
CSDN/Processor.jpg
浏览文件 @
1e93b039
文件已移动
CSDN/repo-commit-rank.csv
→
data/
CSDN/repo-commit-rank.csv
浏览文件 @
1e93b039
文件已移动
CSDN/repo-csdn-trends.xlsx
→
data/
CSDN/repo-csdn-trends.xlsx
浏览文件 @
1e93b039
文件已移动
CSDN/repository_commit_events_20200930_analysis_new-demo.csv
→
data/
CSDN/repository_commit_events_20200930_analysis_new-demo.csv
浏览文件 @
1e93b039
文件已移动
GitHub-Repos.xlsx
→
data/
GitHub-Repos.xlsx
浏览文件 @
1e93b039
文件已移动
GitHub/UserInfo.xlsx
→
data/
GitHub/UserInfo.xlsx
浏览文件 @
1e93b039
文件已移动
OSS数据需求.xlsx
→
data/
OSS数据需求.xlsx
浏览文件 @
1e93b039
文件已移动
PingCAP/近24个月的活跃数据总数.csv
→
data/
PingCAP/近24个月的活跃数据总数.csv
浏览文件 @
1e93b039
文件已移动
PingCAP/项目受欢迎度变化.csv
→
data/
PingCAP/项目受欢迎度变化.csv
浏览文件 @
1e93b039
文件已移动
PingCAP/项目活跃度变化.csv
→
data/
PingCAP/项目活跃度变化.csv
浏览文件 @
1e93b039
文件已移动
RepoType-OSChina.xlsx
→
data/
RepoType-OSChina.xlsx
浏览文件 @
1e93b039
文件已移动
RepoType.xlsx
→
data/
RepoType.xlsx
浏览文件 @
1e93b039
文件已移动
dataset/cncf-interactive-landscape.csv
→
data/
dataset/cncf-interactive-landscape.csv
浏览文件 @
1e93b039
文件已移动
dataset/interactive_landscape.csv
→
data/
dataset/interactive_landscape.csv
浏览文件 @
1e93b039
文件已移动
dataset/linuxfoundation-interactive-landscape.csv
→
data/
dataset/linuxfoundation-interactive-landscape.csv
浏览文件 @
1e93b039
文件已移动
dataset/repo-list.json
→
data/
dataset/repo-list.json
浏览文件 @
1e93b039
文件已移动
src/main.py
浏览文件 @
1e93b039
...
...
@@ -23,7 +23,7 @@ config = {
},
"schema"
:
{
"repo_github_user_info"
:
{
"file"
:
"../GitHub/Userinfo.xlsx"
,
"file"
:
"../
data/
GitHub/Userinfo.xlsx"
,
"sheet_name"
:
"repo"
,
"desc"
:
"开源项目Github贡献者信息"
,
"fields"
:
[
...
...
@@ -100,7 +100,7 @@ config = {
]
},
"repo_github_info"
:
{
"file"
:
"../Github-Repos.xlsx"
,
"file"
:
"../
data/
Github-Repos.xlsx"
,
"sheet_name"
:
"汇总"
,
"desc"
:
"开源项目在Github上的项目交互数据"
,
"fields"
:
[
...
...
@@ -162,7 +162,7 @@ config = {
]
},
"repo_csdn_trends"
:
{
"file"
:
"../CSDN/repo-csdn-trends.xlsx"
,
"file"
:
"../
data/
CSDN/repo-csdn-trends.xlsx"
,
"sheet_name"
:
"Sheet1"
,
"desc"
:
"开源项目在CSDN站内指数数据"
,
"fields"
:
[
...
...
@@ -179,7 +179,7 @@ config = {
]
},
"repo_commit_rank"
:
{
"file"
:
"../CSDN/repo-commit-rank.csv"
,
"file"
:
"../
data/
CSDN/repo-commit-rank.csv"
,
"desc"
:
"开源项目在Github的月commit变化"
,
"fields"
:
[
{
...
...
@@ -205,7 +205,7 @@ config = {
]
},
"repo_github_active_trends"
:
{
"file"
:
"../PingCAP/项目活跃度变化.csv"
,
"file"
:
"../
data/
PingCAP/项目活跃度变化.csv"
,
"desc"
:
"开源项目在Github上的月活跃度数据"
,
"fields"
:
[
{
...
...
@@ -241,7 +241,7 @@ config = {
]
},
"repo_github_popular_trends"
:
{
"file"
:
"../PingCAP/项目受欢迎度变化.csv"
,
"file"
:
"../
data/
PingCAP/项目受欢迎度变化.csv"
,
"desc"
:
"开源项目在Github上的月收欢迎程度数据"
,
"fields"
:
[
{
...
...
src/repoinfo.py
浏览文件 @
1e93b039
...
...
@@ -6,38 +6,39 @@ import time
import
re
# 读取json文件
with
open
(
"dataset/repo-list.json"
,
'r'
)
as
f
:
with
open
(
"
../data/
dataset/repo-list.json"
,
'r'
)
as
f
:
data
=
json
.
load
(
f
)
with
open
(
'dataset/result.txt'
,
'r+'
)
as
file
:
with
open
(
'
../data/
dataset/result.txt'
,
'r+'
)
as
file
:
file
.
truncate
(
0
)
for
list_item
in
data
:
# print(list_item["full_name"])
a
=
list_item
[
"full_name"
]
url
=
"https://api.github.com/repos/"
+
a
# url2 = "https://api.github.com/repos/" + a + "/contributors?per_page=1&anon=true"
payload
=
{}
payload
=
{}
headers
=
{
'Authorization'
:
''
# 这里填入你自己的 GitHub Personal Access Token
}
'Authorization'
:
''
# 这里填入你自己的 GitHub Personal Access Token
}
response
=
requests
.
request
(
"GET"
,
url
,
headers
=
headers
,
data
=
payload
)
# response2 = requests.request("GET", url2, headers=headers, data=payload)
# headers2 = requests.get(url2).headers
# print(headers2)
# pagesize = [int(s) for s in re.findall(r'\b\d+\b',headers2['Link'])]
# print(str(response.json()["id"])+ ',' + response.json()["owner"]["login"] + ',' + response.json()["full_name"] + ',' + str(response.json()["stargazers_count"]) + ',' + str(response.json()["forks_count"]) + ',' + str(response.json()["open_issues"]) + ',' + str(pagesize[-1]))
# with open('dataset/result.txt', 'a') as f:
# f.write(str(response.json()["id"])+ ',' + response.json()["owner"]["login"] + ',' + response.json()["full_name"] + ',' + str(response.json()["stargazers_count"]) + ',' + str(response.json()["forks_count"]) + ',' + str(pagesize[-1]) + "\n")
# time.sleep(4) # Sleep for 2 seconds
# print(str(response.json()["id"])+ ',' + response.json()["owner"]["login"] + ',' + response.json()["full_name"] + ',' + str(response.json()["stargazers_count"]) + ',' + str(response.json()["forks_count"]) + ',' + str(response.json()["open_issues"]))
with
open
(
'dataset/result.txt'
,
'a'
)
as
f
:
f
.
write
(
str
(
response
.
json
()[
"id"
])
+
','
+
response
.
json
()[
"owner"
][
"login"
]
+
','
+
response
.
json
()[
"full_name"
]
+
','
+
str
(
response
.
json
()[
"stargazers_count"
])
+
','
+
str
(
response
.
json
()[
"forks_count"
])
+
"
\n
"
)
time
.
sleep
(
2
)
# Sleep for 2 seconds
\ No newline at end of file
with
open
(
'../data/dataset/result.txt'
,
'a'
)
as
f
:
f
.
write
(
str
(
response
.
json
()[
"id"
])
+
','
+
response
.
json
()[
"owner"
][
"login"
]
+
','
+
response
.
json
()[
"full_name"
]
+
','
+
str
(
response
.
json
()[
"stargazers_count"
])
+
','
+
str
(
response
.
json
()[
"forks_count"
])
+
"
\n
"
)
time
.
sleep
(
2
)
# Sleep for 2 seconds
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录