-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathextractformats.js
106 lines (94 loc) · 3.12 KB
/
extractformats.js
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
var d3 = require('d3'),
fs = require('fs');
var output = [];
var writeFinalData = function(data){
var finalData = d3.tsv.format(data);
fs.writeFile('output/output_ex.tsv', finalData, function(err) {
if(err) {
return console.log(err);
}
console.log("The file was saved!");
});
}
var extensions = fs.readFileSync('data/extensions.tsv','utf8')
extensions = d3.tsv.parse(extensions)
var exList = extensions.map(function(d){
return d.ex;
})
var dir = 'output/users_top_repos_trees/';
fs.readdir(dir,function(err,files){
if (err) throw err;
var count = 0;
var total = files.length;
//var total = 5;
files.forEach(function(file,i){
fs.readFile(dir+file,'utf-8',function(err,data){
var repoData = JSON.parse(data);
var filesData = repoData.filter(function(d){
return d.type == 'blob'
})
filesData.forEach(function(d){
var ex = d.path.split('.')
if(ex.length > 0){
ex = ex[ex.length-1].toLowerCase();
if(exList.indexOf(ex) > -1){
//console.log(ex)
var elm = {
user:d.url.split('/')[4],
repo:d.url.split('/')[5],
path:d.path,
extension:ex,
size:d.size
}
output.push(elm);
// count++
// console.log(count + '/' + total + ' ' + file)
// if(count == total){
// writeFinalData(output);
// }
}else{
// count++
// console.log(count + '/' + total + ' ' + file)
// if(count == total){
// writeFinalData(output);
// }
}
}else{
// count++
// console.log(count + '/' + total + ' ' + file)
// if(count == total){
// writeFinalData(output);
// }
}
})
count++
console.log(count + '/' + total + ' ' + file)
if(count == total){
writeFinalData(output);
//break;
}
// var elm = {
// user:repoData.owner.login,
// name: repoData.name,
// owner: repoData.owner.login,
// description: repoData.description,
// fork: repoData.fork,
// language: repoData.language,
// forks_count: repoData.forks_count,
// stargazers_count: repoData.stargazers_count,
// watchers_count: repoData.watchers_count,
// size: repoData.size,
// default_branch: repoData.default_branch,
// open_issues_count: repoData.open_issues_count,
// pushed_at: repoData.pushed_at,
// updated_at: repoData.updated_at
// }
// output.push(elm);
// count++
// console.log(count + '/' + total + ' ' +repoData.name)
// if(count == total){
// writeFinalData(output);
// }
});
});
});