summaryrefslogtreecommitdiff
path: root/html2json.js
blob: 1c4ae9b01dff5c56359086b6249f97e90057367f (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
var cheerio = require('cheerio')
var path = require('path')

// Read the HTML report
fs = require('fs')
var htmlContent;
try {
    htmlContent = fs.readFileSync(process.argv[2], 'utf8');
} catch(e) {
    console.log('Error:', e.stack);
    process.exit(1);
}

// Get the directory containing the results to make pathes relative to it later.
report_directory = path.dirname(process.argv[2])

const $ = cheerio.load(htmlContent)

// Map that keeps the total tally of the license occurrences
var licenses = {};

// Extract dependencies info.
var dependencies = []
$('div.dependencies div').each(function(i, doc) {
    // Get license name.
    license = $(this).find('blockquote p').text().trim();
    license = license.split("\n")[0];

    if(licenses[license]) {
        licenses[license].count += 1;
    } else {
        licenses[license] = { count: 1, name: license }
    }

    // Get URL.
    license_url = $(this).find('blockquote p a[href]').attr('href');

    // Get dependency name.
    dependency_name = $(this).find('h2').text().trim();
    dependency_name = dependency_name.split("\n")[0];

    // Get dependency URL.
    dependency_url = $(this).find('h2 a[href]').attr('href');

    // Get dependency description.
    dependency_description = $(this).find('dl').first().next().text().trim();

    // Get dependency location relative to the project root path
    dependency_pathes = []
    $(this).find('dl').first().find('dd').each(function(i, doc) {
        dependency_path = path.relative(report_directory, $(this).text().trim());

        // Whitespace path means current directory
        if (!dependency_path) {
            dependency_path = ".";
        }

        dependency_pathes.push(dependency_path);
    })
    dependencies.push({
        license: {
            name: license,
            url: license_url
        },
        dependency: {
            name: dependency_name,
            url: dependency_url,
            description: dependency_description,
            pathes: dependency_pathes
        }
    })
})

// Stable sort of licenses. First license count descending, then license name ascending
licenses = Object.values(licenses)
  .sort(function (a, b) {
  if (a.count === b.count) {
    return a.name > b.name ? 1 : -1;
  }
  return a.count < b.count ? 1 : -1;
});

console.log(JSON.stringify({
    licenses: licenses,
    dependencies: dependencies}, null, 2))