forked from developmentseed/skynet-data
-
Notifications
You must be signed in to change notification settings - Fork 0
/
remove-bad-images
executable file
·56 lines (51 loc) · 1.64 KB
/
remove-bad-images
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
#!/usr/bin/env node
var fs = require('fs')
var path = require('path')
var jpeg = require('jpeg-js')
var split = require('split')
var argv = require('minimist')(process.argv.slice(2), {
default: {
visuallyBlack: 40,
blackThreshold: 0.95,
visuallyWhite: 220,
whiteThreshold: 0.50
},
boolean: ['dryrun']
})
// Delete images in which X% of pixels are "visually black" or "visually white"
console.log(argv)
var inputs = []
process.stdin.pipe(split())
.on('data', function (name) { inputs.push(name) })
.on('end', function () {
var deletedCount = 0
inputs
.filter(Boolean)
.forEach(function (name, j) {
var filename = path.resolve(name)
var jpegData = fs.readFileSync(filename)
var rawImageData = jpeg.decode(jpegData, true) // return as Uint8Array
var data = rawImageData.data
var darkPixelCount = 0
var lightPixelCount = 0
for (var i = 0; i < data.length; i++) {
if (Math.max(data[i], data[i + 1], data[i + 2]) < argv.visuallyBlack) {
darkPixelCount++
}
if (Math.min(data[i], data[i + 1], data[i + 2]) > argv.visuallyWhite) {
lightPixelCount++
}
}
if (darkPixelCount >= (data.length / 4 * argv.blackThreshold) ||
lightPixelCount >= (data.length / 4 * argv.whiteThreshold)) {
deletedCount++
if (!argv.dryrun) {
fs.unlinkSync(filename)
}
console.log(argv.dryrun ? 'DRYRUN delete' : 'delete', filename, darkPixelCount, '(' + j + ' of ' + inputs.length + ')')
} else {
console.log('pass', filename, darkPixelCount, '(' + j + ' of ' + inputs.length + ')')
}
})
console.log('Deleted ' + deletedCount + ' bad images.')
})