2015-07-23 04:23:50 +00:00
|
|
|
var cheerio = require('cheerio');
|
|
|
|
var https = require('https');
|
|
|
|
var fs = require('fs');
|
|
|
|
var path = require('path');
|
|
|
|
var querystring = require('querystring');
|
|
|
|
var crypto = require('crypto');
|
|
|
|
|
2017-04-05 06:02:31 +00:00
|
|
|
import { LoggerFactory } from '@calzoneman/jsli';
|
|
|
|
const LOGGER = LoggerFactory.getLogger('google2vtt');
|
2015-07-23 04:23:50 +00:00
|
|
|
|
|
|
|
/**
 * Compute the MD5 digest of `input` and return it base64-encoded, with the
 * three non-alphanumeric base64 characters substituted:
 * `/` becomes a space, `+` becomes `#` and `=` becomes `-`.
 *
 * The result therefore never contains a `/`.
 *
 * @param {string|Buffer} input - data to hash
 * @returns {string} the substituted base64 digest
 */
function md5(input) {
    var digest = crypto.createHash('md5').update(input).digest('base64');

    return digest
        .replace(/\//g, ' ')
        .replace(/\+/g, '#')
        .replace(/=/g, '-');
}
|
|
|
|
|
|
|
|
// Borrowed so array-like objects can be copied into real arrays.
const slice = Array.prototype.slice;

// Directory (one level above this module) where converted .vtt files are kept.
const subtitleDir = path.resolve(__dirname, '..', 'google-drive-subtitles');

// Absolute file name -> true while a request is working on that file.
const subtitleLock = {};

// Durations in milliseconds.
const ONE_HOUR = 60 * 60 * 1000;
const ONE_DAY = 24 * ONE_HOUR;
|
2015-07-23 04:23:50 +00:00
|
|
|
|
|
|
|
/**
 * Render `n` as a string, prefixing a single '0' when the string form is
 * shorter than two characters.
 *
 * @param {number|string} n - value to render
 * @returns {string} the (possibly zero-prefixed) string form of `n`
 */
function padZeros(n) {
    var text = n.toString();
    return text.length < 2 ? '0' + text : text;
}
|
|
|
|
|
|
|
|
/**
 * Format a time offset in seconds as a WebVTT-style timestamp:
 * `mm:ss.ttt`, or `hh:mm:ss.ttt` when the hour component is non-zero.
 *
 * The value is rounded to whole milliseconds *before* it is split into
 * components, so a fraction that rounds up to a full second carries into the
 * seconds/minutes/hours fields (59.9996 -> "01:00.000") instead of being
 * dropped.
 *
 * @param {number} time - offset in seconds (may be fractional)
 * @returns {string} the formatted timestamp
 */
function formatTime(time) {
    // Left-pad the decimal form of `value` with zeros up to `width` digits.
    function pad(value, width) {
        var text = String(value);
        while (text.length < width) {
            text = '0' + text;
        }
        return text;
    }

    var totalMs = Math.round(time * 1000);

    var hours = Math.floor(totalMs / 3600000);
    var rest = totalMs % 3600000;
    var minutes = Math.floor(rest / 60000);
    rest = rest % 60000;
    var seconds = Math.floor(rest / 1000);
    var millis = rest % 1000;

    var fields = [minutes, seconds];
    if (hours) {
        // The hour field is only emitted when it is non-zero.
        fields.unshift(hours);
    }

    var clock = fields.map(function (field) {
        return pad(field, 2);
    }).join(':');

    return clock + '.' + pad(millis, 3);
}
|
|
|
|
|
2015-07-25 17:31:21 +00:00
|
|
|
/**
 * Prepare caption text for use as WebVTT cue text.
 *
 * Two things happen:
 *  1. The character references `&amp;`, `&lt;`, `&gt;`, `&quot;` and `&#39;`
 *     are decoded to the characters they stand for. Decoding is done in a
 *     single pass so already-decoded output is never decoded a second time
 *     (`&amp;lt;` becomes `&lt;`, not `<`).
 *  2. Any `-->` sequence is rewritten to `--&gt;`, because `-->` is the cue
 *     timing separator and must not appear inside cue text.
 *
 * NOTE(review): this assumes the text handed in can still contain literal
 * character references after XML parsing — confirm against real responses.
 *
 * @param {string} text - raw caption text
 * @returns {string} text safe to place under a cue timing line
 */
function fixText(text) {
    var decoded = {
        'amp': '&',
        'lt': '<',
        'gt': '>',
        'quot': '"',
        '#39': "'"
    };

    return text
        .replace(/&(amp|lt|gt|quot|#39);/g, function (match, entity) {
            return decoded[entity];
        })
        .replace(/-->/g, '--&gt;');
}
|
|
|
|
|
|
|
|
exports.convert = function convertSubtitles(subtitles) {
|
|
|
|
var $ = cheerio.load(subtitles, { xmlMode: true });
|
|
|
|
var lines = slice.call($('transcript text').map(function (index, elem) {
|
|
|
|
var start = parseFloat(elem.attribs.start);
|
|
|
|
var end = start + parseFloat(elem.attribs.dur);
|
2015-07-25 17:31:21 +00:00
|
|
|
var text;
|
|
|
|
if (elem.children.length) {
|
|
|
|
text = elem.children[0].data;
|
|
|
|
} else {
|
|
|
|
text = '';
|
|
|
|
}
|
2015-07-23 04:23:50 +00:00
|
|
|
|
|
|
|
var line = formatTime(start) + ' --> ' + formatTime(end);
|
2015-07-25 17:31:21 +00:00
|
|
|
line += '\n' + fixText(text) + '\n';
|
2015-07-23 04:23:50 +00:00
|
|
|
return line;
|
|
|
|
}));
|
|
|
|
|
|
|
|
return 'WEBVTT\n\n' + lines.join('\n');
|
|
|
|
};
|
|
|
|
|
|
|
|
exports.attach = function setupRoutes(app) {
|
2015-07-25 17:31:21 +00:00
|
|
|
app.get('/gdvtt/:id/:lang/(:name)?.vtt', handleGetSubtitles);
|
2015-07-23 04:23:50 +00:00
|
|
|
};
|
|
|
|
|
|
|
|
/**
 * Request handler for the subtitle route.
 *
 * Serves the cached .vtt file for (id, lang, name) when it exists; otherwise
 * fetches and converts the subtitles first and then serves the new file.
 * Work on a given cache file is serialized through takeSubtitleLock.
 *
 * Responds with 400 when `id`, `lang` or the `vid` query parameter is not a
 * string, or when `id`/`lang` contain a path separator or NUL character, and
 * with 500 when fetching/converting fails.
 *
 * @param {object} req - request; reads params.id, params.lang, params.name
 *                       and query.vid
 * @param {object} res - response; uses sendStatus and sendFile
 */
function handleGetSubtitles(req, res) {
    var id = req.params.id;
    var lang = req.params.lang;
    var name = req.params.name || '';
    var vid = req.query.vid;

    if (typeof vid !== 'string' || typeof id !== 'string' || typeof lang !== 'string') {
        return res.sendStatus(400);
    }

    // id and lang are copied verbatim into the cache file name. Refuse path
    // separators and NUL so the resulting path cannot leave subtitleDir.
    // (name is hashed before use, so it needs no such check.)
    var unsafePathChars = /[\\\/\0]/;
    if (unsafePathChars.test(id) || unsafePathChars.test(lang)) {
        return res.sendStatus(400);
    }

    var file = [id, lang, md5(name)].join('_') + '.vtt';
    var fileAbsolute = path.join(subtitleDir, file);

    takeSubtitleLock(fileAbsolute, function () {
        // fs.access reports an error when the file is not there yet.
        fs.access(fileAbsolute, function (accessErr) {
            if (!accessErr) {
                res.sendFile(file, { root: subtitleDir });
                delete subtitleLock[fileAbsolute];
                return;
            }

            fetchSubtitles(id, lang, name, vid, fileAbsolute, function (err) {
                // Release the lock whether or not the fetch succeeded.
                delete subtitleLock[fileAbsolute];

                if (err) {
                    LOGGER.error(err.stack);
                    return res.sendStatus(500);
                }

                res.sendFile(file, { root: subtitleDir });
            });
        });
    });
}
|
|
|
|
|
|
|
|
/**
 * Download a subtitle track, convert it to WebVTT and write it to `file`.
 *
 * @param {string} id - sent as both the `id` and `v` query parameters
 * @param {string} lang - sent as the `lang` query parameter
 * @param {string} name - sent as the `name` query parameter
 * @param {string} vid - sent as the `vid` query parameter
 * @param {string} file - path the converted subtitles are written to
 * @param {function(Error=)} cb - invoked exactly once: with an error when the
 *        request, the conversion or the write fails, with no arguments on
 *        success
 */
function fetchSubtitles(id, lang, name, vid, file, cb) {
    // Several failure events can fire for one request; report only the first.
    var finished = false;
    function done(err) {
        if (finished) {
            return;
        }
        finished = true;
        if (err) {
            cb(err);
        } else {
            cb();
        }
    }

    var query = {
        id: id,
        v: id,
        vid: vid,
        lang: lang,
        name: name,
        type: 'track',
        kind: undefined
    };

    var url = 'https://drive.google.com/timedtext?' + querystring.stringify(query);

    https.get(url, function (res) {
        if (res.statusCode !== 200) {
            // Discard the body so the underlying socket is released.
            res.resume();
            return done(new Error(res.statusMessage));
        }

        var buf = '';
        res.setEncoding('utf-8');

        res.on('data', function (data) {
            buf += data;
        });

        // A response that breaks off mid-stream never emits 'end'.
        res.on('error', done);

        res.on('end', function () {
            try {
                buf = exports.convert(buf);
            } catch (e) {
                return done(e);
            }

            fs.writeFile(file, buf, function (err) {
                if (err) {
                    done(err);
                } else {
                    LOGGER.info('Saved subtitle file ' + file);
                    done();
                }
            });
        });
    }).on('error', done);
}
|
2015-07-25 08:19:32 +00:00
|
|
|
|
|
|
|
/**
 * Delete every entry in subtitleDir whose modification time is more than
 * ONE_DAY in the past.
 *
 * Best effort: a failure to list the directory, stat an entry or delete a
 * file is logged and otherwise ignored.
 */
function clearOldSubtitles() {
    fs.readdir(subtitleDir, function (err, files) {
        if (err) {
            LOGGER.error(err.stack);
            return;
        }

        files.forEach(function (file) {
            var absolute = path.join(subtitleDir, file);

            fs.stat(absolute, function (err, stats) {
                if (err) {
                    LOGGER.error(err.stack);
                    return;
                }

                if (stats.mtime.getTime() < Date.now() - ONE_DAY) {
                    LOGGER.info('Deleting old subtitle file: ' + file);
                    // fs.unlink needs a callback; use it to surface failures.
                    fs.unlink(absolute, function (unlinkErr) {
                        if (unlinkErr) {
                            LOGGER.error(unlinkErr.stack);
                        }
                    });
                }
            });
        });
    });
}
|
|
|
|
|
2015-07-29 03:34:55 +00:00
|
|
|
/**
 * Acquire the lock for `filename`, then invoke `cb` via setImmediate.
 *
 * When the lock is free it is taken right away. Otherwise the lock is polled
 * every 200 ms; it is taken as soon as it is free, or unconditionally once
 * the try counter (which starts at 1 and is bumped on every poll) reaches 5.
 *
 * @param {string} filename - key identifying the lock
 * @param {function()} cb - called once the lock has been taken
 */
function takeSubtitleLock(filename, cb) {
    var isHeld = function () {
        return subtitleLock.hasOwnProperty(filename);
    };

    if (!isHeld()) {
        subtitleLock[filename] = true;
        return setImmediate(cb);
    }

    var attempts = 1;
    var timer = setInterval(function () {
        attempts++;

        // Keep waiting while someone else holds the lock and tries remain.
        if (isHeld() && attempts < 5) {
            return;
        }

        subtitleLock[filename] = true;
        clearInterval(timer);
        return setImmediate(cb);
    }, 200);
}
|
|
|
|
|
2015-07-25 08:19:32 +00:00
|
|
|
// Schedule the cleanup of old subtitle files to run every hour...
setInterval(clearOldSubtitles, ONE_HOUR);

// ...and run it once right away when this module is loaded.
clearOldSubtitles();
|