backend/src/router/websocket.ts

247 lines
8.7 KiB
TypeScript

import { Elysia, t } from 'elysia';
import { RedisRateLimiter } from 'rolling-rate-limiter'
import * as fs from 'node:fs'
import { db } from '@/utils/database'
import { validateVideo, validateChannel } from '@/utils/regex'
import { checkCaptcha, createDatabaseVideo } from '@/utils/common';
import { downloadVideo } from '@/utils/download';
import { uploadVideo } from '@/utils/upload';
import { getChannelVideos, getVideo } from '@/utils/metadata';
import { error } from '@/utils/html'
import redis from '@/utils/redis';
import { parseSlop } from '@/utils/slop';
const app = new Elysia()
const videoIds: Record<string, string> = {}
const limiter = new RedisRateLimiter({
client: redis,
namespace: 'save:',
interval: 24 * 60 * 60000, // 24h
maxInInterval: 50
})
const sendError = (ws: any, message: string, close: boolean = true) => {
ws.send(`ERROR - ${message}`);
if (close) ws.close();
};
const cleanup = async (ws: any, videoId: string) => {
delete videoIds[ws.id];
if (videoId) await redis.del(videoId);
await redis.del(ws.id);
};
const handleUpload = async (ws: any, videoId: string, isChannel: boolean = false) => {
// the pattern of files that have finished downloading is [videoid].mp4, but some extensions are also possible due to
// current youtube changes, so we need to make sure the other extensions are also covered
let filePath = fs.readdirSync('./videos/').find(f => f.includes(`${videoId}.`))
if (!filePath) {
ws.send(`DATA - Video file for ${videoId} not found. Skipping.`);
return false;
}
filePath = './videos/' + filePath
try {
ws.send('DATA - Uploading file...');
const videoUrl = await uploadVideo(filePath);
fs.unlinkSync(filePath);
const uploaded = await createDatabaseVideo(videoId, videoUrl);
if (uploaded !== 'success') {
ws.send(`DATA - Error while uploading - ${JSON.stringify(uploaded)}`);
return false;
}
if (!isChannel) ws.send(`DONE - ${process.env.FRONTEND}/watch?v=${videoId}`);
return true;
} catch (error: any) {
ws.send(`ERROR - Upload failed for ${videoId}: ${error.message}`);
console.log(`upload failed for ${videoId}: ${error.message}`)
if (fs.existsSync(filePath)) fs.unlinkSync(filePath)
return false;
}
};
const getRateLimitKey = (ip: string): string => {
if (!ip || ip === '0.0.0.0') return ip;
if (ip.includes(':')) {
const parts = ip.split(':');
if (parts.length >= 3) {
return `${parts[0]}:${parts[1]}:${parts[2]}`;
}
return ip;
}
return ip;
};
app.ws('/save', {
query: t.Object({
url: t.String()
}),
body: t.String(),
open: async (ws) => {
console.log(`${ws.id} - ${ws.data.path} - ${JSON.stringify(ws.data.query)}`)
const videoId = validateVideo(ws.data.query.url)
if (!videoId) return sendError(ws, 'Invalid video URL.');
if (await redis.get(videoId)) return sendError(ws, 'Someone is already downloading this video...');
if (await redis.get(`blacklist:${videoId}`)) return sendError(ws, 'This video is blacklisted.');
const already = await db.selectFrom('videos')
.select('id')
.where('id', '=', videoId)
.executeTakeFirst()
if (already) {
ws.send(`DONE - ${process.env.FRONTEND}/watch?v=${videoId}`)
ws.close()
} else {
const hash = Bun.hash(getRateLimitKey(ws.data.headers['cf-connecting-ip'] || '0.0.0.0'))
const isLimited = await limiter.limit(hash.toString())
if (isLimited) {
return sendError(ws, 'You have been ratelimited. </br>Is this an urgent archive? Please email me: admin@preservetube.com');
}
ws.send('DATA - This process is automatic. Your video will start archiving shortly.')
ws.send('CAPTCHA - Solving a cryptographic challenge before downloading.')
videoIds[ws.id] = videoId
}
},
message: async (ws, message) => {
if (message == 'alive') return
const videoId = videoIds[ws.id];
if (!videoId) return sendError(ws, 'No video ID associated with this session.');
if (await redis.get(videoId) !== 'downloading') {
await redis.set(videoId, 'downloading', 'EX', 300)
const captchaCheck = await checkCaptcha(message, ws.data.headers['cf-connecting-ip'] || '0.0.0.0')
if (!captchaCheck.success) {
await cleanup(ws, videoId);
console.log(`captcha failed for ${videoId} - ${JSON.stringify(captchaCheck)}`)
return sendError(ws, 'Captcha validation failed.');
} else {
ws.send('DATA - Captcha validated. Starting download...');
}
const data = await getVideo(videoId)
if (data.error) {
return sendError(ws, 'Unable to retrieve video info from YouTube. Please try again later.')
}
const slopScore = await parseSlop(videoId, data.videoDetails.title,
(data.microformat.playerMicroformatRenderer.description?.simpleText || '').replaceAll('\n', '<br>'))
if (slopScore >= 4) {
sendError(ws, 'Filters can always be wrong. Is the rating wrong? Email me at admin@preservetube.com', false);
return sendError(ws, 'Your download has been rejected by our slop filter.');
}
const downloadResult = await downloadVideo(ws, videoId);
if (downloadResult.fail) {
await cleanup(ws, videoId);
return sendError(ws, downloadResult.message);
}
const uploadSuccess = await handleUpload(ws, videoId);
if (!uploadSuccess) await redis.del(videoId);
await cleanup(ws, videoId);
ws.close();
} else {
ws.send('DATA - Captcha already submitted.');
}
},
close: async (ws) => {
await cleanup(ws, videoIds[ws.id]);
console.log(`closed - ${ws.data.path} - ${JSON.stringify(ws.data.query)}`)
}
})
app.ws('/savechannel', {
query: t.Object({
url: t.String()
}),
body: t.String(),
open: async (ws) => {
console.log(`${ws.id} - ${ws.data.path} - ${JSON.stringify(ws.data.query)}`)
const channelId = await validateChannel(ws.data.query.url);
if (!channelId) return sendError(ws, 'Invalid channel URL.');
if (typeof channelId !== 'string') return sendError(ws, `Failed to fetch channel ID - ${channelId.error}`)
ws.send('DATA - This process is automatic. Your video will start archiving shortly.')
ws.send('CAPTCHA - Solving a cryptographic challenge before downloading.')
videoIds[ws.id] = `captcha-${channelId}`;
},
message: async (ws, message) => {
if (message == 'alive') return
const status = videoIds[ws.id];
if (!status || !status.startsWith('captcha-')) return sendError(ws, 'No channel associated with this session.');
const channelId = status.replace('captcha-', '');
const captchaCheck = await checkCaptcha(message, ws.data.headers['cf-connecting-ip'] || '0.0.0.0')
if (!captchaCheck.success) {
await cleanup(ws, channelId);
console.log(`captcha failed for ${channelId} - ${JSON.stringify(captchaCheck)}`)
return sendError(ws, 'Captcha validation failed.');
} else {
ws.send('DATA - Captcha validated. Starting download...');
}
videoIds[ws.id] = `downloading-${channelId}`;
const videos = await getChannelVideos(channelId);
for (const video of videos.slice(0, 5)) {
if (!video || (await redis.get(video.video_id)) || (await redis.get(`blacklist:${video.video_id}`))) continue;
const already = await db.selectFrom('videos')
.select('id')
.where('id', '=', video.video_id)
.executeTakeFirst()
if (already) continue
const hash = Bun.hash(getRateLimitKey(ws.data.headers['cf-connecting-ip'] || '0.0.0.0'))
const isLimited = await limiter.limit(hash.toString())
if (isLimited) {
sendError(ws, 'You have been ratelimited. </br>Is this an urgent archive? Please email me: admin@preservetube.com', false);
break;
}
const slopScore = await parseSlop(video.video_id, video.title.text, video.description_snippet?.text || '')
if (slopScore >= 4) {
sendError(ws, 'Filters can always be wrong. Is the rating wrong? Email me at admin@preservetube.com', false);
sendError(ws, 'Your download has been rejected by our slop filter.');
continue;
}
ws.send(`DATA - Processing video: ${video.title.text}`);
await redis.set(video.video_id, 'downloading', 'EX', 300);
const downloadResult = await downloadVideo(ws, video.video_id);
if (!downloadResult.fail) await handleUpload(ws, video.video_id, true);
await redis.del(video.video_id);
ws.send(`DATA - Created video page for ${video.title.text}`)
}
await cleanup(ws, channelId);
ws.send(`DONE - ${process.env.FRONTEND}/channel/${channelId}`)
ws.close();
},
close: async (ws) => {
await cleanup(ws, videoIds[ws.id]);
console.log(`closed - ${ws.data.path} - ${JSON.stringify(ws.data.query)}`)
}
})
app.onError(error)
export default app