Files
klz-cables.com/scripts/download-missing-assets.js
2026-01-06 13:55:04 +01:00

153 lines
4.3 KiB
JavaScript

#!/usr/bin/env node
/**
* Script to download missing videos and PDFs
* Downloads videos referenced in processed data and PDFs linked in pages
*/
const fs = require('fs');
const path = require('path');
const https = require('https');
const http = require('http');
// Configuration
const MEDIA_DIR = path.join(__dirname, '..', 'public', 'media');
const PROCESSED_DIR = path.join(__dirname, '..', 'data', 'processed');
// Videos to download (from home pages)
const VIDEOS_TO_DOWNLOAD = [
{
url: 'https://klz-cables.com/wp-content/uploads/2025/02/header.mp4',
filename: 'header.mp4'
},
{
url: 'https://klz-cables.com/wp-content/uploads/2025/02/header.webm',
filename: 'header.webm'
}
];
// PDFs to download (from terms pages)
const PDFS_TO_DOWNLOAD = [
{
url: 'https://klz-cables.com/wp-content/uploads/2025/01/agbs.pdf',
filename: 'agbs.pdf'
}
];
// Create media directory if it doesn't exist
if (!fs.existsSync(MEDIA_DIR)) {
fs.mkdirSync(MEDIA_DIR, { recursive: true });
}
// Download file function
function downloadFile(url, filename) {
return new Promise((resolve, reject) => {
const filePath = path.join(MEDIA_DIR, filename);
// Check if file already exists
if (fs.existsSync(filePath)) {
console.log(`✅ Already exists: ${filename}`);
resolve(filePath);
return;
}
console.log(`📥 Downloading: ${filename} from ${url}`);
const protocol = url.startsWith('https') ? https : http;
const file = fs.createWriteStream(filePath);
protocol.get(url, (res) => {
if (res.statusCode === 200) {
res.pipe(file);
file.on('finish', () => {
console.log(`✅ Downloaded: ${filename}`);
resolve(filePath);
});
} else if (res.statusCode === 301 || res.statusCode === 302) {
// Handle redirects
if (res.headers.location) {
console.log(`🔄 Redirected to: ${res.headers.location}`);
downloadFile(res.headers.location, filename).then(resolve).catch(reject);
} else {
reject(new Error(`Redirect without location: ${res.statusCode}`));
}
} else {
reject(new Error(`Failed to download: HTTP ${res.statusCode}`));
}
}).on('error', (err) => {
fs.unlink(filePath, () => {});
reject(err);
});
});
}
// Main function
async function main() {
console.log('🔍 Downloading Missing Assets');
console.log('==============================');
console.log(`Output: ${MEDIA_DIR}`);
console.log('');
const assetMap = {};
const downloaded = [];
// Download videos
console.log('🎬 Videos:');
for (const video of VIDEOS_TO_DOWNLOAD) {
try {
await downloadFile(video.url, video.filename);
assetMap[video.url] = `/media/${video.filename}`;
downloaded.push(video.filename);
} catch (error) {
console.warn(`⚠️ Failed to download video ${video.filename}:`, error.message);
}
}
console.log('');
// Download PDFs
console.log('📄 PDFs:');
for (const pdf of PDFS_TO_DOWNLOAD) {
try {
await downloadFile(pdf.url, pdf.filename);
assetMap[pdf.url] = `/media/${pdf.filename}`;
downloaded.push(pdf.filename);
} catch (error) {
console.warn(`⚠️ Failed to download PDF ${pdf.filename}:`, error.message);
}
}
// Update asset-map.json with new entries
const assetMapPath = path.join(PROCESSED_DIR, 'asset-map.json');
if (fs.existsSync(assetMapPath)) {
const existingMap = JSON.parse(fs.readFileSync(assetMapPath, 'utf8'));
const updatedMap = { ...existingMap, ...assetMap };
fs.writeFileSync(assetMapPath, JSON.stringify(updatedMap, null, 2));
console.log(`\n✅ Updated asset-map.json with ${Object.keys(assetMap).length} new entries`);
}
console.log('\n🎉 Asset Download Complete!');
console.log('==============================');
console.log(`📥 Downloaded: ${downloaded.length} files`);
console.log(`📁 Directory: public/media/`);
console.log('');
console.log('Files downloaded:');
downloaded.forEach(file => {
console.log(` - ${file}`);
});
}
// Run if called directly
if (require.main === module) {
main().catch(error => {
console.error('\n❌ Script failed:', error.message);
process.exit(1);
});
}
module.exports = {
downloadFile,
main
};