Files
aidio-description/src/cli/index.ts

91 lines
3.2 KiB
TypeScript
Raw Normal View History

2026-05-13 02:17:07 +02:00
import 'dotenv/config';
import { getDefaultConfig } from '../config/config';
import { createStats } from '../config/stats';
import { VisionProviderFactory } from '../providers/vision/visionProviderFactory';
import { TTSProviderFactory } from '../providers/tts/ttsProviderFactory';
import { generateAudioDescription } from '../utils/processor';
import { estimateCost } from '../utils/costEstimator';
import { loadConfigFromFile, saveConfigToFile } from '../utils/configUtils';
import { parseCommandLineArgs } from './args';
import { Config } from '../config/config';
async function main(): Promise<void> {
const argv = parseCommandLineArgs();
let config: Config = getDefaultConfig();
if (argv.config) {
const fileConfig = loadConfigFromFile(argv.config);
config = { ...config, ...fileConfig };
}
const argvObj = argv as unknown as Record<string, unknown>;
Object.keys(argvObj).forEach(key => {
if (key !== '_' && key !== '$0' && key !== 'config' && key !== 'saveConfig' &&
key !== 'estimate' && key !== 'help' && key !== 'version' &&
argvObj[key] !== undefined) {
(config as any)[key] = argvObj[key];
}
});
if (argv.visionModel) {
if (!config.visionProviders[config.visionProvider]) {
config.visionProviders[config.visionProvider] = { model: '' };
}
config.visionProviders[config.visionProvider].model = argv.visionModel;
}
if (argv.ttsModel) {
if (!config.ttsProviders[config.ttsProvider]) {
config.ttsProviders[config.ttsProvider] = { model: '' };
}
config.ttsProviders[config.ttsProvider].model = argv.ttsModel;
}
if (argv.ttsVoice) {
if (!config.ttsProviders[config.ttsProvider]) {
config.ttsProviders[config.ttsProvider] = { model: '', voice: '' };
}
config.ttsProviders[config.ttsProvider].voice = argv.ttsVoice;
}
if (argv.saveConfig) {
saveConfigToFile(argv.saveConfig, config);
}
if (argv._.length < 1) {
console.error('Error: No video file specified');
console.log('Usage: node script.js <video_file_path> [options]');
console.log('Use --help for more information');
process.exit(1);
}
const videoFilePath = String(argv._[0]);
if (argv.estimate) {
try {
const costBreakdown = await estimateCost(videoFilePath, config);
console.log('\n=== COST ESTIMATION ===');
console.log(JSON.stringify(costBreakdown, null, 2));
console.log(`\nEstimated total cost: ${costBreakdown.apiCosts.total}`);
console.log(`Estimated processing time: ${costBreakdown.estimates.estimatedProcessingTimeMinutes.toFixed(1)} minutes`);
console.log('Note: Actual costs may vary based on image complexity and actual response lengths.');
} catch (err) {
console.error('Error estimating costs:', err);
}
} else {
try {
const stats = createStats();
const visionProvider = VisionProviderFactory.getProvider(config);
const ttsProvider = TTSProviderFactory.getProvider(config);
await generateAudioDescription(videoFilePath, visionProvider, ttsProvider, config, stats);
} catch (err) {
console.error('Error generating audio description:', err);
}
}
}
if (require.main === module) {
main().catch(err => console.error('Unhandled error:', err));
}