| 1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
 | import { green, red } from 'colors';
import { ExifImage } from 'exif';
import * as exifr from 'exifr';
import { File } from 'formidable';
import { createReadStream, createWriteStream, existsSync, readFileSync, rename, unlinkSync, writeFile } from 'fs';
import * as path from 'path';
import { basename } from 'path';
import * as sharp from 'sharp';
import { Stream } from 'stream';
import { filesDirectory, publicDirectory } from '.';
import { Opt } from '../fields/Doc';
import { ParsedPDF } from '../server/PdfTypes';
import { Utils } from '../Utils';
import { createIfNotExists } from './ActionUtilities';
import { clientPathToFile, Directory, pathToDirectory, serverPathToFile } from './ApiManagers/UploadManager';
import { resolvedServerUrl } from './server_Initialization';
import { AcceptableMedia, Upload } from './SharedMediaTypes';
import request = require('request-promise');
import formidable = require('formidable');
const spawn = require('child_process').spawn;
const { exec } = require('child_process');
const parse = require('pdf-parse');
const ffmpeg = require('fluent-ffmpeg');
const fs = require('fs');
const requestImageSize = require('../client/util/request-image-size');
const md5File = require('md5-file');
/**
 * Filename suffixes that distinguish the differently sized copies of one image.
 * InjectSize inserts the suffix between a file's stem and its extension.
 */
export enum SizeSuffix {
    Small = '_s',
    Medium = '_m',
    Large = '_l',
    // used for the copy that is written without a resizer
    Original = '_o',
    // empty suffix: InjectSize leaves the stem unchanged
    None = '',
}
/**
 * Inserts a size suffix between a filename's stem and its extension.
 * The extension is emitted in lower case, e.g. ('photo.JPG', '_s') => 'photo_s.jpg'.
 *
 * @param filename the file name (or path) to decorate
 * @param size the suffix to insert before the extension
 * @returns the decorated file name
 */
export function InjectSize(filename: string, size: SizeSuffix) {
    const ext = path.extname(filename).toLowerCase();
    const stem = filename.slice(0, filename.length - ext.length);
    return `${stem}${size}${ext}`;
}
/**
 * Builds the pattern that recognizes a path inside this server's public directory
 * (either slash style). Capture group 1 is the portion after `public/`.
 * A fresh RegExp is returned on every call.
 */
function isLocal() {
    const localPublicPath = /Dash-Web[0-9]*[\\\/]src[\\\/]server[\\\/]public[\\\/](.*)/;
    return localPublicPath;
}
export namespace DashUploadUtils {
    /** Describes one resized rendition of an image. */
    export interface Size {
        // width passed to the resizer for this rendition
        width: number;
        // filename suffix identifying this rendition
        suffix: SizeSuffix;
    }
    /** The resized renditions produced for every uploaded image (in addition to the original). */
    export const Sizes: { [size: string]: Size } = {
        SMALL: { width: 100, suffix: SizeSuffix.Small },
        MEDIUM: { width: 400, suffix: SizeSuffix.Medium },
        LARGE: { width: 900, suffix: SizeSuffix.Large },
    };
    /**
     * Reports whether the (case-insensitive) extension of the given url or path
     * is one of the accepted image formats.
     */
    export function validateExtension(url: string) {
        const extension = path.extname(url).toLowerCase();
        return AcceptableMedia.imageFormats.includes(extension);
    }
    // Names of the response headers that InspectImage reads to obtain an image's byte size and MIME type.
    const size = 'content-length';
    const type = 'content-type';
    // Accepted formats per media category; `upload` checks the incoming file's format against these lists.
    const { imageFormats, videoFormats, applicationFormats, audioFormats } = AcceptableMedia; //TODO:glr
    /**
     * Concatenates the given video segments, in order, into a single mp4 in the videos
     * directory using ffmpeg's concat demuxer (stream copy, no re-encoding).
     * On success the segment files are deleted from disk.
     *
     * @param filePaths absolute paths of the segments, in playback order
     * @returns the client/server access paths of the concatenated video
     * @throws if no segments are given, the list file cannot be written, or ffmpeg fails
     */
    export async function concatVideos(filePaths: string[]): Promise<Upload.AccessPathInfo> {
        if (!filePaths.length) {
            throw new Error('concatVideos requires at least one video segment');
        }
        // a unique list file per call, so that overlapping requests cannot overwrite each other's input list
        const inputListName = `concat-${Utils.GenerateGuid()}.txt`;
        const textFilePath = path.join(filesDirectory, inputListName);
        // one "file '<path>'" directive per segment; a single quote inside a quoted path must be written as '\''
        const filePathsText = filePaths.map(filePath => `file '${filePath.replace(/'/g, "'\\''")}'`).join('\n');
        // write the text file to the file system
        await new Promise<void>((res, reject) =>
            writeFile(textFilePath, filePathsText, err => {
                if (err) {
                    console.log(err);
                    reject(err);
                } else res();
            })
        );
        // make a unique output file name
        const outputFileName = `output-${Utils.GenerateGuid()}.mp4`;
        // create the output file path in the videos directory
        const outputFilePath = path.join(pathToDirectory(Directory.videos), outputFileName);
        try {
            // concatenate the videos; listeners are registered before save() starts the process
            await new Promise<void>((resolve, reject) => {
                ffmpeg()
                    .input(textFilePath)
                    .inputOptions(['-f concat', '-safe 0'])
                    .outputOptions('-c copy')
                    .on('error', (err: any) => {
                        console.log(err);
                        reject(err);
                    })
                    .on('end', () => resolve())
                    .save(outputFilePath);
            });
        } finally {
            // the list file is only scratch data: remove it whether or not ffmpeg succeeded
            existsSync(textFilePath) && unlinkSync(textFilePath);
        }
        // delete the old segment videos from the server (only reached when concatenation succeeded)
        filePaths.forEach(filePath => unlinkSync(filePath));
        // return the path(s) to the output file
        return {
            accessPaths: getAccessPaths(Directory.videos, outputFileName),
        };
    }
    /**
     * Builds an upload response for a file that is already stored on the server,
     * so nothing has to be moved or re-processed.
     *
     * @param name display name reported for the file
     * @param pat path of the stored file; only its basename is used
     * @param directory media directory the stored file lives in
     * @param type MIME type to report ('' when omitted)
     * @param duration optional duration to report
     * @param rawText optional extracted text to report
     */
    function resolveExistingFile(name: string, pat: string, directory: Directory, type?: string, duration?: number, rawText?: string) {
        const storedName = path.basename(pat);
        const data = { size: 0, path: storedName, name, type: type ?? '' };
        const toJSON = () => ({ ...data, filename: data.path.replace(/.*\//, ''), mtime: duration?.toString(), mime: '', toJson: () => undefined as any });
        const source = { ...data, toJSON };
        const agnostic = getAccessPaths(directory, data.path);
        return {
            source,
            result: { accessPaths: { agnostic }, rawText, duration },
        };
    }
    // Latest known status message of each YouTube archive request, keyed by video id.
    const uploadProgress = new Map<string, string>();
    /**
     * Returns the most recent progress message recorded for the given video id,
     * or 'failed' when nothing has been recorded for it.
     */
    export function QueryYoutubeProgress(videoId: string) {
        const latest = uploadProgress.get(videoId);
        return latest ?? 'failed';
    }
    /**
     * Archives a YouTube video as an mp4 in the videos directory by invoking `yt-dlp`,
     * recording progress messages in `uploadProgress` along the way.
     * If the video was archived before, only its duration is queried again.
     *
     * The returned promise always resolves; failures are reported through a
     * `result` of the form `{ name: 'failed youtube query', message }`.
     *
     * @param videoId the YouTube video id (letters, digits, '_' and '-' only)
     * @returns the upload response, whose result carries the access paths and the duration in seconds
     */
    export function uploadYoutube(videoId: string): Promise<Upload.FileResponse> {
        // execFile passes arguments as an array (no shell), so neither the id nor paths are shell-interpreted
        const { execFile } = require('child_process');
        return new Promise<Upload.FileResponse<Upload.FileInformation>>(res => {
            console.log('Uploading YouTube video: ' + videoId);
            const name = videoId;
            // a leading '-' would make the file name look like a command line option
            const path = name.replace(/^-/, '__') + '.mp4';
            const url = `https://www.youtube.com/watch?v=${videoId}`;
            const fail = (message: string) =>
                res({
                    source: {
                        size: 0,
                        path,
                        name,
                        type: '',
                        toJSON: () => ({ name, path }),
                    },
                    result: { name: 'failed youtube query', message },
                });
            // the id becomes part of a file name, so reject anything that could escape the target directory
            if (!/^[\w-]+$/.test(videoId)) {
                fail('Could not archive video.  Invalid video id.');
                return;
            }
            // converts yt-dlp's "[[h:]m:]s" duration output into seconds
            const toSeconds = (stdout: string) => {
                const [seconds = 0, minutes = 0, hours = 0] = stdout.trim().split(':').reverse().map(Number);
                return hours * 3600 + minutes * 60 + seconds;
            };
            const queryDuration = (target: string, done: (duration: number) => void) =>
                execFile('yt-dlp', ['-o', target, url, '--get-duration'], (error: any, stdout: any) => {
                    error && console.log(error);
                    done(toSeconds(String(stdout ?? '')));
                });
            const finalPath = serverPathToFile(Directory.videos, path);
            if (existsSync(finalPath)) {
                uploadProgress.set(videoId, 'computing duration');
                queryDuration(finalPath, duration => res(resolveExistingFile(name, finalPath, Directory.videos, 'video/mp4', duration, undefined)));
            } else {
                uploadProgress.set(videoId, 'starting download');
                const ytdlp = spawn(`yt-dlp`, ['-o', path, url, '--max-filesize', '100M', '-f', 'mp4']);
                // once yt-dlp reports that it is aborting, keep that message instead of later output
                ytdlp.stdout.on('data', (data: any) => !uploadProgress.get(videoId)?.includes('Aborting.') && uploadProgress.set(videoId, data.toString()));
                let errors = '';
                ytdlp.stderr.on('data', (data: any) => (errors = data.toString()));
                // emitted when the process could not be started at all (e.g. yt-dlp is not installed)
                ytdlp.on('error', (err: any) => fail(`Could not archive video.  ${err?.message ?? err}`));
                ytdlp.on('exit', function (code: any) {
                    // a null code means the process was killed by a signal, which is also a failure
                    if (code !== 0 || uploadProgress.get(videoId)?.includes('Aborting.')) {
                        fail(`Could not archive video.  ${code !== 0 ? errors : uploadProgress.get(videoId)}`);
                    } else {
                        uploadProgress.set(videoId, 'computing duration');
                        queryDuration(path, duration => {
                            const data = { size: 0, path, name, type: 'video/mp4' };
                            const file = { ...data, toJSON: () => ({ ...data, filename: data.path.replace(/.*\//, ''), mtime: duration.toString(), mime: '', toJson: () => undefined as any }) };
                            // report the duration in the result, as the already-archived branch does
                            res(MoveParsedFile(file, Directory.videos, undefined, undefined, duration));
                        });
                    }
                });
            }
        });
    }
    /**
     * Routes an uploaded file to the handler for its media category, based on its MIME type.
     * Files that cannot be handled are deleted from their temporary location and reported
     * through the `result` of the response rather than by throwing.
     *
     * @param file the uploaded file
     * @returns the upload response for the file
     */
    export async function upload(file: File): Promise<Upload.FileResponse> {
        const { type, path, name } = file;
        const types = type?.split('/') ?? [];
        const category = types[0];
        let format = `.${types[1]}`;
        console.log(green(`Processing upload of file (${name}) and format (${format}) with upload type (${type}) in category (${category}).`));
        // discards the temporary file and builds the response for an unsupported format
        const unsupported = (kind: string, target: string): Upload.FileResponse => {
            fs.unlink(path, () => {});
            return { source: file, result: { name: `Unsupported ${kind} format`, message: `Could not upload unsupported file (${name}). Please convert to an ${target}` } };
        };
        switch (category) {
            case 'image':
                if (imageFormats.includes(format)) {
                    const result = await UploadImage(path, basename(path));
                    return { source: file, result };
                }
                return unsupported('image', '.jpg');
            case 'video':
                if (format.includes('x-matroska')) {
                    console.log('case video');
                    const mp4Path = file.path.replace('.mkv', '.mp4');
                    // resolve on failure too, so that a broken file cannot leave the request hanging
                    const converted = await new Promise<boolean>(res =>
                        ffmpeg(file.path)
                            .videoCodec('copy') // this will copy the data instead of reencode it
                            .on('end', () => res(true))
                            .on('error', (err: any) => {
                                console.log(err);
                                res(false);
                            })
                            .save(mp4Path)
                    );
                    if (!converted) {
                        return unsupported('video', '.mp4');
                    }
                    // the original container is no longer needed once the mp4 copy exists
                    mp4Path !== path && fs.unlink(path, () => {});
                    file.path = mp4Path;
                    format = '.mp4';
                }
                if (format.includes('quicktime')) {
                    const isHevc = await new Promise<boolean>(res =>
                        ffmpeg.ffprobe(file.path, (err: any, metadata: any) => {
                            // when probing fails, metadata is undefined: log it and treat the codec as not hevc
                            err && console.log(err);
                            res(!!metadata?.streams?.some((stream: any) => stream.codec_name === 'hevc'));
                        })
                    );
                    if (isHevc) {
                        // bcz: instead of aborting, we could convert the file using the code below to an mp4.  Problem is that this takes a long time and will clog up the server.
                        // await new Promise(res =>
                        //     ffmpeg(file.path)
                        //         .videoCodec('libx264')
                        //         .audioCodec('mp2')
                        //         .save(file.path.replace('.MOV', '.mp4').replace('.mov', '.mp4'))
                        //         .on('end', res)
                        // );
                        // file.path = file.path.replace('.mov', '.mp4').replace('.MOV', '.mp4');
                        // format = '.mp4';
                        return unsupported('video', '.mp4');
                    }
                }
                if (videoFormats.includes(format)) {
                    return MoveParsedFile(file, Directory.videos);
                }
                return unsupported('video', '.mp4');
            case 'application':
                if (applicationFormats.includes(format)) {
                    return UploadPdf(file);
                }
            // NOTE(review): other application types fall through to the audio branch, as in the
            // original code; confirm whether that is intentional (e.g. for application/ogg).
            // falls through
            case 'audio': {
                // drop MIME parameters such as ";codecs=..."
                const components = format.split(';');
                if (components.length > 1) {
                    format = components[0];
                }
                if (audioFormats.includes(format)) {
                    return UploadAudio(file, format);
                }
                return unsupported('audio', '.mp3');
            }
            case 'text':
                if (types[1] === 'csv') {
                    return UploadCsv(file);
                }
                break;
        }
        console.log(red(`Ignoring unsupported file (${name}) with upload type (${type}).`));
        fs.unlink(path, () => {});
        return { source: file, result: new Error(`Could not upload unsupported file (${name}) with upload type (${type}).`) };
    }
    /**
     * Stores an uploaded PDF under a name derived from the MD5 hash of its contents, and
     * stores its extracted text next to it in the text directory. If both already exist,
     * the stored copies are reused and the uploaded temporary file is discarded.
     *
     * @param file the uploaded PDF
     * @returns the upload response; parse failures are reported through its `result`
     * @throws if the extracted text cannot be written to disk
     */
    async function UploadPdf(file: File): Promise<Upload.FileResponse> {
        const fileKey = (await md5File(file.path)) + '.pdf';
        const textFilename = `${fileKey.substring(0, fileKey.length - 4)}.txt`;
        if (fExists(fileKey, Directory.pdfs) && fExists(textFilename, Directory.text)) {
            try {
                // read in one piece: decoding chunk by chunk can split a multi-byte character
                const rawText: string = await fs.promises.readFile(serverPathToFile(Directory.text, textFilename), 'utf8');
                // the upload duplicates stored content, so its temporary file is no longer needed
                if (path.resolve(file.path) !== path.resolve(serverPathToFile(Directory.pdfs, fileKey))) {
                    fs.unlink(file.path, () => {});
                }
                return resolveExistingFile(file.name, fileKey, Directory.pdfs, file.type, undefined, rawText);
            } catch (e) {
                // the cached text could not be read: fall back to parsing the upload again
                console.log(e);
            }
        }
        const dataBuffer = readFileSync(file.path);
        const result: ParsedPDF | any = await parse(dataBuffer).catch((e: any) => e ?? new Error('unknown error'));
        const failed = !result || result instanceof Error || result.code || typeof result.text !== 'string';
        if (!failed) {
            // writeFile opens, writes and closes the file, so no file handle stays open
            await new Promise<void>((resolve, reject) => {
                writeFile(serverPathToFile(Directory.text, textFilename), result.text, error => (error ? reject(error) : resolve()));
            });
            return MoveParsedFile(file, Directory.pdfs, undefined, result.text, undefined, fileKey);
        }
        fs.unlink(file.path, () => {});
        return { source: file, result: { name: 'faile pdf pupload', message: `Could not upload (${file.name}).${result?.message}` } };
    }
    /**
     * Moves an uploaded csv file into the csv directory and returns its entire
     * contents (read as UTF-8) as the raw text of the response.
     */
    async function UploadCsv(file: File) {
        // the whole file is read as one string; it is not split or parsed here
        const contents = readFileSync(file.path, 'utf8');
        return MoveParsedFile(file, Directory.csv, undefined, contents);
    }
    // Formats whose extension is appended to the stored file name when the file is moved.
    const manualSuffixes = ['.webm'];
    /**
     * Moves an uploaded audio file into the audio directory, appending the format
     * as a suffix to its name when the format is listed in `manualSuffixes`.
     */
    async function UploadAudio(file: File, format: string) {
        let suffix: string | undefined = undefined;
        if (manualSuffixes.includes(format)) {
            suffix = format;
        }
        return MoveParsedFile(file, Directory.audio, suffix);
    }
    /**
     * Inspects the image identified by @param source and, if inspection succeeds,
     * uploads it (together with its resized copies) to the images directory.
     *
     * @param {string} source either the absolute path of an already uploaded image or
     * the url of a remote image
     * @param {string} filename what to call the stored image. When omitted, the filename
     * determined during inspection is used and, failing that, a generated name of the
     * form {@param prefix}upload_{GUID}
     * @param {string} prefix prepended to the generated image name in the
     * event that no filename is available
     *
     * @returns {ImageUploadInformation | Error} the information gathered during the upload
     * (access paths of all written images plus the inspection results), or an object
     * carrying the name and message of the error that made inspection fail
     */
    export const UploadImage = async (source: string, filename?: string, prefix: string = ''): Promise<Upload.ImageInformation | Error> => {
        const inspected = await InspectImage(source);
        if (!(inspected instanceof Error)) {
            return UploadInspectedImage(inspected, filename || inspected.filename, prefix);
        }
        const { name, message } = inspected;
        return { name, message };
    };
    /**
     * Verifies that the public and files directories exist (terminating the process with a
     * message when one of them is missing) and then creates, under the files directory,
     * one sub-directory per key of `Directory` that does not exist yet.
     */
    export async function buildFileDirectories() {
        for (const required of [publicDirectory, filesDirectory]) {
            if (existsSync(required)) {
                continue;
            }
            console.error('\nPlease ensure that the following directory exists...\n');
            console.log(required);
            process.exit(0);
        }
        const subdirectories = Object.keys(Directory);
        return Promise.all(subdirectories.map(sub => createIfNotExists(`${filesDirectory}/${sub}`)));
    }
    /** Dimensions and type of an image. */
    export interface RequestedImageSize {
        width: number;
        height: number;
        type: string;
    }
    /** Pairs a size suffix with the transform that produces the image copy carrying that suffix. */
    export interface ImageResizer {
        // when absent, the image data is written out without passing through a resizer
        resizer?: sharp.Sharp;
        // suffix injected into the name of the file that is written
        suffix: SizeSuffix;
    }
    /**
     * Based on the url's classification as local or remote, gleans
     * as much information as possible about the specified image:
     * its exif data, byte size, content type and native dimensions.
     *
     * @param source is the path or url of the image in question, or a base64 encoded
     * `data:image/...` uri (which is first written out to the images directory)
     * @returns the inspection results, or the Error that prevented the image from being
     * written, requested or measured
     */
    export const InspectImage = async (source: string): Promise<Upload.InspectionResults | Error> => {
        let filename: string | undefined;
        /**
         * Edge case handling: an image dropped onto the canvas may be represented by a base64
         * encoded data uri rather than a proper file. We manually write it out to the server and
         * then carry on as if it had been put there by the Formidable form / file parser.
         */
        const rawMatches = /^data:image\/([a-z]+);base64,(.*)/.exec(source);
        if (rawMatches !== null) {
            const [ext, data] = rawMatches.slice(1, 3);
            const resolved = (filename = `upload_${Utils.GenerateGuid()}.${ext}`);
            const error = await new Promise<Error | null>(resolve => {
                writeFile(serverPathToFile(Directory.images, resolved), data, 'base64', resolve);
            });
            if (error !== null) {
                return error;
            }
            source = `${resolvedServerUrl}${clientPathToFile(Directory.images, resolved)}`;
        }
        /**
         * At this point, we want to take whatever url we have and make sure it's requestable.
         * Anything that's hosted by some other website already is, but if the url is a local file url
         * (locates the file on this server machine), we have to resolve the client side url by cutting out the
         * basename subtree (i.e. /images/<some_guid>.<ext>) and putting it on the end of the server's url.
         *
         * This can always be localhost, regardless of whether this is on the server or not, since we (the server, not the client)
         * will be the ones making the request, and from the perspective of dash-release or dash-web, localhost:<port> refers to the same thing
         * as the full dash-release.eastus.cloudapp.azure.com:<port>.
         */
        const matches = isLocal().exec(source);
        const resolvedUrl = matches === null ? source : `${resolvedServerUrl}/${matches[1].split('\\').join('/')}`;
        try {
            // not all image files carry exif data; parseExifData reports why when none can be read
            const exifData = await parseExifData(resolvedUrl);
            // Use the request library to parse out file level image information in the headers
            const { headers } = await new Promise<any>((resolve, reject) => {
                return request.head(resolvedUrl, (error, res) => (error ? reject(error) : resolve(res)));
            });
            // Compute the native width and height of the image with an npm module
            const { width: nativeWidth, height: nativeHeight } = await requestImageSize(resolvedUrl);
            // Bundle up the information into an object
            return {
                source,
                contentSize: parseInt(headers[size], 10),
                contentType: headers[type],
                nativeWidth,
                nativeHeight,
                filename,
                exifData,
                requestable: resolvedUrl,
            };
        } catch (e: any) {
            // any failed request is reported to the caller as an Error value instead of an exception
            console.log(e);
            return e instanceof Error ? e : new Error(String(e));
        }
    };
    /**
     * A thin wrapper around rename that moves a file out of its current location and into
     * one of the media directories. The caller only names the target directory; the
     * actual target path is resolved here. A failed rename does not reject: the error is
     * delivered as the `result` of the response.
     * @param file The file to move
     * @param destination One of the specific media asset directories into which to move it
     * @param suffix Appended to the file's name in the new location, if provided
     * @param text Reported as the raw text of the response
     * @param duration Reported as the duration of the response
     * @param targetName Name to give the moved file; defaults to the basename of its current path
     */
    export async function MoveParsedFile(file: formidable.File, destination: Directory, suffix: string | undefined = undefined, text?: string, duration?: number, targetName?: string): Promise<Upload.FileResponse> {
        const sourcePath = file.path;
        const baseName = targetName ?? path.basename(sourcePath);
        const name = suffix ? baseName + suffix : baseName;
        const destinationPath = serverPathToFile(destination, name);
        return new Promise(resolve =>
            rename(sourcePath, destinationPath, error => {
                if (error) {
                    resolve({ source: file, result: error });
                    return;
                }
                const agnostic = getAccessPaths(destination, name);
                resolve({
                    source: file,
                    result: {
                        accessPaths: { agnostic },
                        rawText: text,
                        duration,
                    },
                });
            })
        );
    }
    /** Reports whether a file with the given name exists in the given media directory. */
    export function fExists(name: string, destination: Directory) {
        return existsSync(serverPathToFile(destination, name));
    }
    /** Returns both the client-side and the server-side path of a file in the given media directory. */
    export function getAccessPaths(directory: Directory, fileName: string) {
        const client = clientPathToFile(directory, fileName);
        const server = serverPathToFile(directory, fileName);
        return { client, server };
    }
    /**
     * Writes an already inspected image, plus its resized copies, into the images directory.
     *
     * @param metadata the results of inspecting the image
     * @param filename name for the stored image; when omitted, `{prefix}upload_{GUID}.{subtype}`
     * is generated from the image's content type
     * @param prefix prepended to a generated name
     * @param cleanUp when true, a source located in the server's public directory is deleted afterwards
     * @returns the inspection results extended with the access paths of every written file
     */
    export const UploadInspectedImage = async (metadata: Upload.InspectionResults, filename?: string, prefix = '', cleanUp = true): Promise<Upload.ImageInformation> => {
        const { requestable, source } = metadata;
        const resolved = filename || `${prefix}upload_${Utils.GenerateGuid()}.${metadata.contentType.split('/')[1].toLowerCase()}`;
        const information: Upload.ImageInformation = {
            accessPaths: {
                agnostic: getAccessPaths(Directory.images, resolved),
            },
            ...metadata,
        };
        const writtenFiles = await outputResizedImages(() => request(requestable), resolved, pathToDirectory(Directory.images));
        Object.keys(writtenFiles).forEach(suffix => {
            information.accessPaths[suffix] = getAccessPaths(Directory.images, writtenFiles[suffix]);
        });
        if (cleanUp && isLocal().test(source)) {
            unlinkSync(source);
        }
        return information;
    };
    /**
     * Recursively walks an object and replaces, in place, every Buffer and every array
     * whose first element is a number with its string representation.
     * `null` values are left untouched.
     *
     * @param layer the object to convert in place
     */
    const bufferConverterRec = (layer: any) => {
        for (const key of Object.keys(layer)) {
            const val: any = layer[key];
            if (val instanceof Buffer) {
                layer[key] = val.toString();
            } else if (Array.isArray(val) && typeof val[0] === 'number') {
                layer[key] = Buffer.from(val).toString();
            } else if (val !== null && typeof val === 'object') {
                // typeof null is 'object', so null has to be excluded before recursing
                bufferConverterRec(val);
            }
        }
    };
    /**
     * Downloads the image at the given url and extracts its exif data.
     * ExifImage is used to detect whether exif data can be read at all; when it reports
     * an error, that error's code is returned and no data. Otherwise the data parsed by
     * exifr is returned.
     *
     * @param source requestable url of the image
     * @returns `{ data, error }`, where exactly one of the two is meaningful
     */
    const parseExifData = async (source: string) => {
        // encoding: null makes the request library deliver the body as raw bytes
        const image = await request.get(source, { encoding: null });
        const { error } = await new Promise<{ data: any; error: any }>(resolve => {
            new ExifImage({ image }, (failure, data) => {
                const reason: Opt<string> = failure ? (failure as any).code : undefined;
                resolve({ data, error: reason });
            });
        });
        //data && bufferConverterRec(data);
        if (error) {
            return { data: undefined, error };
        }
        return { data: await exifr.parse(image), error };
    };
    // Extension lists per image family; `resizers` uses them to pick the output encoder.
    const { pngs, jpgs, webps, tiffs } = AcceptableMedia;
    // Options handed to sharp's png encoder when resizing png images.
    const pngOptions = {
        compressionLevel: 9,
        adaptiveFiltering: true,
        force: true,
    };
    /**
     * Writes one copy of an image per entry of `resizers` (the original plus the resized
     * renditions) into the output directory, one after the other. Each copy gets its own
     * stream from the provider, and its file name is the output name with the size suffix injected.
     *
     * @param streamProvider produces a fresh readable stream of the image data on every call
     * @param outputFileName base name for the written files
     * @param outputDirectory directory to write the files into
     * @returns a map from size suffix to the name of the file written for it
     * @throws if the provider fails, or if reading, resizing or writing a copy fails
     */
    export async function outputResizedImages(streamProvider: () => Stream | Promise<Stream>, outputFileName: string, outputDirectory: string) {
        const writtenFiles: { [suffix: string]: string } = {};
        for (const { resizer, suffix } of resizers(path.extname(outputFileName))) {
            const outputPath = path.resolve(outputDirectory, (writtenFiles[suffix] = InjectSize(outputFileName, suffix)));
            // Obtained outside of the promise executor so that a failing provider rejects instead of hanging.
            // Only native promises are awaited: a provider may return a stream that is also thenable.
            const source = streamProvider();
            const input: Stream = source instanceof Promise ? await source : source;
            await new Promise<void>((resolve, reject) => {
                const sink = createWriteStream(outputPath);
                const fail = (error: any) => {
                    sink.destroy();
                    reject(error);
                };
                // pipe() does not forward errors, so every stage needs its own handler
                input.on('error', fail);
                let readStream: Stream = input;
                if (resizer) {
                    readStream = input.pipe(resizer.withMetadata()).on('error', fail);
                }
                readStream.pipe(sink).on('close', resolve).on('error', reject);
            });
        }
        return writtenFiles;
    }
    /**
     * Lists the copies to write for an image with the given extension: first the original
     * (no resizer), then one entry per configured size. Each sized entry resizes to the
     * configured width without enlarging and encodes to match the extension; gifs that
     * match none of the known families get no resizer at all.
     *
     * @param ext the extension of the output file, including the leading dot
     */
    function resizers(ext: string): DashUploadUtils.ImageResizer[] {
        const sized = Object.values(DashUploadUtils.Sizes).map(({ suffix, width }) => {
            const base = sharp().resize(width, undefined, { withoutEnlargement: true });
            let resizer: sharp.Sharp | undefined;
            if (pngs.includes(ext)) {
                resizer = base.png(pngOptions);
            } else if (jpgs.includes(ext)) {
                resizer = base.jpeg();
            } else if (webps.includes(ext)) {
                resizer = base.webp();
            } else if (tiffs.includes(ext)) {
                resizer = base.tiff();
            } else if (ext === '.gif') {
                resizer = undefined;
            } else {
                // unknown extension: resize only, without forcing an output format
                resizer = base;
            }
            return { resizer, suffix };
        });
        return [{ suffix: SizeSuffix.Original }, ...sized];
    }
}
 |