ytsm/app/YtManagerApp/management/jobs/download_video.py

import logging
import os
import re
from string import Template
from threading import Lock

import youtube_dl

from YtManagerApp import scheduler
from YtManagerApp.models import Video

log = logging.getLogger('video_downloader')
log_youtube_dl = log.getChild('youtube_dl')

_lock = Lock()


def __get_valid_path(path):
    """
    Normalizes string, converts to lowercase, removes non-alpha characters,
    and converts spaces to hyphens.
    """
    import unicodedata
    value = unicodedata.normalize('NFKD', path).encode('ascii', 'ignore').decode('ascii')
    value = re.sub('[:"*]', '', value).strip()
    value = re.sub('[?<>|]', '#', value)
    return value


def __build_template_dict(video: Video):
    return {
        'channel': video.subscription.channel_name,
        'channel_id': video.subscription.channel_id,
        'playlist': video.subscription.name,
        'playlist_id': video.subscription.playlist_id,
        'playlist_index': "{:03d}".format(1 + video.playlist_index),
        'title': video.name,
        'id': video.video_id,
    }


def __build_youtube_dl_params(video: Video):

    sub = video.subscription
    user = sub.user

    # resolve path
    download_path = user.preferences['download_path']

    template_dict = __build_template_dict(video)
    output_pattern = Template(user.preferences['download_file_pattern']).safe_substitute(template_dict)

    output_path = os.path.join(download_path, output_pattern)
    output_path = os.path.normpath(output_path)

    youtube_dl_params = {
        'logger': log_youtube_dl,
        'format': user.preferences['download_format'],
        'outtmpl': output_path,
        'writethumbnail': True,
        'writedescription': True,
        'writesubtitles': user.preferences['download_subtitles'],
        'writeautomaticsub': user.preferences['download_autogenerated_subtitles'],
        'allsubtitles': user.preferences['download_subtitles_all'],
        'postprocessors': [
            {
                'key': 'FFmpegMetadata'
            },
        ]
    }

    sub_langs = user.preferences['download_subtitles_langs'].split(',')
    sub_langs = [i.strip() for i in sub_langs]
    if len(sub_langs) > 0:
        youtube_dl_params['subtitleslangs'] = sub_langs

    sub_format = user.preferences['download_subtitles_format']
    if len(sub_format) > 0:
        youtube_dl_params['subtitlesformat'] = sub_format

    return youtube_dl_params, output_path


def download_video(video: Video, attempt: int = 1):

    user = video.subscription.user

    log.info('Downloading video %d [%s %s]', video.id, video.video_id, video.name)

    # Issue: if multiple videos are downloaded at the same time, a race condition appears in the mkdirs() call that
    # youtube-dl makes, which causes it to fail with the error 'Cannot create folder - file already exists'.
    # For now, allow a single download instance.
    _lock.acquire()

    try:
        max_attempts = user.preferences['max_download_attempts']

        youtube_dl_params, output_path = __build_youtube_dl_params(video)
        with youtube_dl.YoutubeDL(youtube_dl_params) as yt:
            ret = yt.download(["https://www.youtube.com/watch?v=" + video.video_id])

        log.info('Download finished with code %d', ret)

        if ret == 0:
            video.downloaded_path = output_path
            video.save()
            log.info('Video %d [%s %s] downloaded successfully!', video.id, video.video_id, video.name)

        elif attempt <= max_attempts:
            log.warning('Re-enqueueing video (attempt %d/%d)', attempt, max_attempts)
            __schedule_download_video(video, attempt + 1)

        else:
            log.error('Multiple attempts to download video %d [%s %s] failed!', video.id, video.video_id, video.name)
            video.downloaded_path = ''
            video.save()

    finally:
        _lock.release()


def __schedule_download_video(video: Video, attempt=1):
    job = scheduler.scheduler.add_job(download_video, args=[video, attempt])
    log.info('Scheduled download video job video=(%s), attempt=%d, job=%s', video, attempt, job.id)


def schedule_download_video(video: Video):
    """
    Schedules a download video job to run immediately.
    :param video:
    :return:
    """
    __schedule_download_video(video)
Big refactor 2018-10-10 22:43:50 +00:00			`import logging`
Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`import os`
Implemented video management facilities. 2018-10-20 22:20:31 +00:00			`import re`
Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`from string import Template`
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`from threading import Lock`
Big refactor 2018-10-10 22:43:50 +00:00
Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`import youtube_dl`

			`from YtManagerApp import scheduler`
			`from YtManagerApp.models import Video`

Big refactor 2018-10-10 22:43:50 +00:00			`log = logging.getLogger('video_downloader')`
			`log_youtube_dl = log.getChild('youtube_dl')`

Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`_lock = Lock()`

Big refactor 2018-10-10 22:43:50 +00:00
Implemented video management facilities. 2018-10-20 22:20:31 +00:00			`def __get_valid_path(path):`
			`"""`
			`Normalizes string, converts to lowercase, removes non-alpha characters,`
			`and converts spaces to hyphens.`
			`"""`
			`import unicodedata`
			`value = unicodedata.normalize('NFKD', path).encode('ascii', 'ignore').decode('ascii')`
			`value = re.sub('[:"*]', '', value).strip()`
			`value = re.sub('[?<>\|]', '#', value)`
			`return value`


Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`def __build_template_dict(video: Video):`
			`return {`
Integrated pytaw library for youtube API. 2018-10-29 16:52:09 +00:00			`'channel': video.subscription.channel_name,`
			`'channel_id': video.subscription.channel_id,`
Big refactor 2018-10-10 22:43:50 +00:00			`'playlist': video.subscription.name,`
			`'playlist_id': video.subscription.playlist_id,`
			`'playlist_index': "{:03d}".format(1 + video.playlist_index),`
			`'title': video.name,`
			`'id': video.video_id,`
			`}`

Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00
			`def __build_youtube_dl_params(video: Video):`

			`sub = video.subscription`
			`user = sub.user`

			`# resolve path`
			`download_path = user.preferences['download_path']`

			`template_dict = __build_template_dict(video)`
			`output_pattern = Template(user.preferences['download_file_pattern']).safe_substitute(template_dict)`
Big refactor 2018-10-10 22:43:50 +00:00
			`output_path = os.path.join(download_path, output_pattern)`
			`output_path = os.path.normpath(output_path)`

			`youtube_dl_params = {`
			`'logger': log_youtube_dl,`
Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`'format': user.preferences['download_format'],`
Big refactor 2018-10-10 22:43:50 +00:00			`'outtmpl': output_path,`
			`'writethumbnail': True,`
			`'writedescription': True,`
Fixed user settings page. 2018-12-29 18:43:39 +00:00			`'writesubtitles': user.preferences['download_subtitles'],`
			`'writeautomaticsub': user.preferences['download_autogenerated_subtitles'],`
			`'allsubtitles': user.preferences['download_subtitles_all'],`
Big refactor 2018-10-10 22:43:50 +00:00			`'postprocessors': [`
			`{`
Implemented video management facilities. 2018-10-20 22:20:31 +00:00			`'key': 'FFmpegMetadata'`
Big refactor 2018-10-10 22:43:50 +00:00			`},`
			`]`
			`}`

Fixed user settings page. 2018-12-29 18:43:39 +00:00			`sub_langs = user.preferences['download_subtitles_langs'].split(',')`
Big refactor 2018-10-10 22:43:50 +00:00			`sub_langs = [i.strip() for i in sub_langs]`
			`if len(sub_langs) > 0:`
			`youtube_dl_params['subtitleslangs'] = sub_langs`

Fixed user settings page. 2018-12-29 18:43:39 +00:00			`sub_format = user.preferences['download_subtitles_format']`
Big refactor 2018-10-10 22:43:50 +00:00			`if len(sub_format) > 0:`
			`youtube_dl_params['subtitlesformat'] = sub_format`

			`return youtube_dl_params, output_path`


			`def download_video(video: Video, attempt: int = 1):`

Integrated django-dynamic-preferences library into project. Settings are now stored in the database, the ini file only contains a minimal number of settings. 2018-12-09 23:15:10 +00:00			`user = video.subscription.user`

Big refactor 2018-10-10 22:43:50 +00:00			`log.info('Downloading video %d [%s %s]', video.id, video.video_id, video.name)`

Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`# Issue: if multiple videos are downloaded at the same time, a race condition appears in the mkdirs() call that`
			`# youtube-dl makes, which causes it to fail with the error 'Cannot create folder - file already exists'.`
			`# For now, allow a single download instance.`
			`_lock.acquire()`

			`try:`
Fixed user settings page. 2018-12-29 18:43:39 +00:00			`max_attempts = user.preferences['max_download_attempts']`
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00
			`youtube_dl_params, output_path = __build_youtube_dl_params(video)`
			`with youtube_dl.YoutubeDL(youtube_dl_params) as yt:`
			`ret = yt.download(["https://www.youtube.com/watch?v=" + video.video_id])`
Big refactor 2018-10-10 22:43:50 +00:00
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`log.info('Download finished with code %d', ret)`
Big refactor 2018-10-10 22:43:50 +00:00
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`if ret == 0:`
			`video.downloaded_path = output_path`
			`video.save()`
			`log.info('Video %d [%s %s] downloaded successfully!', video.id, video.video_id, video.name)`
Big refactor 2018-10-10 22:43:50 +00:00
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`elif attempt <= max_attempts:`
			`log.warning('Re-enqueueing video (attempt %d/%d)', attempt, max_attempts)`
			`__schedule_download_video(video, attempt + 1)`
Big refactor 2018-10-10 22:43:50 +00:00
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`else:`
			`log.error('Multiple attempts to download video %d [%s %s] failed!', video.id, video.video_id, video.name)`
			`video.downloaded_path = ''`
			`video.save()`
Big refactor 2018-10-10 22:43:50 +00:00
Fixed problem caused by parallel downloads where ok.mkdirs would fail (when called by youtube-dl). 2018-11-02 00:50:16 +00:00			`finally:`
			`_lock.release()`
Big refactor 2018-10-10 22:43:50 +00:00

Integrated pytaw library for youtube API. 2018-10-29 16:52:09 +00:00			`def __schedule_download_video(video: Video, attempt=1):`
			`job = scheduler.scheduler.add_job(download_video, args=[video, attempt])`
			`log.info('Scheduled download video job video=(%s), attempt=%d, job=%s', video, attempt, job.id)`


Big refactor 2018-10-10 22:43:50 +00:00			`def schedule_download_video(video: Video):`
			`"""`
			`Schedules a download video job to run immediately.`
			`:param video:`
			`:return:`
			`"""`
Integrated pytaw library for youtube API. 2018-10-29 16:52:09 +00:00			`__schedule_download_video(video)`