edx-platform/cms/djangoapps/contentstore/video_storage_handlers.py

"""
Views related to the video upload feature
"""


import codecs
import csv
import io
import json
import logging
import os
import requests
import shutil
import pathlib
import zipfile
import boto3

from contextlib import closing
from datetime import datetime, timedelta
from uuid import uuid4
from django.conf import settings
from django.contrib.staticfiles.storage import staticfiles_storage
from django.http import FileResponse, HttpResponseNotFound, StreamingHttpResponse
from django.shortcuts import redirect
from django.utils.translation import gettext as _
from django.utils.translation import gettext_noop
from edx_toggles.toggles import WaffleSwitch
from edxval.api import (
    SortDirection,
    VideoSortField,
    create_or_update_transcript_preferences,
    create_video,
    get_3rd_party_transcription_plans,
    get_available_transcript_languages,
    get_video_transcript_url,
    get_transcript_preferences,
    get_videos_for_course,
    remove_transcript_preferences,
    remove_video_for_course,
    update_video_image,
    update_video_status
)
from fs.osfs import OSFS
from opaque_keys import InvalidKeyError
from opaque_keys.edx.keys import CourseKey
from path import Path as path
from pytz import UTC
from rest_framework import status as rest_status
from rest_framework.response import Response
from tempfile import NamedTemporaryFile, mkdtemp
from wsgiref.util import FileWrapper

from common.djangoapps.util.json_request import JsonResponse
from openedx.core.djangoapps.video_config.models import VideoTranscriptEnabledFlag
from openedx.core.djangoapps.video_config.toggles import PUBLIC_VIDEO_SHARE
from openedx.core.djangoapps.video_pipeline.config.waffle import (
    DEPRECATE_YOUTUBE,
    ENABLE_DEVSTACK_VIDEO_UPLOADS,
)
from openedx.core.djangoapps.waffle_utils import CourseWaffleFlag
from xmodule.modulestore.django import modulestore  # lint-amnesty, pylint: disable=wrong-import-order

from .models import VideoUploadConfig
from .toggles import use_mock_video_uploads
from .utils import get_video_uploads_url
from .video_utils import validate_video_image
from .views.course import get_course_and_check_access

LOGGER = logging.getLogger(__name__)

# Waffle switches namespace for videos
WAFFLE_NAMESPACE = 'videos'

# Waffle switch for enabling/disabling video image upload feature
VIDEO_IMAGE_UPLOAD_ENABLED = WaffleSwitch(  # lint-amnesty, pylint: disable=toggle-missing-annotation
    f'{WAFFLE_NAMESPACE}.video_image_upload_enabled', __name__
)

# Waffle flag namespace for studio
WAFFLE_STUDIO_FLAG_NAMESPACE = 'studio'

ENABLE_VIDEO_UPLOAD_PAGINATION = CourseWaffleFlag(  # lint-amnesty, pylint: disable=toggle-missing-annotation
    f'{WAFFLE_STUDIO_FLAG_NAMESPACE}.enable_video_upload_pagination', __name__
)
# Default expiration, in seconds, of one-time URLs used for uploading videos.
KEY_EXPIRATION_IN_SECONDS = 86400

VIDEO_SUPPORTED_FILE_FORMATS = {
    '.mp4': 'video/mp4',
    '.mov': 'video/quicktime',
}

VIDEO_UPLOAD_MAX_FILE_SIZE_GB = 5

# maximum time for video to remain in upload state
MAX_UPLOAD_HOURS = 24

VIDEOS_PER_PAGE = 100


class TranscriptProvider:
    """
    Transcription Provider Enumeration
    """
    CIELO24 = 'Cielo24'
    THREE_PLAY_MEDIA = '3PlayMedia'
    CUSTOM = 'Custom'


class StatusDisplayStrings:
    """
    A class to map status strings as stored in VAL to display strings for the
    video upload page
    """

    # Translators: This is the status of an active video upload
    _UPLOADING = gettext_noop("Uploading")
    # Translators: This is the status for a video that the servers are currently processing
    _IN_PROGRESS = gettext_noop("In Progress")
    # Translators: This is the status for a video that the servers have successfully processed
    _COMPLETE = gettext_noop("Ready")
    # Translators: This is the status for a video that is uploaded completely
    _UPLOAD_COMPLETED = gettext_noop("Uploaded")
    # Translators: This is the status for a video that the servers have failed to process
    _FAILED = gettext_noop("Failed")
    # Translators: This is the status for a video that is cancelled during upload by user
    _CANCELLED = gettext_noop("Cancelled")
    # Translators: This is the status for a video which has failed
    # due to being flagged as a duplicate by an external or internal CMS
    _DUPLICATE = gettext_noop("Failed Duplicate")
    # Translators: This is the status for a video which has duplicate token for youtube
    _YOUTUBE_DUPLICATE = gettext_noop("YouTube Duplicate")
    # Translators: This is the status for a video for which an invalid
    # processing token was provided in the course settings
    _INVALID_TOKEN = gettext_noop("Invalid Token")
    # Translators: This is the status for a video that was included in a course import
    _IMPORTED = gettext_noop("Imported")
    # Translators: This is the status for a video that is in an unknown state
    _UNKNOWN = gettext_noop("Unknown")
    # Translators: This is the status for a video that is having its transcription in progress on servers
    _TRANSCRIPTION_IN_PROGRESS = gettext_noop("Transcription in Progress")
    # Translators: This is the status for a video whose transcription is complete
    _TRANSCRIPT_READY = gettext_noop("Transcript Ready")
    # Translators: This is the status for a video whose transcription job was failed for some languages
    _PARTIAL_FAILURE = gettext_noop("Partial Failure")
    # Translators: This is the status for a video whose transcription job has failed altogether
    _TRANSCRIPT_FAILED = gettext_noop("Transcript Failed")

    _STATUS_MAP = {
        "upload": _UPLOADING,
        "ingest": _IN_PROGRESS,
        "transcode_queue": _IN_PROGRESS,
        "transcode_active": _IN_PROGRESS,
        "file_delivered": _COMPLETE,
        "file_complete": _COMPLETE,
        "upload_completed": _UPLOAD_COMPLETED,
        "file_corrupt": _FAILED,
        "pipeline_error": _FAILED,
        "upload_failed": _FAILED,
        "s3_upload_failed": _FAILED,
        "upload_cancelled": _CANCELLED,
        "duplicate": _DUPLICATE,
        "youtube_duplicate": _YOUTUBE_DUPLICATE,
        "invalid_token": _INVALID_TOKEN,
        "imported": _IMPORTED,
        "transcription_in_progress": _TRANSCRIPTION_IN_PROGRESS,
        "transcript_ready": _TRANSCRIPT_READY,
        "partial_failure": _PARTIAL_FAILURE,
        # TODO: Add a related unit tests when the VAL update is part of platform
        "transcript_failed": _TRANSCRIPT_FAILED,
    }

    @staticmethod
    def get(val_status):
        """Map a VAL status string to a display string"""
        return StatusDisplayStrings._STATUS_MAP.get(val_status, StatusDisplayStrings._UNKNOWN)


def handle_videos(request, course_key_string, edx_video_id=None):
    """
    Restful handler for video uploads.

    GET
        html: return an HTML page to display previous video uploads and allow
            new ones
        json: return json representing the videos that have been uploaded and
            their statuses
    POST
        json: generate new video upload urls, for example upload urls for S3 buckets. To upload the video, you should
            make a PUT request to the returned upload_url values. This can happen on the frontend, MFE,
            or client side - it is not implemented in the backend.
            Example payload:
                {
                    "files": [{
                        "file_name": "video.mp4",
                        "content_type": "video/mp4"
                    }]
                }
            Returns (JSON):
                {
                    "files": [{
                        "file_name": "video.mp4",
                        "upload_url": "http://example.com/put_video"
                    }]
                }
    DELETE
        soft deletes a video for particular course
    """
    course = _get_and_validate_course(course_key_string, request.user)

    if (not course and not use_mock_video_uploads()):
        return HttpResponseNotFound()

    if request.method == "GET":
        if "application/json" in request.META.get("HTTP_ACCEPT", ""):
            return videos_index_json(course)
        pagination_conf = _generate_pagination_configuration(course_key_string, request)
        return videos_index_html(course, pagination_conf)
    elif request.method == "DELETE":
        remove_video_for_course(course_key_string, edx_video_id)
        return JsonResponse()
    else:
        if is_status_update_request(request.json):
            return send_video_status_update(request.json)
        elif _is_pagination_context_update_request(request):
            return _update_pagination_context(request)

        data, status = videos_post(course, request)
        return JsonResponse(data, status=status)


def send_zip(zip_file, size=None):
    """
    Generates a streaming http response for the zip file
    """
    wrapper = FileWrapper(zip_file, settings.COURSE_EXPORT_DOWNLOAD_CHUNK_SIZE)
    response = StreamingHttpResponse(wrapper, content_type='application/zip')
    response['Content-Dispositon'] = 'attachment; filename=%s' % os.path.basename(zip_file.name)
    response['Content-Length'] = size
    return response


def create_video_zip(course_key_string, files):
    """
    Generates the video zip, or returns None if there was an error.

    Updates the context with any error information if applicable.
    """
    name = course_key_string + '_videos'
    video_folder_zip = NamedTemporaryFile(prefix=name + '_',
                                          suffix=".zip")  # lint-amnesty, pylint: disable=consider-using-with
    root_dir = path(mkdtemp())
    video_dir = root_dir + '/' + name
    zip_folder = None
    try:
        for file in files:
            url = file['url']
            file_name = file['name']
            response = requests.get(url, allow_redirects=True)
            file_type = '.' + response.headers['Content-Type'][6:]
            if file_type not in file_name:
                file_name = file['name'] + file_type
            if not os.path.isdir(video_dir):
                os.makedirs(video_dir)
            with OSFS(video_dir).open(file_name, mode="wb") as f:
                f.write(response.content)
        directory = pathlib.Path(video_dir)
        with zipfile.ZipFile(video_folder_zip, mode="w") as archive:
            for file_path in directory.iterdir():
                archive.write(file_path, arcname=file_path.name)
        zip_folder = open(video_folder_zip.name, '+rb')

        return send_zip(zip_folder, video_folder_zip.tell())
    finally:
        if os.path.exists(root_dir / name):
            shutil.rmtree(root_dir / name)


def get_video_usage_path(course_key, edx_video_id):
    """
    API for fetching the locations a specific video is used in a course.
    Returns a list of paths to a video.
    """
    store = modulestore()
    usage_locations = []
    videos = store.get_items(
        course_key,
        qualifiers={
            'category': 'video'
        },
    )

    for video in videos:
        video_id = getattr(video, 'edx_video_id', '')
        try:
            if video_id == edx_video_id:
                usage_dict = {'display_location': '', 'url': ''}
                video_location = str(video.location)
                xblock_display_name = getattr(video, 'display_name', '')
                unit = video.get_parent()
                unit_location = str(video.parent)
                unit_display_name = getattr(unit, 'display_name', '')
                subsection = unit.get_parent()
                subsection_display_name = getattr(subsection, 'display_name', '')
                usage_dict['display_location'] = (f'{subsection_display_name} - '
                                                  f'{unit_display_name} / {xblock_display_name}')
                usage_dict['url'] = f'/container/{unit_location}#{video_location}'
                usage_locations.append(usage_dict)
        except AttributeError:
            continue

    return {'usage_locations': usage_locations}


def handle_generate_video_upload_link(request, course_key_string):
    """
    API for creating a video upload.  Returns an edx_video_id and a presigned URL that can be used
    to upload the video to AWS S3.
    """
    course = _get_and_validate_course(course_key_string, request.user)
    if not course:
        return Response(data='Course Not Found', status=rest_status.HTTP_400_BAD_REQUEST)

    data, status = videos_post(course, request)
    return Response(data, status=status)


def handle_video_images(request, course_key_string, edx_video_id=None):
    """Function to handle image files"""

    # respond with a 404 if image upload is not enabled.
    if not VIDEO_IMAGE_UPLOAD_ENABLED.is_enabled() and not use_mock_video_uploads():
        return HttpResponseNotFound()

    if 'file' not in request.FILES:
        return JsonResponse({'error': _('An image file is required.')}, status=400)

    image_file = request.FILES['file']
    error = validate_video_image(image_file)
    if error:
        return JsonResponse({'error': error}, status=400)

    with closing(image_file):
        image_url = update_video_image(edx_video_id, course_key_string, image_file, image_file.name)
        LOGGER.info(
            'VIDEOS: Video image uploaded for edx_video_id [%s] in course [%s]', edx_video_id, course_key_string
        )

    return JsonResponse({'image_url': image_url})


def check_video_images_upload_enabled(request):
    """Function to check if images can be uploaded"""
    # respond with a false if image upload is not enabled.
    if not VIDEO_IMAGE_UPLOAD_ENABLED.is_enabled():
        return JsonResponse({'allowThumbnailUpload': False})

    return JsonResponse({'allowThumbnailUpload': True})


def enabled_video_features(request):
    """ Return a dict with info about which video features are enabled """

    features = {
        'allowThumbnailUpload': VIDEO_IMAGE_UPLOAD_ENABLED.is_enabled(),
        'videoSharingEnabled': PUBLIC_VIDEO_SHARE.is_enabled(),
    }
    return JsonResponse(features)


def validate_transcript_preferences(provider, cielo24_fidelity, cielo24_turnaround,
                                    three_play_turnaround, video_source_language, preferred_languages):
    """
    Validate 3rd Party Transcription Preferences.

    Arguments:
        provider: Transcription provider
        cielo24_fidelity:  Cielo24 transcription fidelity.
        cielo24_turnaround: Cielo24 transcription turnaround.
        three_play_turnaround: 3PlayMedia transcription turnaround.
        video_source_language: Source/Speech language of the videos that are going to be submitted to the Providers.
        preferred_languages: list of language codes.

    Returns:
        validated preferences or a validation error.
    """
    error, preferences = None, {}

    # validate transcription providers
    transcription_plans = get_3rd_party_transcription_plans()
    if provider in list(transcription_plans.keys()):   # lint-amnesty, pylint: disable=consider-iterating-dictionary

        # Further validations for providers
        if provider == TranscriptProvider.CIELO24:

            # Validate transcription fidelity
            if cielo24_fidelity in transcription_plans[provider]['fidelity']:

                # Validate transcription turnaround
                if cielo24_turnaround not in transcription_plans[provider]['turnaround']:
                    error = f'Invalid cielo24 turnaround {cielo24_turnaround}.'
                    return error, preferences

                # Validate transcription languages
                supported_languages = transcription_plans[provider]['fidelity'][cielo24_fidelity]['languages']
                if video_source_language not in supported_languages:
                    error = f'Unsupported source language {video_source_language}.'
                    return error, preferences

                if not preferred_languages or not set(preferred_languages) <= set(supported_languages.keys()):
                    error = f'Invalid languages {preferred_languages}.'
                    return error, preferences

                # Validated Cielo24 preferences
                preferences = {
                    'video_source_language': video_source_language,
                    'cielo24_fidelity': cielo24_fidelity,
                    'cielo24_turnaround': cielo24_turnaround,
                    'preferred_languages': preferred_languages,
                }
            else:
                error = f'Invalid cielo24 fidelity {cielo24_fidelity}.'
        elif provider == TranscriptProvider.THREE_PLAY_MEDIA:

            # Validate transcription turnaround
            if three_play_turnaround not in transcription_plans[provider]['turnaround']:
                error = f'Invalid 3play turnaround {three_play_turnaround}.'
                return error, preferences

            # Validate transcription languages
            valid_translations_map = transcription_plans[provider]['translations']
            if video_source_language not in list(valid_translations_map.keys()):
                error = f'Unsupported source language {video_source_language}.'
                return error, preferences

            valid_target_languages = valid_translations_map[video_source_language]
            if not preferred_languages or not set(preferred_languages) <= set(valid_target_languages):
                error = f'Invalid languages {preferred_languages}.'
                return error, preferences

            # Validated 3PlayMedia preferences
            preferences = {
                'three_play_turnaround': three_play_turnaround,
                'video_source_language': video_source_language,
                'preferred_languages': preferred_languages,
            }
    else:
        error = f'Invalid provider {provider}.'

    return error, preferences


def handle_transcript_preferences(request, course_key_string):
    """
    JSON view handler to post the transcript preferences.

    Arguments:
        request: WSGI request object
        course_key_string: string for course key

    Returns: valid json response or 400 with error message
    """
    course_key = CourseKey.from_string(course_key_string)
    is_video_transcript_enabled = VideoTranscriptEnabledFlag.feature_enabled(course_key)
    if not is_video_transcript_enabled:
        return HttpResponseNotFound()
    if request.method == 'POST':
        data = request.json
        provider = data.get('provider')
        error, preferences = validate_transcript_preferences(
            provider=provider,
            cielo24_fidelity=data.get('cielo24_fidelity', ''),
            cielo24_turnaround=data.get('cielo24_turnaround', ''),
            three_play_turnaround=data.get('three_play_turnaround', ''),
            video_source_language=data.get('video_source_language'),
            preferred_languages=list(map(str, data.get('preferred_languages', [])))
        )
        if error:
            response = JsonResponse({'error': error}, status=400)
        else:
            preferences.update({'provider': provider})
            transcript_preferences = create_or_update_transcript_preferences(course_key_string, **preferences)
            response = JsonResponse({'transcript_preferences': transcript_preferences}, status=200)

        return response
    elif request.method == 'DELETE':
        remove_transcript_preferences(course_key_string)
        return JsonResponse()


def get_video_encodings_download(request, course_key_string):
    """
    Returns a CSV report containing the encoded video URLs for video uploads
    in the following format:

    Video ID,Name,Status,Profile1 URL,Profile2 URL
    aaaaaaaa-aaaa-4aaa-aaaa-aaaaaaaaaaaa,video.mp4,Complete,http://example.com/prof1.mp4,http://example.com/prof2.mp4
    """
    course = _get_and_validate_course(course_key_string, request.user)

    if not course:
        return HttpResponseNotFound()

    def get_profile_header(profile):
        """Returns the column header string for the given profile's URLs"""
        # Translators: This is the header for a CSV file column
        # containing URLs for video encodings for the named profile
        # (e.g. desktop, mobile high quality, mobile low quality)
        return _("{profile_name} URL").format(profile_name=profile)

    profile_whitelist = VideoUploadConfig.get_profile_whitelist()
    videos, __ = _get_videos(course)
    videos = list(videos)
    name_col = _("Name")
    duration_col = _("Duration")
    added_col = _("Date Added")
    video_id_col = _("Video ID")
    status_col = _("Status")
    profile_cols = [get_profile_header(profile) for profile in profile_whitelist]

    def make_csv_dict(video):
        """
        Makes a dictionary suitable for writing CSV output. This involves
        extracting the required items from the original video dict and
        converting all keys and values to UTF-8 encoded string objects,
        because the CSV module doesn't play well with unicode objects.
        """
        # Translators: This is listed as the duration for a video that has not
        # yet reached the point in its processing by the servers where its
        # duration is determined.
        duration_val = str(video["duration"]) if video["duration"] > 0 else _("Pending")
        ret = dict(
            [
                (name_col, video["client_video_id"]),
                (duration_col, duration_val),
                (added_col, video["created"].isoformat()),
                (video_id_col, video["edx_video_id"]),
                (status_col, video["status"]),
            ] +
            [
                (get_profile_header(encoded_video["profile"]), encoded_video["url"])
                for encoded_video in video["encoded_videos"]
                if encoded_video["profile"] in profile_whitelist
            ]
        )
        return dict(ret.items())

    # Write csv to bytes-like object. We need a separate writer and buffer as the csv
    # writer writes str and the FileResponse expects a bytes files.
    buffer = io.BytesIO()
    buffer_writer = codecs.getwriter("utf-8")(buffer)
    writer = csv.DictWriter(
        buffer_writer,
        [name_col, duration_col, added_col, video_id_col, status_col] + profile_cols,
        dialect=csv.excel
    )
    writer.writeheader()
    for video in videos:
        writer.writerow(make_csv_dict(video))
    buffer.seek(0)

    # Translators: This is the suggested filename when downloading the URL
    # listing for videos uploaded through Studio
    filename = _("{course}_video_urls").format(course=course.id.course) + ".csv"
    return FileResponse(buffer, as_attachment=True, filename=filename, content_type="text/csv")


def _get_and_validate_course(course_key_string, user):
    """
    Given a course key, return the course if it exists, the given user has
    access to it, and it is properly configured for video uploads
    """
    course_key = CourseKey.from_string(course_key_string)

    # For now, assume all studio users that have access to the course can upload videos.
    # In the future, we plan to add a new org-level role for video uploaders.
    course = get_course_and_check_access(course_key, user)

    if (
        settings.FEATURES["ENABLE_VIDEO_UPLOAD_PIPELINE"] and
        getattr(settings, "VIDEO_UPLOAD_PIPELINE", None) and
        course and
        course.video_pipeline_configured
    ):
        return course
    else:
        return None


def convert_video_status(video, is_video_encodes_ready=False):
    """
    Convert status of a video. Status can be converted to one of the following:

        *   FAILED if video is in `upload` state for more than 24 hours
        *   `YouTube Duplicate` if status is `invalid_token`
        *   user-friendly video status
    """
    now = datetime.now(video.get('created', datetime.now().replace(tzinfo=UTC)).tzinfo)

    if video['status'] == 'upload' and (now - video['created']) > timedelta(hours=MAX_UPLOAD_HOURS):
        new_status = 'upload_failed'
        status = StatusDisplayStrings.get(new_status)
        message = 'Video with id [{}] is still in upload after [{}] hours, setting status to [{}]'.format(
            video['edx_video_id'], MAX_UPLOAD_HOURS, new_status
        )
        send_video_status_update([
            {
                'edxVideoId': video['edx_video_id'],
                'status': new_status,
                'message': message
            }
        ])
    elif video['status'] == 'invalid_token':
        status = StatusDisplayStrings.get('youtube_duplicate')
    elif is_video_encodes_ready:
        status = StatusDisplayStrings.get('file_complete')
    else:
        status = StatusDisplayStrings.get(video['status'])

    return status


def _get_videos(course, pagination_conf=None):
    """
    Retrieves the list of videos from VAL corresponding to this course.
    """
    videos, pagination_context = get_videos_for_course(
        str(course.id),
        VideoSortField.created,
        SortDirection.desc,
        pagination_conf
    )
    videos = list(videos)

    # This is required to see if edx video pipeline is enabled while converting the video status.
    course_video_upload_token = course.video_upload_pipeline.get('course_video_upload_token')
    transcription_statuses = ['transcription_in_progress', 'transcript_ready', 'partial_failure', 'transcript_failed']

    # convert VAL's status to studio's Video Upload feature status.
    for video in videos:
        # If we are using "new video workflow" and status is in `transcription_statuses` then video encodes are ready.
        # This is because Transcription starts once all the encodes are complete except for YT, but according to
        # "new video workflow" YT is disabled as well as deprecated. So, Its precise to say that the Transcription
        # starts once all the encodings are complete *for the new video workflow*.
        is_video_encodes_ready = not course_video_upload_token and (video['status'] in transcription_statuses)
        # Update with transcript languages
        video['transcripts'] = get_available_transcript_languages(video_id=video['edx_video_id'])
        video['transcription_status'] = (
            StatusDisplayStrings.get(video['status']) if is_video_encodes_ready else ''
        )
        video['transcript_urls'] = {}
        for language_code in video['transcripts']:
            video['transcript_urls'][language_code] = get_video_transcript_url(
                video_id=video['edx_video_id'],
                language_code=language_code,
            )
        # Convert the video status.
        # Legacy frontend expects the status to be translated unlike MFEs which handle translation themselves.
        video['status_nontranslated'] = convert_video_status(video, is_video_encodes_ready)
        # pylint: disable=translation-of-non-string
        video['status'] = _(video['status_nontranslated'])

    return videos, pagination_context


def _get_default_video_image_url():
    """
    Returns default video image url
    """
    return staticfiles_storage.url(settings.VIDEO_IMAGE_DEFAULT_FILENAME)


def _get_index_videos(course, pagination_conf=None):
    """
    Returns the information about each video upload required for the video list
    """
    course_id = str(course.id)
    attrs = [
        'edx_video_id', 'client_video_id', 'created', 'duration', 'status_nontranslated',
        'status', 'courses', 'encoded_videos', 'transcripts', 'transcription_status',
        'transcript_urls', 'error_description'
    ]

    def _get_values(video, course):
        """
        Get data for predefined video attributes.
        """
        values = {}
        for attr in attrs:
            if attr == 'courses':
                current_course = [c for c in video['courses'] if course_id in c]
                if current_course:
                    values['course_video_image_url'] = current_course[0][course_id]
                else:
                    values['course_video_image_url'] = None
            elif attr == 'encoded_videos':
                values['download_link'] = ''
                values['file_size'] = 0
                for encoding in video['encoded_videos']:
                    if encoding['profile'] == 'desktop_mp4':
                        values['download_link'] = encoding['url']
                        values['file_size'] = encoding['file_size']
            else:
                values[attr] = video[attr]
        return values

    videos, pagination_context = _get_videos(course, pagination_conf)
    return [_get_values(video, course) for video in videos], pagination_context


def get_all_transcript_languages():
    """
    Returns all possible languages for transcript.
    """
    third_party_transcription_languages = {}
    transcription_plans = get_3rd_party_transcription_plans()
    cielo_fidelity = transcription_plans[TranscriptProvider.CIELO24]['fidelity']

    # Get third party transcription languages.
    third_party_transcription_languages.update(transcription_plans[TranscriptProvider.THREE_PLAY_MEDIA]['languages'])
    third_party_transcription_languages.update(cielo_fidelity['MECHANICAL']['languages'])
    third_party_transcription_languages.update(cielo_fidelity['PREMIUM']['languages'])
    third_party_transcription_languages.update(cielo_fidelity['PROFESSIONAL']['languages'])

    # combines ALL_LANGUAGES with additional languages that should be supported for transcripts
    extended_all_languages = settings.ALL_LANGUAGES + settings.EXTENDED_VIDEO_TRANSCRIPT_LANGUAGES
    all_languages_dict = dict(extended_all_languages, **third_party_transcription_languages)
    # Return combined system settings and 3rd party transcript languages.
    all_languages = []
    for key, value in sorted(all_languages_dict.items(), key=lambda k_v: k_v[1]):
        all_languages.append({
            'language_code': key,
            'language_text': value
        })
    return all_languages


def videos_index_html(course, pagination_conf=None):
    """
    Returns an HTML page to display previous video uploads and allow new ones
    """
    return redirect(get_video_uploads_url(course.id))


def videos_index_json(course):
    """
    Returns JSON in the following format:
    {
        'videos': [{
            'edx_video_id': 'aaaaaaaa-aaaa-4aaa-aaaa-aaaaaaaaaaaa',
            'client_video_id': 'video.mp4',
            'created': '1970-01-01T00:00:00Z',
            'duration': 42.5,
            'status': 'upload',
            'course_video_image_url': 'https://video/images/1234.jpg'
        }]
    }
    """
    index_videos, __ = _get_index_videos(course)
    return JsonResponse({"videos": index_videos}, status=200)


def videos_post(course, request):
    """
    Input (JSON):
    {
        "files": [{
            "file_name": "video.mp4",
            "content_type": "video/mp4"
        }]
    }

    Returns (JSON):
    {
        "files": [{
            "file_name": "video.mp4",
            "upload_url": "http://example.com/put_video"
        }]
    }

    The returned array corresponds exactly to the input array.
    """

    if use_mock_video_uploads():
        return {'files': [{
            'file_name': 'video.mp4', 'upload_url': 'http://example.com/put_video', 'edx_video_id': '1234'
        }]}, 200

    error = None
    data = request.json
    if 'files' not in data:
        error = "Request object is not JSON or does not contain 'files'"
    elif any(
        'file_name' not in file or 'content_type' not in file
        for file in data['files']
    ):
        error = "Request 'files' entry does not contain 'file_name' and 'content_type'"
    elif any(
        file['content_type'] not in list(VIDEO_SUPPORTED_FILE_FORMATS.values())
        for file in data['files']
    ):
        error = "Request 'files' entry contain unsupported content_type"

    if error:
        return {'error': error}, 400

    bucket = storage_service_bucket()
    req_files = data['files']
    resp_files = []

    for req_file in req_files:
        file_name = req_file['file_name']

        try:
            file_name.encode('ascii')
        except UnicodeEncodeError:
            error_msg = 'The file name for %s must contain only ASCII characters.' % file_name
            return {'error': error_msg}, 400

        edx_video_id = str(uuid4())
        key_name = storage_service_key(bucket, file_name=edx_video_id)

        metadata_list = [
            ('client_video_id', file_name),
            ('course_key', str(course.id)),
        ]

        course_video_upload_token = course.video_upload_pipeline.get('course_video_upload_token')

        # Only include `course_video_upload_token` if youtube has not been deprecated
        # for this course.
        if not DEPRECATE_YOUTUBE.is_enabled(course.id) and course_video_upload_token:
            metadata_list.append(('course_video_upload_token', course_video_upload_token))

        is_video_transcript_enabled = VideoTranscriptEnabledFlag.feature_enabled(course.id)
        if is_video_transcript_enabled:
            transcript_preferences = get_transcript_preferences(str(course.id))
            if transcript_preferences is not None:
                metadata_list.append(('transcript_preferences', json.dumps(transcript_preferences)))

        # Prepare metadata for presigned URL
        metadata = dict(metadata_list)

        # Generate presigned URL using boto3
        s3_client = bucket.meta.client
        upload_url = s3_client.generate_presigned_url(
            'put_object',
            Params={
                'Bucket': bucket.name,
                'Key': key_name,
                'ContentType': req_file['content_type'],
                'Metadata': metadata
            },
            ExpiresIn=KEY_EXPIRATION_IN_SECONDS
        )

        # persist edx_video_id in VAL
        create_video({
            'edx_video_id': edx_video_id,
            'status': 'upload',
            'client_video_id': file_name,
            'duration': 0,
            'encoded_videos': [],
            'courses': [str(course.id)]
        })

        resp_files.append({'file_name': file_name, 'upload_url': upload_url, 'edx_video_id': edx_video_id})

    return {'files': resp_files}, 200


def storage_service_bucket():
    """
    Returns an S3 bucket for video upload.
    """
    if ENABLE_DEVSTACK_VIDEO_UPLOADS.is_enabled():
        params = {
            'aws_access_key_id': settings.AWS_ACCESS_KEY_ID,
            'aws_secret_access_key': settings.AWS_SECRET_ACCESS_KEY,
            'security_token': settings.AWS_SECURITY_TOKEN

        }
    else:
        params = {
            'aws_access_key_id': settings.AWS_ACCESS_KEY_ID,
            'aws_secret_access_key': settings.AWS_SECRET_ACCESS_KEY
        }

    conn = boto3.resource("s3", **params)

    return conn.Bucket(settings.VIDEO_UPLOAD_PIPELINE['VEM_S3_BUCKET'])


def storage_service_key(bucket, file_name):
    """
    Returns an S3 key name for the given file in the given bucket.
    """
    return "{}/{}".format(
        settings.VIDEO_UPLOAD_PIPELINE.get("ROOT_PATH", ""),
        file_name
    )


def send_video_status_update(updates):
    """
    Update video status in edx-val.
    """
    for update in updates:
        update_video_status(update.get('edxVideoId'), update.get('status'))
        LOGGER.info(
            'VIDEOS: Video status update with id [%s], status [%s] and message [%s]',
            update.get('edxVideoId'),
            update.get('status'),
            update.get('message')
        )

    return JsonResponse()


def is_status_update_request(request_data):
    """
    Returns True if `request_data` contains status update else False.
    """
    return any('status' in update for update in request_data)


def _generate_pagination_configuration(course_key_string, request):
    """
    Returns pagination configuration
    """
    course_key = CourseKey.from_string(course_key_string)
    if not ENABLE_VIDEO_UPLOAD_PAGINATION.is_enabled(course_key):
        return None
    return {
        'page_number': request.GET.get('page', 1),
        'videos_per_page': request.session.get("VIDEOS_PER_PAGE", VIDEOS_PER_PAGE)
    }


def _is_pagination_context_update_request(request):
    """
    Checks if request contains `videos_per_page`
    """
    return request.POST.get('id', '') == "videos_per_page"


def _update_pagination_context(request):
    """
    Updates session with posted value
    """
    error_msg = _('A non zero positive integer is expected')
    try:
        videos_per_page = int(request.POST.get('value'))
        if videos_per_page <= 0:
            return JsonResponse({'error': error_msg}, status=500)
    except ValueError:
        return JsonResponse({'error': error_msg}, status=500)

    request.session['VIDEOS_PER_PAGE'] = videos_per_page
    return JsonResponse()


def get_course_youtube_edx_video_ids(course_id):
    """
    Get a list of youtube edx_video_ids
    """
    invalid_key_error_msg = "Invalid course_key: '%s'." % course_id
    unexpected_error_msg = "Unexpected error occurred for course_id: '%s'." % course_id

    try:  # lint-amnesty, pylint: disable=too-many-nested-blocks
        course_key = CourseKey.from_string(course_id)
        course = modulestore().get_course(course_key)

        blocks = []
        block_yt_field = 'youtube_id_1_0'
        block_edx_id_field = 'edx_video_id'
        if hasattr(course, 'get_children'):
            for section in course.get_children():
                for subsection in section.get_children():
                    for vertical in subsection.get_children():
                        for block in vertical.get_children():
                            blocks.append(block)

        edx_video_ids = []
        for block in blocks:
            if hasattr(block, block_yt_field) and getattr(block, block_yt_field):
                if getattr(block, block_edx_id_field):
                    edx_video_ids.append(getattr(block, block_edx_id_field))

    except InvalidKeyError as error:
        LOGGER.exception(
            f"InvalidKeyError occurred while getting YouTube video IDs for course_id: {course_id}: {error}"
        )
        return JsonResponse({'error': invalid_key_error_msg}, status=500)
    except (TypeError, AttributeError) as error:
        LOGGER.exception(
            f"Error occurred while getting YouTube video IDs for course_id: {course_id}: {error}"
        )
        return JsonResponse({'error': unexpected_error_msg}, status=500)

    return JsonResponse({'edx_video_ids': edx_video_ids}, status=200)