From 5c754fdaeeddb1bbeff165bbecb77e33b75b3c7d Mon Sep 17 00:00:00 2001
From: Joar Wandborg <joar@wandborg.se>
Date: Tue, 22 Jan 2013 22:44:19 +0100
Subject: [PATCH 01/16] Added option to skip transcoding

- If the video input matches the configurable rules, just copy it to the
  output without transcoding it.
---
 mediagoblin/config_spec.ini                  |  6 ++
 mediagoblin/media_types/video/processing.py  | 59 ++++++++++++-------
 mediagoblin/media_types/video/transcoders.py |  4 +-
 mediagoblin/media_types/video/util.py        | 60 ++++++++++++++++++++
 4 files changed, 109 insertions(+), 20 deletions(-)
 create mode 100644 mediagoblin/media_types/video/util.py

diff --git a/mediagoblin/config_spec.ini b/mediagoblin/config_spec.ini
index bee67d46..712d087e 100644
--- a/mediagoblin/config_spec.ini
+++ b/mediagoblin/config_spec.ini
@@ -97,6 +97,12 @@ vp8_quality = integer(default=8)
 # Range: -0.1..1
 vorbis_quality = float(default=0.3)
 
+[[skip_transcode]]
+mime_types = string_list(default=list("video/webm"))
+container_formats = string_list(default=list("Matroska"))
+video_codecs = string_list(default=list("VP8 video"))
+audio_codecs = string_list(default=list("Vorbis"))
+dimensions_match = boolean(default=True)
 
 [media_type:mediagoblin.media_types.audio]
 keep_original = boolean(default=True)
diff --git a/mediagoblin/media_types/video/processing.py b/mediagoblin/media_types/video/processing.py
index 4c9f0131..53fe1a73 100644
--- a/mediagoblin/media_types/video/processing.py
+++ b/mediagoblin/media_types/video/processing.py
@@ -24,6 +24,8 @@ from mediagoblin.processing import \
 from mediagoblin.tools.translate import lazy_pass_to_ugettext as _
 
 from . import transcoders
+from .util import skip_transcode
+
 
 _log = logging.getLogger(__name__)
 _log.setLevel(logging.DEBUG)
@@ -80,24 +82,43 @@ def process_video(entry, workbench=None):
     with tmp_dst:
         # Transcode queued file to a VP8/vorbis file that fits in a 640x640 square
         progress_callback = ProgressCallback(entry)
-        transcoder = transcoders.VideoTranscoder()
-        transcoder.transcode(queued_filename, tmp_dst.name,
-                vp8_quality=video_config['vp8_quality'],
-                vp8_threads=video_config['vp8_threads'],
-                vorbis_quality=video_config['vorbis_quality'],
-                progress_callback=progress_callback)
 
-    # Push transcoded video to public storage
-    _log.debug('Saving medium...')
-    mgg.public_store.copy_local_to_storage(tmp_dst.name, medium_filepath)
-    _log.debug('Saved medium')
+        dimensions = (
+            mgg.global_config['media:medium']['max_width'],
+            mgg.global_config['media:medium']['max_height'])
 
-    entry.media_files['webm_640'] = medium_filepath
+        metadata = transcoders.VideoTranscoder().discover(queued_filename)
 
-    # Save the width and height of the transcoded video
-    entry.media_data_init(
-        width=transcoder.dst_data.videowidth,
-        height=transcoder.dst_data.videoheight)
+        if skip_transcode(metadata):
+            _log.debug('Skipping transcoding')
+            # Just push the submitted file to the tmp_dst
+            open(tmp_dst.name, 'wb').write(open(queued_filename, 'rb').read())
+
+            dst_dimensions = metadata['videowidth'], metadata['videoheight']
+        else:
+            transcoder = transcoders.VideoTranscoder()
+
+            transcoder.transcode(queued_filename, tmp_dst.name,
+                    vp8_quality=video_config['vp8_quality'],
+                    vp8_threads=video_config['vp8_threads'],
+                    vorbis_quality=video_config['vorbis_quality'],
+                    progress_callback=progress_callback,
+                    dimensions=dimensions)
+
+            dst_dimensions = transcoder.dst_data.videowidth,\
+                    transcoder.dst_data.videoheight
+
+        # Push transcoded video to public storage
+        _log.debug('Saving medium...')
+        mgg.public_store.copy_local_to_storage(tmp_dst.name, medium_filepath)
+        _log.debug('Saved medium')
+
+        entry.media_files['webm_640'] = medium_filepath
+
+        # Save the width and height of the transcoded video
+        entry.media_data_init(
+            width=dst_dimensions[0],
+            height=dst_dimensions[1])
 
     # Temporary file for the video thumbnail (cleaned up with workbench)
     tmp_thumb = NamedTemporaryFile(dir=workbench.dir, suffix='.jpg', delete=False)
@@ -109,10 +130,10 @@ def process_video(entry, workbench=None):
                 tmp_thumb.name,
                 180)
 
-    # Push the thumbnail to public storage
-    _log.debug('Saving thumbnail...')
-    mgg.public_store.copy_local_to_storage(tmp_thumb.name, thumbnail_filepath)
-    entry.media_files['thumb'] = thumbnail_filepath
+        # Push the thumbnail to public storage
+        _log.debug('Saving thumbnail...')
+        mgg.public_store.copy_local_to_storage(tmp_thumb.name, thumbnail_filepath)
+        entry.media_files['thumb'] = thumbnail_filepath
 
     if video_config['keep_original']:
         # Push original file to public storage
diff --git a/mediagoblin/media_types/video/transcoders.py b/mediagoblin/media_types/video/transcoders.py
index 152de288..8aa7121f 100644
--- a/mediagoblin/media_types/video/transcoders.py
+++ b/mediagoblin/media_types/video/transcoders.py
@@ -673,6 +673,7 @@ class VideoTranscoder:
         self._setup()
         self._run()
 
+    # XXX: This could be a static method.
     def discover(self, src):
         '''
         Discover properties about a media file
@@ -793,7 +794,8 @@ class VideoTranscoder:
         self.audioconvert = gst.element_factory_make('audioconvert', 'audioconvert')
         self.pipeline.add(self.audioconvert)
 
-        self.audiocapsfilter = gst.element_factory_make('capsfilter', 'audiocapsfilter')
+        self.audiocapsfilter = gst.element_factory_make('capsfilter',
+                                                        'audiocapsfilter')
         audiocaps = ['audio/x-raw-float']
         self.audiocapsfilter.set_property(
             'caps',
diff --git a/mediagoblin/media_types/video/util.py b/mediagoblin/media_types/video/util.py
new file mode 100644
index 00000000..93f098f7
--- /dev/null
+++ b/mediagoblin/media_types/video/util.py
@@ -0,0 +1,60 @@
+# GNU MediaGoblin -- federated, autonomous media hosting
+# Copyright (C) 2011, 2012 MediaGoblin contributors.  See AUTHORS.
+#
+# This program is free software: you can redistribute it and/or modify
+# it under the terms of the GNU Affero General Public License as published by
+# the Free Software Foundation, either version 3 of the License, or
+# (at your option) any later version.
+#
+# This program is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU Affero General Public License for more details.
+#
+# You should have received a copy of the GNU Affero General Public License
+# along with this program.  If not, see <http://www.gnu.org/licenses/>.
+
+import logging
+
+from mediagoblin import mg_globals as mgg
+
+_log = logging.getLogger(__name__)
+
+
+def skip_transcode(metadata):
+    '''
+    Checks video metadata against configuration values for skip_transcode.
+
+    Returns True if the video matches the requirements in the configuration.
+    '''
+    config = mgg.global_config['media_type:mediagoblin.media_types.video']\
+            ['skip_transcode']
+
+    medium_config = mgg.global_config['media:medium']
+
+    _log.debug('skip_transcode config: {0}'.format(config))
+
+    if config['mime_types'] and metadata.get('mimetype'):
+        if not metadata['mimetype'] in config['mime_types']:
+            return False
+    # Each tag rule below is guarded by the presence of that *same* tag.
+    if config['container_formats'] and metadata['tags'].get('container-format'):
+        if not metadata['tags']['container-format'] in config['container_formats']:
+            return False
+
+    if config['video_codecs'] and metadata['tags'].get('video-codec'):
+        if not metadata['tags']['video-codec'] in config['video_codecs']:
+            return False
+
+    if config['audio_codecs'] and metadata['tags'].get('audio-codec'):
+        if not metadata['tags']['audio-codec'] in config['audio_codecs']:
+            return False
+
+    if config['dimensions_match']:
+        if not metadata['videoheight'] <= medium_config['max_height']:
+            return False
+        if not metadata['videowidth'] <= medium_config['max_width']:
+            return False
+
+    return True
+

From fd693e368bf7d344c29ff99b77acbb92f4524b73 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Fri, 1 Mar 2013 17:28:07 -0600
Subject: [PATCH 02/16] If we're not transcoding, copy this file directly over
 to ['original']

There's no reason to copy it over to 'webm_640' in such a case,
clearly.

Added logic so we don't do it twice either.

Haven't tested this yet though ;)

This commit sponsored by Algot Runeman.  Thank you!
---
 mediagoblin/media_types/video/processing.py | 23 +++++++++++++++------
 1 file changed, 17 insertions(+), 6 deletions(-)

diff --git a/mediagoblin/media_types/video/processing.py b/mediagoblin/media_types/video/processing.py
index 41929f3d..32313be7 100644
--- a/mediagoblin/media_types/video/processing.py
+++ b/mediagoblin/media_types/video/processing.py
@@ -94,6 +94,12 @@ def process_video(proc_state):
             open(tmp_dst.name, 'wb').write(open(queued_filename, 'rb').read())
 
             dst_dimensions = metadata['videowidth'], metadata['videoheight']
+
+            # Push original file to public storage
+            _log.debug('Saving original...')
+            proc_state.copy_original(queued_filepath[-1])
+
+            did_transcode = False
         else:
             transcoder = transcoders.VideoTranscoder()
 
@@ -107,12 +113,14 @@ def process_video(proc_state):
             dst_dimensions = transcoder.dst_data.videowidth,\
                     transcoder.dst_data.videoheight
 
-        # Push transcoded video to public storage
-        _log.debug('Saving medium...')
-        mgg.public_store.copy_local_to_storage(tmp_dst.name, medium_filepath)
-        _log.debug('Saved medium')
+            # Push transcoded video to public storage
+            _log.debug('Saving medium...')
+            mgg.public_store.copy_local_to_storage(tmp_dst.name, medium_filepath)
+            _log.debug('Saved medium')
 
-        entry.media_files['webm_640'] = medium_filepath
+            entry.media_files['webm_640'] = medium_filepath
+
+            did_transcode = True
 
         # Save the width and height of the transcoded video
         entry.media_data_init(
@@ -134,7 +142,10 @@ def process_video(proc_state):
         mgg.public_store.copy_local_to_storage(tmp_thumb.name, thumbnail_filepath)
         entry.media_files['thumb'] = thumbnail_filepath
 
-    if video_config['keep_original']:
+    # save the original... but only if we did a transcoding
+    # (if we skipped transcoding and just kept the original anyway as the main
+    #  media, then why would we save the original twice?)
+    if video_config['keep_original'] and did_transcode:
         # Push original file to public storage
         _log.debug('Saving original...')
         proc_state.copy_original(queued_filepath[-1])

From ddbf6af1e20222882a7ce559804ed48f4ad31a92 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sat, 2 Mar 2013 19:06:31 -0600
Subject: [PATCH 03/16] Huge amount of work to (mostly) allow .ogg (and maybe
 other) formats to skip transcode

 - Update get_display_media in several ways:
   - now uses the media type's own declaration of the order of things
   - returns both the media_size and the media_path, as per the docstring
   - implicitly uses self.media_files as opposed to forcing you to pass it in
 - update videos to use get_display_media
 - update images to declare media_fetch_order in the media manager (videos also)
 - update stl to use media.media_files['original'] instead of weird
   use of get_display_media
 - update sidebar to only conditionally show webm_640

TODO still: identify video type information *during* processing, show
that in the <video><source /></video> element.

This commit sponsored by Nathan Yergler.  Thanks, nyergler!
---
 mediagoblin/db/mixin.py                       | 24 ++++++++++++-------
 mediagoblin/media_types/image/__init__.py     |  6 ++++-
 mediagoblin/media_types/video/__init__.py     |  6 ++++-
 .../mediagoblin/media_displays/stl.html       |  2 +-
 .../mediagoblin/media_displays/video.html     |  8 ++++---
 .../mediagoblin/user_pages/media.html         |  2 +-
 mediagoblin/tools/common.py                   |  1 -
 7 files changed, 32 insertions(+), 17 deletions(-)

diff --git a/mediagoblin/db/mixin.py b/mediagoblin/db/mixin.py
index 6789a970..c4bd806c 100644
--- a/mediagoblin/db/mixin.py
+++ b/mediagoblin/db/mixin.py
@@ -126,24 +126,30 @@ class MediaEntryMixin(object):
         """
         return cleaned_markdown_conversion(self.description)
 
-    def get_display_media(self, media_map,
-                          fetch_order=common.DISPLAY_IMAGE_FETCHING_ORDER):
+    def get_display_media(self, fetch_order=None):
         """
         Find the best media for display.
 
         Args:
-        - media_map: a dict like
-          {u'image_size': [u'dir1', u'dir2', u'image.jpg']}
-        - fetch_order: the order we should try fetching images in
+        - fetch_order: the order we should try fetching media sizes in.
+            Defaults to the media manager's "media_fetch_order".
 
         Returns:
-        (media_size, media_path)
+          (media_size, media_path)
+          or, if not found, None.
         """
-        media_sizes = media_map.keys()
+        if fetch_order is None:
+            fetch_order = self.media_manager.get("media_fetch_order")
 
-        for media_size in common.DISPLAY_IMAGE_FETCHING_ORDER:
+        # No fetching order found?  well, give up!
+        if not fetch_order:
+            return None
+
+        media_sizes = self.media_files.keys()
+
+        for media_size in fetch_order:
             if media_size in media_sizes:
-                return media_map[media_size]
+                return media_size, self.media_files[media_size]
 
     def main_mediafile(self):
         pass
diff --git a/mediagoblin/media_types/image/__init__.py b/mediagoblin/media_types/image/__init__.py
index 36d7c201..3e167db1 100644
--- a/mediagoblin/media_types/image/__init__.py
+++ b/mediagoblin/media_types/image/__init__.py
@@ -25,4 +25,8 @@ MEDIA_MANAGER = {
     "sniff_handler": sniff_handler,
     "display_template": "mediagoblin/media_displays/image.html",
     "default_thumb": "images/media_thumbs/image.png",
-    "accepted_extensions": ["jpg", "jpeg", "png", "gif", "tiff"]}
+    "accepted_extensions": ["jpg", "jpeg", "png", "gif", "tiff"],
+
+    # Used by the media_entry.get_display_media method
+    "media_fetch_order": [u'medium', u'original', u'thumb'],
+}
diff --git a/mediagoblin/media_types/video/__init__.py b/mediagoblin/media_types/video/__init__.py
index 3faa5b9f..fd364c02 100644
--- a/mediagoblin/media_types/video/__init__.py
+++ b/mediagoblin/media_types/video/__init__.py
@@ -26,4 +26,8 @@ MEDIA_MANAGER = {
     "display_template": "mediagoblin/media_displays/video.html",
     "default_thumb": "images/media_thumbs/video.jpg",
     "accepted_extensions": [
-        "mp4", "mov", "webm", "avi", "3gp", "3gpp", "mkv", "ogv", "m4v"]}
+        "mp4", "mov", "webm", "avi", "3gp", "3gpp", "mkv", "ogv", "m4v"],
+
+    # Used by the media_entry.get_display_media method
+    "media_fetch_order": [u'webm_640', u'original'],
+}
diff --git a/mediagoblin/templates/mediagoblin/media_displays/stl.html b/mediagoblin/templates/mediagoblin/media_displays/stl.html
index 043faac8..a89e0b4f 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/stl.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/stl.html
@@ -23,7 +23,7 @@
 
 
 {% set model_download = request.app.public_store.file_url(
-   media.get_display_media(media.media_files)) %}
+   media.media_files['original']) %}
 {% set perspective_view = request.app.public_store.file_url(
    media.media_files['perspective']) %}
 {% set top_view = request.app.public_store.file_url(
diff --git a/mediagoblin/templates/mediagoblin/media_displays/video.html b/mediagoblin/templates/mediagoblin/media_displays/video.html
index 9eeb7c85..2e33e1a3 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/video.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/video.html
@@ -33,7 +33,7 @@
       data-setup='{"height": {{ media.media_data.height }},
                  "width": {{ media.media_data.width }} }'>
     <source src="{{ request.app.public_store.file_url(
-      	   media.media_files['webm_640']) }}"
+                        media.get_display_media()[1]) }}"
             type="video/webm; codecs=&quot;vp8, vorbis&quot;" />
     <div class="no_html5">
       {%- trans -%}Sorry, this video will not work because
@@ -53,7 +53,9 @@
       <li><a href="{{ request.app.public_store.file_url(
                        media.media_files.original) }}">{% trans %}Original file{% endtrans %}</a>
     {% endif %}
-    <li><a href="{{ request.app.public_store.file_url(
-                     media.media_files.webm_640) }}">{% trans %}WebM file (640p; VP8/Vorbis){% endtrans %}</a>
+    {% if 'webm_640' in media.media_files %}
+      <li><a href="{{ request.app.public_store.file_url(
+                       media.media_files.webm_640) }}">{% trans %}WebM file (640p; VP8/Vorbis){% endtrans %}</a>
+    {% endif %}
   </ul>
 {% endblock %}
diff --git a/mediagoblin/templates/mediagoblin/user_pages/media.html b/mediagoblin/templates/mediagoblin/user_pages/media.html
index f151c577..b77c12b9 100644
--- a/mediagoblin/templates/mediagoblin/user_pages/media.html
+++ b/mediagoblin/templates/mediagoblin/user_pages/media.html
@@ -47,7 +47,7 @@
     <div class="media_image_container">
       {% block mediagoblin_media %}
         {% set display_media = request.app.public_store.file_url(
-                 media.get_display_media(media.media_files)) %}
+                 media.get_display_media()[1]) %}
         {# if there's a medium file size, that means the medium size
          #  isn't the original... so link to the original!
          #}
diff --git a/mediagoblin/tools/common.py b/mediagoblin/tools/common.py
index c9f9d032..34586611 100644
--- a/mediagoblin/tools/common.py
+++ b/mediagoblin/tools/common.py
@@ -16,7 +16,6 @@
 
 import sys
 
-DISPLAY_IMAGE_FETCHING_ORDER = [u'medium', u'original', u'thumb']
 
 global TESTS_ENABLED
 TESTS_ENABLED = False

From 29adab4651cd2485441a08bb97ae0165e5be0017 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 10:36:37 -0600
Subject: [PATCH 04/16] Now store metadata info from processing into the media
 type.

This comes in several parts:
 - Store the metadata from gstreamer during processing
 - Add a new JSONEncoded field to the VideoData table
 - And, of course, add a migration for that field!

This commit sponsored by Julius Tuomisto.  Thank you, Julius!
---
 mediagoblin/media_types/video/migrations.py | 15 +++++++++++
 mediagoblin/media_types/video/models.py     | 19 ++++++++++++++
 mediagoblin/media_types/video/processing.py | 28 +++++++++++++++++++++
 3 files changed, 62 insertions(+)

diff --git a/mediagoblin/media_types/video/migrations.py b/mediagoblin/media_types/video/migrations.py
index f54c23ea..442bbd8d 100644
--- a/mediagoblin/media_types/video/migrations.py
+++ b/mediagoblin/media_types/video/migrations.py
@@ -14,4 +14,19 @@
 # You should have received a copy of the GNU Affero General Public License
 # along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
+from mediagoblin.db.migration_tools import RegisterMigration, inspect_table
+
+from sqlalchemy import MetaData, Column, Unicode
+
 MIGRATIONS = {}
+
+@RegisterMigration(1, MIGRATIONS)
+def add_orig_metadata_column(db_conn):
+    metadata = MetaData(bind=db_conn.bind)
+
+    vid_data = inspect_table(metadata, "video__mediadata")
+
+    col = Column('orig_metadata', Unicode,
+                 default=None, nullable=True)
+    col.create(vid_data)
+    db_conn.commit()
diff --git a/mediagoblin/media_types/video/models.py b/mediagoblin/media_types/video/models.py
index a771352c..e0043718 100644
--- a/mediagoblin/media_types/video/models.py
+++ b/mediagoblin/media_types/video/models.py
@@ -20,12 +20,29 @@ from mediagoblin.db.base import Base
 from sqlalchemy import (
     Column, Integer, SmallInteger, ForeignKey)
 from sqlalchemy.orm import relationship, backref
+from mediagoblin.db.extratypes import JSONEncoded
 
 
 BACKREF_NAME = "video__media_data"
 
 
 class VideoData(Base):
+    """
+    Attributes:
+     - media_data: the originating media entry (of course)
+     - width: width of the transcoded video
+     - height: height of the transcoded video
+     - orig_metadata: A loose json structure containing metadata gstreamer
+         pulled from the original video.
+         This field is NOT GUARANTEED to exist!
+    
+         Likely metadata extracted:
+           "videoheight", "videolength", "videowidth",
+           "audiorate", "audiolength", "audiochannels", "audiowidth",
+           "mimetype", "tags"
+     
+         TODO: document the above better.
+    """
     __tablename__ = "video__mediadata"
 
     # The primary key *and* reference to the main media_entry
@@ -38,6 +55,8 @@ class VideoData(Base):
     width = Column(SmallInteger)
     height = Column(SmallInteger)
 
+    orig_metadata = Column(JSONEncoded)
+
 
 DATA_MODEL = VideoData
 MODELS = [VideoData]
diff --git a/mediagoblin/media_types/video/processing.py b/mediagoblin/media_types/video/processing.py
index 32313be7..ec9ff225 100644
--- a/mediagoblin/media_types/video/processing.py
+++ b/mediagoblin/media_types/video/processing.py
@@ -86,8 +86,12 @@ def process_video(proc_state):
             mgg.global_config['media:medium']['max_width'],
             mgg.global_config['media:medium']['max_height'])
 
+        # Extract metadata and keep a record of it
         metadata = transcoders.VideoTranscoder().discover(queued_filename)
+        store_metadata(entry, metadata)
 
+        # Figure out whether or not we need to transcode this video or
+        # if we can skip it
         if skip_transcode(metadata):
             _log.debug('Skipping transcoding')
             # Just push the submitted file to the tmp_dst
@@ -152,3 +156,27 @@ def process_video(proc_state):
 
     # Remove queued media file from storage and database
     proc_state.delete_queue_file()
+
+
+def store_metadata(media_entry, metadata):
+    """
+    Store metadata from this video for this media entry.
+    """
+    # Let's pull out the easy, not having to be converted ones first
+    stored_metadata = dict(
+        [(key, metadata[key])
+         for key in [
+                 "videoheight", "videolength", "videowidth",
+                 "audiorate", "audiolength", "audiochannels", "audiowidth",
+                 "mimetype", "tags"]
+         if key in metadata])
+
+    # We have to convert videorate into a sequence because it's a
+    # special type normally..
+
+    if "videorate" in metadata:
+        videorate = metadata["videorate"]
+        stored_metadata["videorate"] = [videorate.num, videorate.denom]
+
+    media_entry.media_data_init(
+        orig_metadata=stored_metadata)

From 3ff006ef3b3b4dbd302ef8c30f5c3062e2954973 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 10:38:06 -0600
Subject: [PATCH 05/16] pdb.set_trace() in mediagoblin code is Not Allowed(TM),
 removing from audio code

Of course, the version that appears here is not really dangerous
because it's for the "call the file individually" form of debugging,
but it isn't allowed anyway.

This commit sponsored by Michael Faryniarz.  Thanks!
---
 mediagoblin/media_types/audio/transcoders.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/mediagoblin/media_types/audio/transcoders.py b/mediagoblin/media_types/audio/transcoders.py
index f3d49c30..3a9a2125 100644
--- a/mediagoblin/media_types/audio/transcoders.py
+++ b/mediagoblin/media_types/audio/transcoders.py
@@ -14,7 +14,6 @@
 # You should have received a copy of the GNU Affero General Public License
 # along with this program.  If not, see <http://www.gnu.org/licenses/>.
 
-import pdb
 import logging
 import Image
 
@@ -233,5 +232,3 @@ if __name__ == '__main__':
     thumbnailer = AudioThumbnailer()
 
     thumbnailer.spectrogram(*sys.argv[1:], width=640)
-
-    pdb.set_trace()

From 14814f217af471538774a5861469af157735d893 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 11:03:30 -0600
Subject: [PATCH 06/16] {% set %} the display_type and display_path and use
 that elsewhere

This will make some stuff a bit cleaner that's coming up...

This commit sponsored by J B Nicholson-Owens.  Thanks!
---
 mediagoblin/templates/mediagoblin/media_displays/video.html | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

diff --git a/mediagoblin/templates/mediagoblin/media_displays/video.html b/mediagoblin/templates/mediagoblin/media_displays/video.html
index 2e33e1a3..06f5f226 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/video.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/video.html
@@ -27,13 +27,14 @@
 {%- endblock %}
 
 {% block mediagoblin_media %}
+  {% set display_type, display_path = media.get_display_media() %}
+
   <video controls
          {% if global_config['media_type:mediagoblin.media_types.video']['auto_play'] %}autoplay{% endif %}
          preload="auto" class="video-js vjs-mg-skin"
       data-setup='{"height": {{ media.media_data.height }},
                  "width": {{ media.media_data.width }} }'>
-    <source src="{{ request.app.public_store.file_url(
-                        media.get_display_media()[1]) }}"
+    <source src="{{ request.app.public_store.file_url(display_path) }}"
             type="video/webm; codecs=&quot;vp8, vorbis&quot;" />
     <div class="no_html5">
       {%- trans -%}Sorry, this video will not work because

From b35dfd3271bb40168b3d8c9335238715584eac02 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 11:08:14 -0600
Subject: [PATCH 07/16] Mild cosmetic cleanups to video.html and adding missing
 </li> elements.

This commit sponsored by Jukka Hellen.  Thanks!
---
 .../mediagoblin/media_displays/video.html     | 24 ++++++++++++-------
 1 file changed, 16 insertions(+), 8 deletions(-)

diff --git a/mediagoblin/templates/mediagoblin/media_displays/video.html b/mediagoblin/templates/mediagoblin/media_displays/video.html
index 06f5f226..d30c6a2b 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/video.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/video.html
@@ -22,8 +22,8 @@
   {{ super() }}
   <script type="text/javascript" src="{{
      request.staticdirect('/extlib/video-js/video.min.js') }}"></script>
-  <link href="{{ request.staticdirect('/css/vjs-mg-skin.css')
-     }}" rel="stylesheet">
+  <link href="{{ request.staticdirect('/css/vjs-mg-skin.css') }}"
+        rel="stylesheet">
 {%- endblock %}
 
 {% block mediagoblin_media %}
@@ -32,8 +32,8 @@
   <video controls
          {% if global_config['media_type:mediagoblin.media_types.video']['auto_play'] %}autoplay{% endif %}
          preload="auto" class="video-js vjs-mg-skin"
-      data-setup='{"height": {{ media.media_data.height }},
-                 "width": {{ media.media_data.width }} }'>
+         data-setup='{"height": {{ media.media_data.height }},
+                      "width": {{ media.media_data.width }} }'>
     <source src="{{ request.app.public_store.file_url(display_path) }}"
             type="video/webm; codecs=&quot;vp8, vorbis&quot;" />
     <div class="no_html5">
@@ -51,12 +51,20 @@
   <h3>{% trans %}Download{% endtrans %}</h3>
   <ul>
     {% if 'original' in media.media_files %}
-      <li><a href="{{ request.app.public_store.file_url(
-                       media.media_files.original) }}">{% trans %}Original file{% endtrans %}</a>
+      <li>
+        <a href="{{ request.app.public_store.file_url(
+                       media.media_files.original) }}">
+          {%- trans %}Original file{% endtrans -%}
+        </a>
+      </li>
     {% endif %}
     {% if 'webm_640' in media.media_files %}
-      <li><a href="{{ request.app.public_store.file_url(
-                       media.media_files.webm_640) }}">{% trans %}WebM file (640p; VP8/Vorbis){% endtrans %}</a>
+      <li>
+        <a href="{{ request.app.public_store.file_url(
+                       media.media_files.webm_640) }}">
+          {%- trans %}WebM file (640p; VP8/Vorbis){% endtrans -%}
+        </a>
+      </li>
     {% endif %}
   </ul>
 {% endblock %}

From 787aafd64482de3a4d150c75ffec024e8e11f287 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 11:41:40 -0600
Subject: [PATCH 08/16] Extrapolate type= based on the video metadata that we
 have, if we can.

It's kind of awkward because it relies on there being an entry.media_data,
but that's not guaranteed... (see http://issues.mediagoblin.org/ticket/650)
so we use a dopey fallback in the template in that case (kind of
annoying info duplication).

This commit sponsored by Piotr Wieczorek.  Thank you!
---
 mediagoblin/media_types/video/models.py       | 29 +++++++++++++++++++
 mediagoblin/media_types/video/util.py         |  1 -
 .../mediagoblin/media_displays/video.html     |  6 +++-
 3 files changed, 34 insertions(+), 2 deletions(-)

diff --git a/mediagoblin/media_types/video/models.py b/mediagoblin/media_types/video/models.py
index e0043718..4639b8c8 100644
--- a/mediagoblin/media_types/video/models.py
+++ b/mediagoblin/media_types/video/models.py
@@ -26,6 +26,8 @@ from mediagoblin.db.extratypes import JSONEncoded
 BACKREF_NAME = "video__media_data"
 
 
+DEFAULT_WEBM_TYPE = 'video/webm; codecs="vp8, vorbis"'
+
 class VideoData(Base):
     """
     Attributes:
@@ -57,6 +59,33 @@ class VideoData(Base):
 
     orig_metadata = Column(JSONEncoded)
 
+    def source_type(self):
+        """
+        Construct a useful type=... that is to say, used like:
+          <video><source type="{{ entry.media_data.source_type() }}" /></video>
+
+        Try to construct it out of self.orig_metadata... if we fail we
+        just dope'ily fall back on DEFAULT_WEBM_TYPE
+        """
+        orig_metadata = self.orig_metadata or {}
+
+        if "webm_640" not in self.get_media_entry.media_files \
+           and "mimetype" in orig_metadata \
+           and "tags" in orig_metadata \
+           and "audio-codec" in orig_metadata["tags"] \
+           and "video-codec" in orig_metadata["tags"]:
+            if orig_metadata['mimetype'] == 'application/ogg':
+                # stupid ambiguous .ogg extension
+                mimetype = "video/ogg"
+            else:
+                mimetype = orig_metadata['mimetype']
+            return '%s; codecs="%s, %s"' % (
+                mimetype,
+                orig_metadata["tags"]["video-codec"].lower(),
+                orig_metadata["tags"]["audio-codec"].lower())
+        else:
+            return DEFAULT_WEBM_TYPE
+
 
 DATA_MODEL = VideoData
 MODELS = [VideoData]
diff --git a/mediagoblin/media_types/video/util.py b/mediagoblin/media_types/video/util.py
index 93f098f7..5765ecfb 100644
--- a/mediagoblin/media_types/video/util.py
+++ b/mediagoblin/media_types/video/util.py
@@ -57,4 +57,3 @@ def skip_transcode(metadata):
             return False
 
     return True
-
diff --git a/mediagoblin/templates/mediagoblin/media_displays/video.html b/mediagoblin/templates/mediagoblin/media_displays/video.html
index d30c6a2b..dc0c7b55 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/video.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/video.html
@@ -35,7 +35,11 @@
          data-setup='{"height": {{ media.media_data.height }},
                       "width": {{ media.media_data.width }} }'>
     <source src="{{ request.app.public_store.file_url(display_path) }}"
-            type="video/webm; codecs=&quot;vp8, vorbis&quot;" />
+            {% if media.media_data %}
+              type="{{ media.media_data.source_type() }}"
+            {% else %}
+              type="video/webm; codecs=&quot;vp8, vorbis&quot;"
+            {% endif %} />
     <div class="no_html5">
       {%- trans -%}Sorry, this video will not work because
       your web browser does not support HTML5 

From 9d4cebfd36b7bba3d8d4ad2cb97a85ec63068cb5 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 14:27:36 -0600
Subject: [PATCH 09/16] Per Elrond's suggestions moving DEFAULT_WEBM_TYPE to
 media manager

The reason for this is to avoid defining this twice as we were
previously (once in the template, once in video/models.py)

This commit sponsored by Roland McIntosh.  Thank you!
---
 mediagoblin/media_types/video/__init__.py                   | 1 +
 mediagoblin/media_types/video/models.py                     | 5 ++---
 mediagoblin/templates/mediagoblin/media_displays/video.html | 2 +-
 3 files changed, 4 insertions(+), 4 deletions(-)

diff --git a/mediagoblin/media_types/video/__init__.py b/mediagoblin/media_types/video/__init__.py
index fd364c02..fab601f6 100644
--- a/mediagoblin/media_types/video/__init__.py
+++ b/mediagoblin/media_types/video/__init__.py
@@ -30,4 +30,5 @@ MEDIA_MANAGER = {
 
     # Used by the media_entry.get_display_media method
     "media_fetch_order": [u'webm_640', u'original'],
+    "default_webm_type": 'video/webm; codecs="vp8, vorbis"',
 }
diff --git a/mediagoblin/media_types/video/models.py b/mediagoblin/media_types/video/models.py
index 4639b8c8..970ceb75 100644
--- a/mediagoblin/media_types/video/models.py
+++ b/mediagoblin/media_types/video/models.py
@@ -21,13 +21,12 @@ from sqlalchemy import (
     Column, Integer, SmallInteger, ForeignKey)
 from sqlalchemy.orm import relationship, backref
 from mediagoblin.db.extratypes import JSONEncoded
+from mediagoblin.media_types import video
 
 
 BACKREF_NAME = "video__media_data"
 
 
-DEFAULT_WEBM_TYPE = 'video/webm; codecs="vp8, vorbis"'
-
 class VideoData(Base):
     """
     Attributes:
@@ -84,7 +83,7 @@ class VideoData(Base):
                 orig_metadata["tags"]["video-codec"].lower(),
                 orig_metadata["tags"]["audio-codec"].lower())
         else:
-            return DEFAULT_WEBM_TYPE
+            return video.MEDIA_MANAGER["default_webm_type"]
 
 
 DATA_MODEL = VideoData
diff --git a/mediagoblin/templates/mediagoblin/media_displays/video.html b/mediagoblin/templates/mediagoblin/media_displays/video.html
index dc0c7b55..b0854c9f 100644
--- a/mediagoblin/templates/mediagoblin/media_displays/video.html
+++ b/mediagoblin/templates/mediagoblin/media_displays/video.html
@@ -38,7 +38,7 @@
             {% if media.media_data %}
               type="{{ media.media_data.source_type() }}"
             {% else %}
-              type="video/webm; codecs=&quot;vp8, vorbis&quot;"
+              type="{{ media.media_manager['default_webm_type'] }}"
             {% endif %} />
     <div class="no_html5">
       {%- trans -%}Sorry, this video will not work because

From 4f239ff19418a48fa4d369efb005abfc09593359 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 14:29:30 -0600
Subject: [PATCH 10/16] Another elrond suggestion: only init orig_metadata if
 there's anything in the dict.

This commit sponsored by Joshua Rosen.  Thank you!
---
 mediagoblin/media_types/video/processing.py | 6 ++++--
 1 file changed, 4 insertions(+), 2 deletions(-)

diff --git a/mediagoblin/media_types/video/processing.py b/mediagoblin/media_types/video/processing.py
index ec9ff225..3da19a08 100644
--- a/mediagoblin/media_types/video/processing.py
+++ b/mediagoblin/media_types/video/processing.py
@@ -178,5 +178,7 @@ def store_metadata(media_entry, metadata):
         videorate = metadata["videorate"]
         stored_metadata["videorate"] = [videorate.num, videorate.denom]
 
-    media_entry.media_data_init(
-        orig_metadata=stored_metadata)
+    # Only save this field if there's something to save
+    if len(stored_metadata):
+        media_entry.media_data_init(
+            orig_metadata=stored_metadata)

From e77df64fd17adc57121176898e14ea21693489c5 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 15:40:49 -0600
Subject: [PATCH 11/16] No reason really to pass in fetch_order anyway...

I think this is legacy code from get_display_media being a utility, or
something.  Removed!  (Thanks for pointing this out, Elrond!)

This commit sponsored by Tristan Chambers.  Thank you!
---
 mediagoblin/db/mixin.py | 12 +++++-------
 1 file changed, 5 insertions(+), 7 deletions(-)

diff --git a/mediagoblin/db/mixin.py b/mediagoblin/db/mixin.py
index c4bd806c..92834a72 100644
--- a/mediagoblin/db/mixin.py
+++ b/mediagoblin/db/mixin.py
@@ -126,18 +126,16 @@ class MediaEntryMixin(object):
         """
         return cleaned_markdown_conversion(self.description)
 
-    def get_display_media(self, fetch_order=None):
-        """
-        Find the best media for display.
+    def get_display_media(self):
+        """Find the best media for display.
 
-        Args:
-        - fetch_order: the order we should try fetching images in.
-            If this isn't supplied, we try checking
-            self.media_data.fetching_order if it exists.
+        We try checking self.media_data.fetching_order if it exists to
+        pull down the order.
 
         Returns:
           (media_size, media_path)
           or, if not found, None.
+
         """
         fetch_order = self.media_manager.get("media_fetch_order")
 

From 5302477671e4ef65e35baa1e5b868c4dae4a35c7 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Sun, 3 Mar 2013 16:28:16 -0600
Subject: [PATCH 12/16] self.media_data->self.media_manager in the docstring. 
 Thanks for catching, Elrond.

This commit sponsored by Sebastian Hugentobler.  Thank you!
---
 mediagoblin/db/mixin.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/mediagoblin/db/mixin.py b/mediagoblin/db/mixin.py
index 92834a72..fdf61e8d 100644
--- a/mediagoblin/db/mixin.py
+++ b/mediagoblin/db/mixin.py
@@ -129,7 +129,7 @@ class MediaEntryMixin(object):
     def get_display_media(self):
         """Find the best media for display.
 
-        We try checking self.media_data.fetching_order if it exists to
+        We check self.media_manager for a "media_fetch_order" entry to
         pull down the order.
 
         Returns:

From 17e4679ddc4b6ee6d2be5a5e55ba9d314e5a1a42 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Mon, 4 Mar 2013 10:12:48 -0600
Subject: [PATCH 13/16] Three fixes to collection adding view, one of them a
 serious security bug

 - Prevent people who aren't the authors of a collection from adding
   things to it (handled by forcing the user check in the query)
 - fixed the redirect URL used when an invalid collection is selected
 - collection_item.author doesn't yet exist; removing the selection
   (we might want multiple people to be able to edit a collection in
   the future but that future does not yet exist; as Elrond said,
   remove this "false hope")

Thanks to Elrond for pointing out these issues.

And thanks to David Kindler for sponsoring this commit!
---
 mediagoblin/user_pages/views.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/mediagoblin/user_pages/views.py b/mediagoblin/user_pages/views.py
index 69d7defb..80919d47 100644
--- a/mediagoblin/user_pages/views.py
+++ b/mediagoblin/user_pages/views.py
@@ -227,7 +227,8 @@ def media_collect(request, media):
     # Otherwise, use the collection selected from the drop-down
     else:
         collection = Collection.query.filter_by(
-            id=request.form.get('collection')).first()
+            id=request.form.get('collection'),
+            creator=request.user.id).first()
 
     # Make sure the user actually selected a collection
     if not collection:
@@ -236,7 +237,7 @@ def media_collect(request, media):
             _('You have to select or add a collection'))
         return redirect(request, "mediagoblin.user_pages.media_collect",
                     user=media.get_uploader.username,
-                    media=media.id)
+                    media_id=media.id)
 
 
     # Check whether media already exists in collection
@@ -250,7 +251,6 @@ def media_collect(request, media):
         collection_item = request.db.CollectionItem()
         collection_item.collection = collection.id
         collection_item.media_entry = media.id
-        collection_item.author = request.user.id
         collection_item.note = request.form['note']
         collection_item.save()
 

From 7e4a87dca5c8afa13b64f76c4b9ce440d38a91b5 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Mon, 4 Mar 2013 10:57:21 -0600
Subject: [PATCH 14/16] Give a more useful error if a table already exists and
 so we can't create it during migrations

This commit sponsored by Andrzej Prochyra.  Thanks!
---
 mediagoblin/db/migration_tools.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/mediagoblin/db/migration_tools.py b/mediagoblin/db/migration_tools.py
index e5380a3b..c0c7e998 100644
--- a/mediagoblin/db/migration_tools.py
+++ b/mediagoblin/db/migration_tools.py
@@ -17,6 +17,9 @@
 from mediagoblin.tools.common import simple_printer
 from sqlalchemy import Table
 
+class TableAlreadyExists(Exception):
+    pass
+
 
 class MigrationManager(object):
     """
@@ -128,7 +131,10 @@ class MigrationManager(object):
         # sanity check before we proceed, none of these should be created
         for model in self.models:
             # Maybe in the future just print out a "Yikes!" or something?
-            assert not model.__table__.exists(self.session.bind)
+            if model.__table__.exists(self.session.bind):
+                raise TableAlreadyExists(
+                    u"Intended to create table '%s' but it already exists" %
+                    model.__table__.name)
 
         self.migration_model.metadata.create_all(
             self.session.bind,

From e9b69c7d0eb00426ee06e4d83f8e1841b421deb2 Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Mon, 4 Mar 2013 11:45:14 -0600
Subject: [PATCH 15/16] Elrond points out that we should use
 form.collection.data

That's true; I'm not sure what it's fixing, but he thinks it's fixing
something.  Anyway, it's correct :)

This commit sponsored by Philippe Gauthier.  Thanks!
---
 mediagoblin/user_pages/views.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/mediagoblin/user_pages/views.py b/mediagoblin/user_pages/views.py
index 80919d47..dc562084 100644
--- a/mediagoblin/user_pages/views.py
+++ b/mediagoblin/user_pages/views.py
@@ -227,7 +227,7 @@ def media_collect(request, media):
     # Otherwise, use the collection selected from the drop-down
     else:
         collection = Collection.query.filter_by(
-            id=request.form.get('collection'),
+            id=form.collection.data,
             creator=request.user.id).first()
 
     # Make sure the user actually selected a collection

From f51a416778bc71ec373fac1cbfbf7df60815b68d Mon Sep 17 00:00:00 2001
From: Christopher Allan Webber <cwebber@dustycloud.org>
Date: Mon, 4 Mar 2013 11:53:04 -0600
Subject: [PATCH 16/16] Removing an unnecessary video write

If we're skipping transcoding, we don't need to copy
this file at all!

This commit sponsored by Frank Zambrini III.  Thanks!
---
 mediagoblin/media_types/video/processing.py | 3 ---
 1 file changed, 3 deletions(-)

diff --git a/mediagoblin/media_types/video/processing.py b/mediagoblin/media_types/video/processing.py
index 3da19a08..d6439b78 100644
--- a/mediagoblin/media_types/video/processing.py
+++ b/mediagoblin/media_types/video/processing.py
@@ -25,7 +25,6 @@ from mediagoblin.tools.translate import lazy_pass_to_ugettext as _
 from . import transcoders
 from .util import skip_transcode
 
-
 _log = logging.getLogger(__name__)
 _log.setLevel(logging.DEBUG)
 
@@ -94,8 +93,6 @@ def process_video(proc_state):
         # if we can skip it
         if skip_transcode(metadata):
             _log.debug('Skipping transcoding')
-            # Just push the submitted file to the tmp_dst
-            open(tmp_dst.name, 'wb').write(open(queued_filename, 'rb').read())
 
             dst_dimensions = metadata['videowidth'], metadata['videoheight']