Large in-progress checkin for filepicker integration.

author Seth Woodworth <seth@sethish.com>

Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)

committer Seth Woodworth <seth@sethish.com>

Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)
author Seth Woodworth <seth@sethish.com>
Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)
committer Seth Woodworth <seth@sethish.com>
Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)
diff --git a/karmaworld/apps/document_upload/forms.py b/karmaworld/apps/document_upload/forms.py

index ae790c958d62618e4e8783a3d57759d1dc08f5ae..1484367a7d6dae1fee96615cab9991a6817fc0a3 100644 (file)
--- a/karmaworld/apps/document_upload/forms.py
+++ b/karmaworld/apps/document_upload/forms.py
@@ -9,4 +9,4 @@ from karmaworld.apps.document_upload.models import RawDocument
  class RawDocumentForm(ModelForm):
      class Meta:
          model = RawDocument
-        fields = ('name', 'tags', 'course', 'fp_file')
+        fields = ('name', 'tags', 'course', 'fp_file', 'mimetype')
diff --git a/karmaworld/apps/document_upload/models.py b/karmaworld/apps/document_upload/models.py

index 766698ec67eedc4370fe9e20eda530d291eba6cb..876ee41d7f710f1045466fa9709eb425be77150f 100644 (file)
--- a/karmaworld/apps/document_upload/models.py
+++ b/karmaworld/apps/document_upload/models.py
@@ -25,6 +25,7 @@ class RawDocument(Document):
  
      def convert_to_note(self):
          """ polymorph this object into a note.models.Note object  """
+        print "begin convert_to_note"
          note = Note(
                  course=self.course,
                  name=self.name,
@@ -35,9 +36,13 @@ class RawDocument(Document):
          note.save()
          for tag in self.tags.all():
              note.tags.add(tag)
+        print "finish convert_to_note"
          return note
  
      def save(self, *args, **kwargs):
-        if not is_processed:
-            tasks.process_raw_document(self)
+        print "`RawDocument.save()`"
          super(RawDocument, self).save(*args, **kwargs)
+        if not self.is_processed:
+            print "\t document not processed yet, doing that now"
+            tasks.process_raw_document.delay(self)
+            print "\t this arrow should point to the word now ^"
diff --git a/karmaworld/apps/document_upload/tasks.py b/karmaworld/apps/document_upload/tasks.py

index df7021ea96df7a3d4c3f07a80b25280ab5165ad0..e8630859915f46456fb2594b6c7c54342f4af854 100644 (file)
--- a/karmaworld/apps/document_upload/tasks.py
+++ b/karmaworld/apps/document_upload/tasks.py
@@ -2,11 +2,15 @@
  # -*- coding:utf8 -*-
  # Copyright (C) 2013  FinalsClub Foundation
  
-from celery.task import task
-from karmaworld.apps.notes.gdrive import convert_with_google_drive
+from celery import Celery
+from celery import task
+from karmaworld.apps.notes.gdrive import convert_raw_document
  
-@task
+#@Celery.task()
+@task()
  def process_raw_document(raw_document):
      """ Process a RawDocument instance in to a Note instance """
+    print "="*80
+    print "this line should be deferred and only printed by celery"
      convert_raw_document(raw_document)
  
diff --git a/karmaworld/apps/document_upload/views.py b/karmaworld/apps/document_upload/views.py

index 4352ed263f499d2f0165c4384865dee84e9db289..a72d271d910c3c48259d0147c10dc465832c5ead 100644 (file)
--- a/karmaworld/apps/document_upload/views.py
+++ b/karmaworld/apps/document_upload/views.py
@@ -13,11 +13,26 @@ from karmaworld.apps.document_upload.models import RawDocument
  from karmaworld.apps.document_upload.forms import RawDocumentForm
  
  def save_fp_upload(request):
+    """ ajax endpoint for saving a FilePicker uploaded file form
+    """
      r_d_f = RawDocumentForm(request.POST)
      if r_d_f.is_valid():
-        model_instance = r_d_f.save(commit=False)
-        model_instance.uploaded_at = datetime.datetime.utcnow()
-        model_instance.save()
+        raw_document = r_d_f.save(commit=False)
+
+        print request.POST.keys()
+        time_a = datetime.datetime.now()
+        raw_document.fp_file = request.POST['fp_file']
+
+        time_b = datetime.datetime.now()
+        delta = time_b - time_a
+        raw_document.ip = request.META['REMOTE_ADDR']
+        raw_document.uploaded_at = datetime.datetime.utcnow()
+        time_c = datetime.datetime.now()
+        # note that .save() has the side-effect of kicking of a celery processing task
+        raw_document.save()
+        time_d = datetime.datetime.now()
+        delta = time_d - time_c
+        print "d\t%s" % delta
          return HttpResponse({'success'})
      else:
          return HttpResponse(r_d_f.errors, status=400)
diff --git a/karmaworld/apps/notes/gdrive.py b/karmaworld/apps/notes/gdrive.py

index 105516bf7c378135a09b1a659ffa62894a2f0eeb..5b8760e0c14ceafcff784abda7ee630a7936c269 100644 (file)
--- a/karmaworld/apps/notes/gdrive.py
+++ b/karmaworld/apps/notes/gdrive.py
@@ -11,6 +11,7 @@ import time
  import httplib2
  from apiclient.discovery import build
  from apiclient.http import MediaFileUpload
+from apiclient.http import MediaInMemoryUpload
  from django.conf import settings
  from django.core.files import File
  from oauth2client.client import flow_from_clientsecrets
@@ -27,6 +28,8 @@ except:
  
  EXT_TO_MIME = {'.docx': 'application/msword'}
  
+PPT_MIMETYPES = ['application/vnd.ms-powerpoint', 'application/vnd.openxmlformats-officedocument.presentationml.presentation']
+
  def build_flow():
      """ Create an oauth2 autentication object with our preferred details """
      scopes = [
@@ -84,12 +87,16 @@ def check_and_refresh(creds, auth):
          auth.save()
      return creds, auth
  
-def download_from_gdrive(file_dict, http, extension):
+def download_from_gdrive(file_dict, http, extension=None, mimetype=None):
      """ get urls from file_dict and download contextual files from google """
      download_urls = {}
      download_urls['text'] = file_dict[u'exportLinks']['text/plain']
  
-    if extension.lower() in ['.ppt', 'pptx']:
+    if extension:
+        extension = extension.lower()
+
+    if extension in ['.ppt', 'pptx'] \
+        or mimetype in PPT_MIMETYPES:
          download_urls['pdf'] = file_dict[u'exportLinks']['application/pdf']
      else:
          download_urls['html'] = file_dict[u'exportLinks']['text/html']
@@ -109,11 +116,19 @@ def download_from_gdrive(file_dict, http, extension):
  
      return content_dict
  
-def upload_to_gdrive(service, media, filename, extension):
+def upload_to_gdrive(service, media, filename, extension=None, mimetype=None):
      """ take a gdrive service object, and a media wrapper and upload to gdrive
-        returns a file_dict """
+        returns a file_dict
+        You must provide an `extension` or `mimetype`
+    """
      _resource = {'title': filename}
-    if extension.lower() in ['.pdf', '.jpeg', '.jpg', '.png']:
+
+    # clean up extensions for type checking
+    if extension:
+        extension = extension.lower()
+
+    if extension in ['.pdf', '.jpeg', '.jpg', '.png'] \
+        or mimetype in ['application/pdf']:
          # include OCR on ocr-able files
          file_dict = service.files().insert(body=_resource, media_body=media, convert=True, ocr=True).execute()
  
@@ -206,17 +221,23 @@ def convert_with_google_drive(note):
  
  def convert_raw_document(raw_document):
      """ Upload a raw document to google drive and get a Note back """
+    fp_file = raw_document.get_file()
  
+    # download the file to memory
      # get the file's mimetype
-    file_type, _ = mimetypes=guess_type(raw_document.fp_file.path)
+    #file_type, _ = mimetypes.guess_type(raw_document.fp_file.path)
      # get the file extension
-    filename, extension = os.path.splitext(raw_document.fp_file.path)
-
-    if file_type == None:
-        media = MediaFileUpload(note.note_file.path,
+    #filename, extension = os.path.splitext(raw_document.fp_file.path)
+    filename = raw_document.name
+    print "this is the mimetype of the document to check:"
+    print raw_document.mimetype
+    print ""
+
+    if raw_document.mimetype == None:
+        media = MediaInMemoryUpload(fp_file.read(),
                      chunksize=1024*1024, resumable=True)
      else:
-        media = MediaFileUpload(note.note_file.path, mimetype=file_type,
+        media = MediaInMemoryUpload(fp_file.read(), mimetype=raw_document.mimetype,
                      chunksize=1024*1024, resumable=True)
  
      auth = DriveAuth.objects.filter(email=GOOGLE_USER).all()[0]
@@ -226,14 +247,18 @@ def convert_raw_document(raw_document):
      service, http = build_api_service(creds)
  
      # prepare the upload
-    file_dict = upload_to_gdrive(service, media, filename, extension)
-    content_dict = download_from_gdrive(file_dict, http, extension)
+    file_dict = upload_to_gdrive(service, media, filename, mimetype=raw_document.mimetype)
+    content_dict = download_from_gdrive(file_dict, http, mimetype=raw_document.mimetype)
+
+    # this should have already happened, lets see why it hasn't
+    raw_document.save()
  
      note = raw_document.convert_to_note()
-    if extension.lower() == '.pdf':
+
+    if raw_document.mimetype == 'application/pdf':
          note.file_type = 'pdf'
  
-    elif extension.lower() in ['.ppt', '.pptx']:
+    elif raw_document.mimetype in PPT_MIMETYPES:
          note.file_type = 'ppt'
          now = datetime.datetime.utcnow()
          # create a folder path to store the ppt > pdf file with year and month folders
diff --git a/karmaworld/apps/notes/models.py b/karmaworld/apps/notes/models.py

index b8ce9ce5d01d853b66f9aeb0babe43b84cb03d1a..63e3a9cbfc72823bc496db8f3d0bfd1bb716d065 100644 (file)
--- a/karmaworld/apps/notes/models.py
+++ b/karmaworld/apps/notes/models.py
@@ -7,8 +7,11 @@
      Contains only the minimum for handling files and their representation
  """
  import datetime
+import os
+import urllib
  
  from django.conf import settings
+from django.core.files import File
  from django.core.files.storage import FileSystemStorage
  from django.db import models
  from django.template import defaultfilters
@@ -57,8 +60,10 @@ class Document(models.Model):
  
      fp_file = django_filepicker.models.FPFileField(
              upload_to=_choose_upload_to,
+            storage=fs,                 \
              null=True, blank=True,
              help_text=u"An uploaded file reference from Filepicker.io")
+    mimetype = models.CharField(max_length=255, blank=True, null=True)
  
      class Meta:
          abstract = True
@@ -78,6 +83,35 @@ class Document(models.Model):
                      self.uploaded_at.day, self.uploaded_at.microsecond)
          self.slug = _slug
  
+    def get_file(self):
+        """ Downloads the file from filepicker.io and returns a
+        Django File wrapper object """
+        # clean up any old downloads that are still hanging around
+        if hasattr(self, 'tempfile'):
+            self.tempfile.close()
+            delattr(self, 'tempfile')
+
+        if hasattr(self, 'filename'):
+            # the file might have been moved in the meantime so
+            # check first
+            if os.path.exists(self.filename):
+                os.remove(self.filename)
+            delattr(self, 'filename')
+
+        # The temporary file will be created in a directory set by the
+        # environment (TEMP_DIR, TEMP or TMP)
+        self.filename, header = urllib.urlretrieve(self.fp_file.name)
+        name = os.path.basename(self.filename)
+        disposition = header.get('Content-Disposition')
+        if disposition:
+            name = disposition.rpartition("filename=")[2].strip('" ')
+        filename = header.get('X-File-Name')
+        if filename:
+            name = filename
+
+        self.tempfile = open(self.filename, 'r')
+        return File(self.tempfile, name=name)
+
      def save(self, *args, **kwargs):
          if self.name and not self.slug:
              self._generate_unique_slug()
diff --git a/karmaworld/templates/partial/filepicker.html b/karmaworld/templates/partial/filepicker.html

index 4fc90f065d1b0c6b04f09e9ae1959f59054664b4..feaa9b96ecc962420131cd49c3d2e6e0ad923db9 100644 (file)
--- a/karmaworld/templates/partial/filepicker.html
+++ b/karmaworld/templates/partial/filepicker.html
@@ -47,6 +47,7 @@
          </div>
          <div class="hidden-fields" style="display:none;">
            <input type="text" id="id_fpfile" name="fpfile" class="fpurl">
+          <input type="text" id="id_mimetype" name="mimetype" class="mimetype">
            <input type="text" id="id_course" name="course" value="{{ course.id }}"
              class="course_id">
            {% csrf_token %}
@@ -68,11 +69,16 @@
         */
        makeFileForm = function(upFile) {
          var _form = document.getElementById('form-template').cloneNode(deep=true);
-        // FIXME: VVVVVV
+        // save the Filename to the form name field
          $(_form.children[0].children[0].children[1]).val(upFile.filename); // replace with upFile name
          _form.style.display = "inline";
          _form.id = null; // clear the unique id
+        // save the FP url to the form
          $(_form.children[0].children[2].children[0]).val(upFile.url);
+        console.log(upFile);
+        // save the mimetype to the form
+        $(_form.children[0].children[2].children[1]).val(upFile.mimetype);
+
          document.getElementById('forms_container').appendChild(_form);
        };
  
@@ -124,13 +130,16 @@
            }
        });
        $('#save-btn').on('click', function(e){
-        $('.inline-form').each(function(i,el){
+        e.stopPropagation();
+        $('#forms_container .inline-form').each(function(i,el){
+            console.log("inline form " + i + "el: " + el);
              var name, tags, fpurl, course;
              name = $(el).find('.intext').val();
              fp_file = $(el).find('.fpurl').val();
              tags = $(el).find('.taggit-tags').val();
              course = $(el).find('.course_id').val();
              csrf = $(el).find('.csrf').val();
+            mimetype = $(el).find('.mimetype').val();
  
              $.post('{% url 'upload_post' %}', {
                'name': name,
@@ -138,6 +147,7 @@
                'tags': tags,
                'course': course,
                'csrfmiddlewaretoken': csrf,
+              'mimetype': mimetype
              });
          });
        });
author	Seth Woodworth <seth@sethish.com>
	Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)
committer	Seth Woodworth <seth@sethish.com>
	Tue, 24 Sep 2013 13:53:16 +0000 (13:53 +0000)
karmaworld/apps/document_upload/forms.py		patch \| blob \| history
karmaworld/apps/document_upload/models.py		patch \| blob \| history
karmaworld/apps/document_upload/tasks.py		patch \| blob \| history
karmaworld/apps/document_upload/views.py		patch \| blob \| history
karmaworld/apps/notes/gdrive.py		patch \| blob \| history
karmaworld/apps/notes/models.py		patch \| blob \| history
karmaworld/templates/partial/filepicker.html		patch \| blob \| history