Add parsing of overview content blob

eda70ad7 · Chris Dodge · 759898b8 · eda70ad7
Commit eda70ad7 authored Apr 17, 2014 by Chris Dodge
Hide whitespace changes
Inline Side-by-side

Showing with 32 additions and 12 deletions

lms/djangoapps/api_manager/courses_views.py
+32 -12

No files found.
--- a/lms/djangoapps/api_manager/courses_views.py
+++ b/lms/djangoapps/api_manager/courses_views.py
@@ -4,6 +4,7 @@ from django.contrib.auth.models import Group
 from django.core.exceptions import ObjectDoesNotExist
 from lxml import etree
 from StringIO import StringIO
+from collections import OrderedDict
 from rest_framework import status
 from rest_framework.decorators import api_view, permission_classes
@@ -315,18 +316,38 @@ def _parse_about_html(html):
    for section in sections:
        section_class = section.get('class')
        if section_class:
-            section_data = {}
+            section_data = OrderedDict()
-            section_data['name'] = section_class
+            section_data['class'] = section_class
-            section_data['articles'] = []
            articles = section.findall('article')
            if articles:
+                section_data['articles'] = []
                for article in articles:
                    article_class = article.get('class')
                    if article_class:
-                        article_data = {}
+                        article_data = OrderedDict()
-                        article_data['name'] = article_class
+                        article_data['class'] = article_class
-                        article_data['body'] = etree.tostring(article)
+                        if article_class == "teacher":
+                            name_element = article.find('h3')
+                            if name_element is not None:
+                                article_data['name'] = name_element.text
+                            image_element = article.find("./div[@class='teacher-image']/img")
+                            if image_element is not None:
+                                article_data['image_src'] = image_element.get('src')
+                            bios = article.findall('p')
+                            bio_html = ''
+                            for bio in bios:
+                                bio_html += etree.tostring(bio)
+                            if bio_html:
+                                article_data['bio'] = bio_html
+                        else:
+                            article_data['body'] = etree.tostring(article)
                        section_data['articles'].append(article_data)
            else:
                section_data['body'] = etree.tostring(section)
@@ -344,7 +365,7 @@ def course_about(request, course_id):
    naming convention {"_id.org":"i4x", "_id.course":<course_num>, "_id.category":"about", "_id.name":"overview"}
    """
    store = modulestore()
-    response_data = {}
+    response_data = OrderedDict()
    try:
        course_module = store.get_course(course_id)
@@ -352,12 +373,11 @@ def course_about(request, course_id):
            return Response({}, status=status.HTTP_404_NOT_FOUND)
        overview = get_course_about_section(course_module, 'overview')
-        short_description = get_course_about_section(course_module, 'short_description')
-        response_data['sections'] = _parse_about_html(overview)
+        if request.GET.get('parsed'):
+            response_data['sections'] = _parse_about_html(overview)
-        response_data['overview_html'] = overview
+        else:
-        response_data['short_description'] = short_description
+            response_data['overview_html'] = overview
    except InvalidLocationError:
        return Response({}, status=status.HTTP_404_NOT_FOUND)