Commit 5a07f1f0 by Eric Fischer

Remove AI grading

This work was done in the context of a larger PR, so I'd be shocked if
this commit could be successfully reverted by itself. If you're trying
to restore AI grading, though, it's a good place to start.
parent 43aa53ea
aspell
g++
gcc
git
gfortran
libblas-dev
liblapack-dev
libatlas-base-dev
libfontconfig1
libmysqlclient-dev
libxml2-dev
libxslt1-dev
nodejs
npm
python2.7
python2.7-dev
python-mysqldb
python-pip
python-software-properties
rubygems
../openassessment/locale/
\ No newline at end of file
Log files:
apps_info.log = INFO level logging for all edx-ora2 apps and OpenAssessmentBlock
apps_debug.log = same as above, except DEBUG level
errors.log = all ERROR and CRITICAL logs, stack traces
events.log = Analytics events from the xblock-sdk workbench runtime's publish()
trace.log = The kitchen sink. Massive because of SQL debug logs from Django.
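These files come from Django's standard LOGGING (dictConfig) setting. Below is a minimal sketch of a configuration that would produce this layout; the handler, formatter, and path names are illustrative assumptions rather than the project's actual settings, and only three of the five files are spelled out.
LOGGING = {
    'version': 1,
    'disable_existing_loggers': False,
    'formatters': {
        'simple': {'format': '%(asctime)s %(levelname)s %(name)s %(message)s'},
    },
    'handlers': {
        # INFO and above for the edx-ora2 apps
        'apps_info': {
            'class': 'logging.FileHandler',
            'filename': 'logs/apps_info.log',
            'level': 'INFO',
            'formatter': 'simple',
        },
        # ERROR and CRITICAL only, including stack traces
        'errors': {
            'class': 'logging.FileHandler',
            'filename': 'logs/errors.log',
            'level': 'ERROR',
            'formatter': 'simple',
        },
        # The kitchen sink: everything, including SQL debug logs
        'trace': {
            'class': 'logging.FileHandler',
            'filename': 'logs/trace.log',
            'level': 'DEBUG',
            'formatter': 'simple',
        },
    },
    'loggers': {
        'openassessment': {
            'handlers': ['apps_info', 'errors', 'trace'],
            'level': 'DEBUG',
        },
        # Django's SQL debug logging ends up only in trace.log
        'django.db.backends': {
            'handlers': ['trace'],
            'level': 'DEBUG',
        },
    },
}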
"""
Errors related to AI assessment.
"""
from celery.exceptions import InvalidTaskError, NotConfigured, NotRegistered, QueueNotFound
from socket import error as socket_error
ANTICIPATED_CELERY_ERRORS = (InvalidTaskError, NotConfigured, NotRegistered, QueueNotFound, socket_error)
class AIError(Exception):
"""
A general error occurred while using the AI assessment API.
"""
pass
class AITrainingRequestError(AIError):
"""
There was a problem with the request sent to the AI assessment API.
"""
pass
class AITrainingInternalError(AIError):
"""
An unexpected error occurred while using the AI assessment API.
"""
pass
class AIGradingRequestError(AIError):
"""
There was a problem with the request sent to the AI assessment API.
"""
pass
class AIGradingInternalError(AIError):
"""
An unexpected error occurred while using the AI assessment API.
"""
pass
class AIReschedulingRequestError(AIError):
"""
There was a problem with the request sent to the AI assessment API.
"""
pass
class AIReschedulingInternalError(AIError):
"""
An unexpected error occurred while using the AI assessment API.
"""
pass
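The ANTICIPATED_CELERY_ERRORS tuple lets callers trap the known Celery and socket failures in one place and re-raise them as the API-level errors above. A minimal sketch of that pattern, with a hypothetical helper and an assumed import path (neither is part of this commit):
# Hypothetical caller: convert anticipated Celery scheduling failures into
# the API-level AIGradingInternalError defined above.
from openassessment.assessment.errors.ai import (  # assumed module path
    ANTICIPATED_CELERY_ERRORS, AIGradingInternalError
)


def schedule_grading_task(task, submission_uuid):
    """Schedule a Celery grading task, wrapping known scheduling failures."""
    try:
        task.apply_async(args=[submission_uuid])
    except ANTICIPATED_CELERY_ERRORS as ex:
        raise AIGradingInternalError(
            u"Could not schedule grading for submission {uuid}: {ex}".format(
                uuid=submission_uuid, ex=ex
            )
        )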
@@ -4,8 +4,6 @@ from __future__ import unicode_literals
from django.db import models, migrations
import django.utils.timezone
import django_extensions.db.fields
import openassessment.assessment.models.ai
class Migration(migrations.Migration):
@@ -15,54 +13,6 @@ class Migration(migrations.Migration):
operations = [
migrations.CreateModel(
name='AIClassifier',
fields=[
('id', models.AutoField(verbose_name='ID', serialize=False, auto_created=True, primary_key=True)),
('classifier_data', models.FileField(upload_to=openassessment.assessment.models.ai.upload_to_path)),
],
),
migrations.CreateModel(
name='AIClassifierSet',
fields=[
('id', models.AutoField(verbose_name='ID', serialize=False, auto_created=True, primary_key=True)),
('created_at', models.DateTimeField(default=django.utils.timezone.now, db_index=True)),
('algorithm_id', models.CharField(max_length=128, db_index=True)),
('course_id', models.CharField(max_length=40, db_index=True)),
('item_id', models.CharField(max_length=128, db_index=True)),
],
options={
'ordering': ['-created_at', '-id'],
},
),
migrations.CreateModel(
name='AIGradingWorkflow',
fields=[
('id', models.AutoField(verbose_name='ID', serialize=False, auto_created=True, primary_key=True)),
('uuid', django_extensions.db.fields.UUIDField(db_index=True, unique=True, version=1, editable=False, blank=True)),
('course_id', models.CharField(max_length=40, db_index=True)),
('item_id', models.CharField(max_length=128, db_index=True)),
('scheduled_at', models.DateTimeField(default=django.utils.timezone.now, db_index=True)),
('completed_at', models.DateTimeField(null=True, db_index=True)),
('algorithm_id', models.CharField(max_length=128, db_index=True)),
('submission_uuid', models.CharField(max_length=128, db_index=True)),
('essay_text', models.TextField(blank=True)),
('student_id', models.CharField(max_length=40, db_index=True)),
],
),
migrations.CreateModel(
name='AITrainingWorkflow',
fields=[
('id', models.AutoField(verbose_name='ID', serialize=False, auto_created=True, primary_key=True)),
('uuid', django_extensions.db.fields.UUIDField(db_index=True, unique=True, version=1, editable=False, blank=True)),
('course_id', models.CharField(max_length=40, db_index=True)),
('item_id', models.CharField(max_length=128, db_index=True)),
('scheduled_at', models.DateTimeField(default=django.utils.timezone.now, db_index=True)),
('completed_at', models.DateTimeField(null=True, db_index=True)),
('algorithm_id', models.CharField(max_length=128, db_index=True)),
('classifier_set', models.ForeignKey(related_name='+', default=None, to='assessment.AIClassifierSet', null=True)),
],
),
migrations.CreateModel(
name='Assessment',
fields=[
('id', models.AutoField(verbose_name='ID', serialize=False, auto_created=True, primary_key=True)),
@@ -235,41 +185,6 @@ class Migration(migrations.Migration):
name='rubric',
field=models.ForeignKey(to='assessment.Rubric'),
),
migrations.AddField(
model_name='aitrainingworkflow',
name='training_examples',
field=models.ManyToManyField(related_name='+', to='assessment.TrainingExample'),
),
migrations.AddField(
model_name='aigradingworkflow',
name='assessment',
field=models.ForeignKey(related_name='+', default=None, to='assessment.Assessment', null=True),
),
migrations.AddField(
model_name='aigradingworkflow',
name='classifier_set',
field=models.ForeignKey(related_name='+', default=None, to='assessment.AIClassifierSet', null=True),
),
migrations.AddField(
model_name='aigradingworkflow',
name='rubric',
field=models.ForeignKey(related_name='+', to='assessment.Rubric'),
),
migrations.AddField(
model_name='aiclassifierset',
name='rubric',
field=models.ForeignKey(related_name='+', to='assessment.Rubric'),
),
migrations.AddField(
model_name='aiclassifier',
name='classifier_set',
field=models.ForeignKey(related_name='classifiers', to='assessment.AIClassifierSet'),
),
migrations.AddField(
model_name='aiclassifier',
name='criterion',
field=models.ForeignKey(related_name='+', to='assessment.Criterion'),
),
migrations.AlterUniqueTogether(
name='studenttrainingworkflowitem',
unique_together=set([('workflow', 'order_num')]),
...
@@ -13,21 +13,6 @@ class Migration(migrations.Migration):
operations = [
migrations.AlterField(
model_name='aiclassifierset',
name='course_id',
field=models.CharField(max_length=255, db_index=True),
),
migrations.AlterField(
model_name='aigradingworkflow',
name='course_id',
field=models.CharField(max_length=255, db_index=True),
),
migrations.AlterField(
model_name='aitrainingworkflow',
name='course_id',
field=models.CharField(max_length=255, db_index=True),
),
migrations.AlterField(
model_name='peerworkflow',
name='course_id',
field=models.CharField(max_length=255, db_index=True),
...
"""
Celery looks for tasks in this module,
so import the tasks we want the workers to implement.
"""
# pylint:disable=W0611
from .worker.training import train_classifiers, reschedule_training_tasks
from .worker.grading import grade_essay, reschedule_grading_tasks
# coding=utf-8
"""
Tests for AI algorithm implementations.
"""
import unittest
import json
import mock
from openassessment.test_utils import CacheResetTest
from openassessment.assessment.worker.algorithm import (
AIAlgorithm, FakeAIAlgorithm, EaseAIAlgorithm,
TrainingError, InvalidClassifier
)
EXAMPLES = [
AIAlgorithm.ExampleEssay(u"Mine's a tale that can't be told, my ƒяєє∂σм I hold dear.", 2),
AIAlgorithm.ExampleEssay(u"How years ago in days of old, when 𝒎𝒂𝒈𝒊𝒄 filled th air.", 1),
AIAlgorithm.ExampleEssay(u"Ṫ'ẅäṡ in the darkest depths of Ṁöṛḋöṛ, I met a girl so fair.", 1),
AIAlgorithm.ExampleEssay(u"But goレレuᄊ, and the evil one crept up and slipped away with her", 0),
AIAlgorithm.ExampleEssay(u"", 4),
AIAlgorithm.ExampleEssay(u".!?", 4),
AIAlgorithm.ExampleEssay(u"no punctuation", 4),
AIAlgorithm.ExampleEssay(u"one", 4),
]
INPUT_ESSAYS = [
u"Good times, 𝑩𝒂𝒅 𝑻𝒊𝒎𝒆𝒔, you know I had my share",
u"When my woman left home for a 𝒃𝒓𝒐𝒘𝒏 𝒆𝒚𝒆𝒅 𝒎𝒂𝒏",
u"Well, I still don't seem to 𝒄𝒂𝒓𝒆",
u"",
u".!?",
u"no punctuation",
u"one",
]
class AIAlgorithmTest(CacheResetTest):
"""
Base class for testing AI algorithm implementations.
"""
ALGORITHM_CLASS = None
def setUp(self):
self.algorithm = self.ALGORITHM_CLASS() # pylint:disable=E1102
def _scores(self, classifier, input_essays):
"""
Use the classifier to score multiple input essays.
Args:
input_essays (list of unicode): The essays to score.
Returns:
list of int: The scores
"""
cache = {}
return [
self.algorithm.score(input_essay, classifier, cache)
for input_essay in input_essays
]
class FakeAIAlgorithmTest(AIAlgorithmTest):
"""
Test for the fake AI algorithm implementation.
"""
ALGORITHM_CLASS = FakeAIAlgorithm
def test_train_and_score(self):
classifier = self.algorithm.train_classifier(EXAMPLES)
expected_scores = [2, 0, 0, 0, 4, 2, 4]
scores = self._scores(classifier, INPUT_ESSAYS)
self.assertEqual(scores, expected_scores)
def test_score_classifier_missing_key(self):
with self.assertRaises(InvalidClassifier):
self.algorithm.score(u"Test input", {}, {})
def test_score_classifier_no_scores(self):
with self.assertRaises(InvalidClassifier):
self.algorithm.score(u"Test input", {'scores': []}, {})
# Try to import EASE -- if we can't, then skip the tests that require it
try:
import ease # pylint: disable=F0401,W0611
EASE_INSTALLED = True
except ImportError:
EASE_INSTALLED = False
@unittest.skipUnless(EASE_INSTALLED, "EASE library required")
class EaseAIAlgorithmTest(AIAlgorithmTest):
"""
Test for the EASE AI library wrapper.
"""
ALGORITHM_CLASS = EaseAIAlgorithm
def test_train_and_score(self):
classifier = self.algorithm.train_classifier(EXAMPLES)
scores = self._scores(classifier, INPUT_ESSAYS)
# Check that we got scores in the correct range
valid_scores = set(example.score for example in EXAMPLES)
for score in scores:
self.assertIn(score, valid_scores)
# Check that the scores are consistent when we re-run the algorithm
repeat_scores = self._scores(classifier, INPUT_ESSAYS)
self.assertEqual(scores, repeat_scores)
def test_all_examples_have_same_score(self):
examples = [
AIAlgorithm.ExampleEssay(u"Test ëṡṡäÿ", 1),
AIAlgorithm.ExampleEssay(u"Another test ëṡṡäÿ", 1),
]
# No assertion -- just verifying that this does not raise an exception
classifier = self.algorithm.train_classifier(examples)
self._scores(classifier, INPUT_ESSAYS)
def test_most_examples_have_same_score(self):
# All training examples have the same score except for one
examples = [
AIAlgorithm.ExampleEssay(u"Test ëṡṡäÿ", 1),
AIAlgorithm.ExampleEssay(u"Another test ëṡṡäÿ", 1),
AIAlgorithm.ExampleEssay(u"Different score", 0),
]
classifier = self.algorithm.train_classifier(examples)
scores = self._scores(classifier, INPUT_ESSAYS)
# Check that we got scores back.
# This is not a very rigorous assertion -- we're mainly
# checking that we got this far without an exception.
self.assertEqual(len(scores), len(INPUT_ESSAYS))
def test_no_examples(self):
with self.assertRaises(TrainingError):
self.algorithm.train_classifier([])
def test_json_serializable(self):
classifier = self.algorithm.train_classifier(EXAMPLES)
serialized = json.dumps(classifier)
deserialized = json.loads(serialized)
# This should not raise an exception
scores = self._scores(deserialized, INPUT_ESSAYS)
self.assertEqual(len(scores), len(INPUT_ESSAYS))
@mock.patch('openassessment.assessment.worker.algorithm.pickle')
def test_pickle_serialize_error(self, mock_pickle):
mock_pickle.dumps.side_effect = Exception("Test error!")
with self.assertRaises(TrainingError):
self.algorithm.train_classifier(EXAMPLES)
def test_pickle_deserialize_error(self):
classifier = self.algorithm.train_classifier(EXAMPLES)
with mock.patch('openassessment.assessment.worker.algorithm.pickle.loads') as mock_call:
mock_call.side_effect = Exception("Test error!")
with self.assertRaises(InvalidClassifier):
self.algorithm.score(u"Test ëṡṡäÿ", classifier, {})
def test_serialized_classifier_not_a_dict(self):
with self.assertRaises(InvalidClassifier):
self.algorithm.score(u"Test ëṡṡäÿ", "not a dict", {})
# coding=utf-8
"""
Test AI Django models.
"""
import copy
import ddt
from django.test import TestCase
from django.test.utils import override_settings
from openassessment.test_utils import CacheResetTest
from openassessment.assessment.models import (
AIClassifierSet, AIClassifier, AIGradingWorkflow, AI_CLASSIFIER_STORAGE,
CLASSIFIERS_CACHE_IN_MEM, essay_text_from_submission
)
from openassessment.assessment.serializers import rubric_from_dict
from .constants import RUBRIC
CLASSIFIERS_DICT = {
u"vøȼȺƀᵾłȺɍɏ": "test data",
u"ﻭɼค๓๓คɼ": "more test data"
}
COURSE_ID = u"†3߆ çøU®ß3"
ITEM_ID = u"fake_item_id"
@ddt.ddt
class DataConversionTest(TestCase):
@ddt.data(
(u'Answer', u'Answer'),
({'answer': {'text': u'Answer'}}, u'Answer'),
({'answer': {'parts': [{'text': u'Answer 1'}, {'text': u'Answer 2'}]}}, u'Answer 1\nAnswer 2')
)
@ddt.unpack
def test_essay_text_from_submission(self, input, output):
self.assertEqual(essay_text_from_submission(input), output)
class AIClassifierTest(CacheResetTest):
"""
Tests for the AIClassifier model.
"""
def test_upload_to_path_default(self):
# No path prefix provided in the settings
classifier = self._create_classifier()
components = classifier.classifier_data.name.split(u'/')
self.assertEqual(len(components), 2)
self.assertEqual(components[0], AI_CLASSIFIER_STORAGE)
self.assertGreater(len(components[1]), 0)
@override_settings(ORA2_FILE_PREFIX=u"ƒιℓє_ρяєƒιχ")
def test_upload_to_path_with_prefix(self):
classifier = self._create_classifier()
components = classifier.classifier_data.name.split(u'/')
self.assertEqual(len(components), 3)
self.assertEqual(components[0], u"ƒιℓє_ρяєƒιχ")
self.assertEqual(components[1], AI_CLASSIFIER_STORAGE)
self.assertGreater(len(components[2]), 0)
def _create_classifier(self):
"""
Create and return an AIClassifier.
"""
rubric = rubric_from_dict(RUBRIC)
classifier_set = AIClassifierSet.create_classifier_set(
CLASSIFIERS_DICT, rubric, "test_algorithm", COURSE_ID, ITEM_ID
)
return AIClassifier.objects.filter(classifier_set=classifier_set)[0]
class AIClassifierSetTest(CacheResetTest):
"""
Tests for the AIClassifierSet model.
"""
def setUp(self):
super(AIClassifierSetTest, self).setUp()
rubric = rubric_from_dict(RUBRIC)
self.classifier_set = AIClassifierSet.create_classifier_set(
CLASSIFIERS_DICT, rubric, "test_algorithm", COURSE_ID, ITEM_ID
)
def test_cache_downloads(self):
# Retrieve the classifier dict twice, which should hit the caching code.
# We can check that we're using the cache by asserting that
# the number of database queries decreases.
with self.assertNumQueries(1):
first = self.classifier_set.classifier_data_by_criterion
with self.assertNumQueries(0):
second = self.classifier_set.classifier_data_by_criterion
# Verify that we got the same value both times
self.assertEqual(first, second)
def test_file_cache_downloads(self):
# Retrieve the classifiers dict, which should be cached
# both in memory and on the file system
first = self.classifier_set.classifier_data_by_criterion
# Clear the in-memory cache
# This simulates what happens when a worker process dies
# after exceeding the maximum number of retries.
CLASSIFIERS_CACHE_IN_MEM.clear()
# We should still be able to retrieve the classifiers dict
# from the on-disk cache, even if memory has been cleared
with self.assertNumQueries(0):
second = self.classifier_set.classifier_data_by_criterion
# Verify that we got the correct classifiers dict back
self.assertEqual(first, second)
class AIGradingWorkflowTest(CacheResetTest):
"""
Tests for the AIGradingWorkflow model.
"""
CLASSIFIERS_DICT = {
u"vøȼȺƀᵾłȺɍɏ": "test data",
u"ﻭɼค๓๓คɼ": "more test data"
}
COURSE_ID = u"test"
ITEM_ID = u"test"
ALGORITHM_ID = "test"
def setUp(self):
"""
Create a new grading workflow.
"""
self.rubric = rubric_from_dict(RUBRIC)
self.workflow = AIGradingWorkflow.objects.create(
submission_uuid='test', essay_text='test',
rubric=self.rubric, algorithm_id=self.ALGORITHM_ID,
item_id=self.ITEM_ID, course_id=self.COURSE_ID
)
# Create a rubric with a similar structure, but different prompt
similar_rubric_dict = copy.deepcopy(RUBRIC)
similar_rubric_dict['prompts'] = [{"description": 'Different prompt!'}]
self.similar_rubric = rubric_from_dict(similar_rubric_dict)
def test_assign_most_recent_classifier_set(self):
# No classifier sets are available
found = self.workflow.assign_most_recent_classifier_set()
self.assertFalse(found)
self.assertIs(self.workflow.classifier_set, None)
# Same rubric (exact), but different course id
classifier_set = AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.rubric, self.ALGORITHM_ID,
"different course!", self.ITEM_ID
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
# Same rubric (exact) but different item id
classifier_set = AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.rubric, self.ALGORITHM_ID,
self.COURSE_ID, "different item!"
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
# Same rubric (exact), but different algorithm id
# Shouldn't change, since the algorithm ID doesn't match
AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.rubric, "different algorithm!",
self.COURSE_ID, self.ITEM_ID
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
# Same rubric *structure*, but in a different item
# Shouldn't change, since the rubric isn't an exact match.
AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.similar_rubric, self.ALGORITHM_ID,
self.COURSE_ID, "different item!"
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
# Same rubric *structure* AND in the same course/item
# This should replace our current classifier set
classifier_set = AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.similar_rubric, self.ALGORITHM_ID,
self.COURSE_ID, self.ITEM_ID
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
# Same rubric and same course/item
# This is the ideal, so we should always prefer it
classifier_set = AIClassifierSet.create_classifier_set(
self.CLASSIFIERS_DICT, self.rubric, self.ALGORITHM_ID,
self.COURSE_ID, self.ITEM_ID
)
found = self.workflow.assign_most_recent_classifier_set()
self.assertTrue(found)
self.assertEqual(classifier_set.pk, self.workflow.classifier_set.pk)
"""
Measures the time taken by the
find_active_assessments,
get_submission_for_review, and
get_submission_for_over_grading
methods for a particular set of workflows.
"""
import random
import datetime
from django.core.management.base import BaseCommand
from openassessment.assessment.models import PeerWorkflow
class Command(BaseCommand):
"""
Note the time taken by queries.
"""
help = ("Test the performance for "
"find_active_assessments, "
"get_submission_for_review & "
"get_submission_for_over_grading"
"methods.")
def __init__(self, *args, **kwargs):
super(Command, self).__init__(*args, **kwargs)
def handle(self, *args, **options):
"""
Execute the command.
Args:
None
"""
peer_workflow_count = PeerWorkflow.objects.filter(submission_uuid__isnull=False).count()
peer_workflow_ids = [random.randint(1, peer_workflow_count) for num in range(100)]
peer_workflows = list(PeerWorkflow.objects.filter(id__in=peer_workflow_ids))
pw_dt_before = datetime.datetime.now()
for peer_workflow in peer_workflows:
peer_workflow.find_active_assessments()
pw_dt_after = datetime.datetime.now()
time_taken = pw_dt_after - pw_dt_before
print "Time taken by (find_active_assessments) method Is: %s " % time_taken
#### get_submission_for_review ####
pw_dt_before = datetime.datetime.now()
for peer_workflow in peer_workflows:
peer_workflow.get_submission_for_review(2)
pw_dt_after = datetime.datetime.now()
time_taken = pw_dt_after - pw_dt_before
print "Time taken by (get_submission_for_review) method Is: %s " % time_taken
#### get_submission_for_over_grading ####
pw_dt_before = datetime.datetime.now()
for peer_workflow in peer_workflows:
peer_workflow.get_submission_for_over_grading()
pw_dt_after = datetime.datetime.now()
time_taken = pw_dt_after - pw_dt_before
print "Time taken by (get_submission_for_over_grading) method Is: %s " % time_taken
# -*- coding: utf-8 -*-
"""
Simulate failure of the worker AI grading tasks.
When the workers fail to successfully complete AI grading,
the AI grading workflow in the database will never be marked complete.
To simulate the error condition, therefore, we create incomplete
AI grading workflows without scheduling a grading task.
To recover, a staff member can reschedule incomplete grading tasks.
"""
from django.core.management.base import BaseCommand, CommandError
from submissions import api as sub_api
from openassessment.assessment.models import AIGradingWorkflow, AIClassifierSet
from openassessment.assessment.serializers import rubric_from_dict
from openassessment.assessment.worker.algorithm import AIAlgorithm
class Command(BaseCommand):
"""
Create submissions and AI incomplete grading workflows.
"""
help = (
u"Simulate failure of the worker AI grading tasks "
u"by creating incomplete AI grading workflows in the database."
)
args = '<COURSE_ID> <PROBLEM_ID> <NUM_SUBMISSIONS> <ALGORITHM_ID>'
RUBRIC_OPTIONS = [
{
"order_num": 0,
"name": u"poor",
"explanation": u"Poor job!",
"points": 0,
},
{
"order_num": 1,
"name": u"good",
"explanation": u"Good job!",
"points": 1,
}
]
RUBRIC = {
'prompts': [{"description": u"Test prompt"}],
'criteria': [
{
"order_num": 0,
"name": u"vocabulary",
"prompt": u"Vocabulary",
"options": RUBRIC_OPTIONS
},
{
"order_num": 1,
"name": u"grammar",
"prompt": u"Grammar",
"options": RUBRIC_OPTIONS
}
]
}
EXAMPLES = {
"vocabulary": [
AIAlgorithm.ExampleEssay(
text=u"World Food Day is celebrated every year around the world on 16 October in honor "
u"of the date of the founding of the Food and Agriculture "
u"Organization of the United Nations in 1945.",
score=0
),
AIAlgorithm.ExampleEssay(
text=u"Since 1981, World Food Day has adopted a different theme each year "
u"in order to highlight areas needed for action and provide a common focus.",
score=1
),
],
"grammar": [
AIAlgorithm.ExampleEssay(
text=u"Most of the themes revolve around agriculture because only investment in agriculture ",
score=0
),
AIAlgorithm.ExampleEssay(
text=u"In spite of the importance of agriculture as the driving force "
u"in the economies of many developing countries, this "
u"vital sector is frequently starved of investment.",
score=1
)
]
}
STUDENT_ID = u'test_student'
ANSWER = {"text": 'test answer'}
def handle(self, *args, **options):
"""
Execute the command.
Args:
course_id (unicode): The ID of the course to create submissions/workflows in.
item_id (unicode): The ID of the problem in the course.
num_submissions (int): The number of submissions/workflows to create.
algorithm_id (unicode): The ID of the ML algorithm to use ("fake" or "ease")
Raises:
CommandError
"""
if len(args) < 4:
raise CommandError(u"Usage: simulate_ai_grading_error {}".format(self.args))
# Parse arguments
course_id = args[0].decode('utf-8')
item_id = args[1].decode('utf-8')
num_submissions = int(args[2])
algorithm_id = args[3].decode('utf-8')
# Create the rubric model
rubric = rubric_from_dict(self.RUBRIC)
# Train classifiers
print u"Training classifiers using {algorithm_id}...".format(algorithm_id=algorithm_id)
algorithm = AIAlgorithm.algorithm_for_id(algorithm_id)
classifier_data = {
criterion_name: algorithm.train_classifier(example)
for criterion_name, example in self.EXAMPLES.iteritems()
}
print u"Successfully trained classifiers."
# Create the classifier set
classifier_set = AIClassifierSet.create_classifier_set(
classifier_data, rubric, algorithm_id, course_id, item_id
)
print u"Successfully created classifier set with id {}".format(classifier_set.pk)
# Create submissions and grading workflows
for num in range(num_submissions):
student_item = {
'course_id': course_id,
'item_id': item_id,
'item_type': 'openassessment',
'student_id': "{base}_{num}".format(base=self.STUDENT_ID, num=num)
}
submission = sub_api.create_submission(student_item, self.ANSWER)
workflow = AIGradingWorkflow.start_workflow(
submission['uuid'], self.RUBRIC, algorithm_id
)
workflow.classifier_set = classifier_set
workflow.save()
print u"{num}: Created incomplete grading workflow with UUID {uuid}".format(
num=num, uuid=workflow.uuid
)
# -*- coding: utf-8 -*-
"""
Tests for the simulate AI grading error management command.
"""
from django.test.utils import override_settings
from openassessment.test_utils import CacheResetTest
from openassessment.management.commands import simulate_ai_grading_error
from openassessment.assessment.models import AIGradingWorkflow
from openassessment.assessment.worker.grading import grade_essay
class SimulateAIGradingErrorTest(CacheResetTest):
"""
Tests for the simulate AI grading error management command.
"""
COURSE_ID = u"TɘꙅT ↄoUᴙꙅɘ"
ITEM_ID = u"𝖙𝖊𝖘𝖙 𝖎𝖙𝖊𝖒"
NUM_SUBMISSIONS = 20
AI_ALGORITHMS = {
"fake": "openassessment.assessment.worker.algorithm.FakeAIAlgorithm"
}
@override_settings(ORA2_AI_ALGORITHMS=AI_ALGORITHMS)
def test_simulate_ai_grading_error(self):
# Run the command
cmd = simulate_ai_grading_error.Command()
cmd.handle(
self.COURSE_ID.encode('utf-8'),
self.ITEM_ID.encode('utf-8'),
self.NUM_SUBMISSIONS,
"fake"
)
# Check that the correct number of incomplete workflows
# were created. These workflows should still have
# a classifier set, though, because otherwise they
# wouldn't have been scheduled for grading
# (that is, the submissions were made before classifier
# training completed).
incomplete_workflows = AIGradingWorkflow.objects.filter(
classifier_set__isnull=False,
completed_at__isnull=True
)
num_errors = incomplete_workflows.count()
self.assertEqual(self.NUM_SUBMISSIONS, num_errors)
# Verify that we can complete the workflows successfully
# (that is, make sure the classifier data is valid)
# We're calling a Celery task method here,
# but we're NOT using `apply_async`, so this will
# execute synchronously.
for workflow in incomplete_workflows:
grade_essay(workflow.uuid)
# Now there should be no incomplete workflows
remaining_incomplete = AIGradingWorkflow.objects.filter(
classifier_set__isnull=False,
completed_at__isnull=True
).count()
self.assertEqual(remaining_incomplete, 0)
{% load i18n %}
{% spaceless %}
<li class="openassessment_assessment_module_settings_editor" id="oa_ai_assessment_editor">
<div class="drag-handle action"></div>
<div class="openassessment_inclusion_wrapper">
<input id="include_ai_assessment" type="checkbox"
{% if assessments.example_based_assessment %} checked="true" {% endif %}>
<label for="include_ai_assessment">{% trans "Step: Example-Based Assessment" %}</label>
</div>
<div class="openassessment_assessment_module_editor">
<p id="ai_assessment_description_closed" class="openassessment_description_closed {% if assessments.example_based_assessment %} is--hidden {% endif %}">
{% trans "An algorithm assesses learners' responses by comparing the responses to pre-assessed sample responses that the instructor provides."%}
</p>
<div id="ai_assessment_settings_editor" class="assessment_settings_wrapper {% if not assessments.example_based_assessment %} is--hidden {% endif %}">
<p class="openassessment_description">
{% trans "Enter one or more sample responses that you've created, and then specify the options that you would choose for each criterion in your rubric. Note that you must add your rubric to the Rubric tab before you can complete this step." %}
</p>
<textarea id="ai_training_examples">{{ assessments.example_based_assessment.examples }}</textarea>
</div>
</div>
</li>
{% endspaceless %}
<openassessment>
<title>Example Based Example</title>
<assessments>
<assessment name="example-based-assessment" algorithm_id="fake">
<example>
<answer>Born in northern New South Wales, Dowling entered the Royal Australian Naval College in 1915. After graduating in 1919 he went to sea aboard various Royal Navy and RAN vessels, and later specialised in gunnery. In 1937, he was given command of the sloop HMAS Swan. Following the outbreak of World War II, he saw action in the Mediterranean theatre as executive officer of the Royal Navy cruiser HMS Naiad, and survived her sinking by a German U-boat in March 1942. Returning to Australia, he served as Director of Plans and later Deputy Chief of Naval Staff before taking command of the light cruiser HMAS Hobart in November 1944. His achievements in the South West Pacific earned him the Distinguished Service Order.
Dowling took command of the RAN's first aircraft carrier, HMAS Sydney, in 1948. He became Chief of Naval Personnel in 1950, and Flag Officer Commanding HM Australian Fleet in 1953. Soon after taking up the position of CNS in February 1955, he was promoted to vice admiral and appointed a Companion of the Order of the Bath. As CNS he had to deal with shortages of money, manpower and equipment, and with the increasing role of the United States in Australia's defence planning, at the expense of traditional ties with Britain. Knighted in 1957, Dowling was Chairman of COSC from March 1959 until May 1961, when he retired from the military. In 1963 he was appointed a Knight Commander of the Royal Victorian Order and became Australian Secretary to HM Queen Elizabeth II, serving until his death in 1969.
</answer>
<select criterion="Ideas" option="Bad" />
<select criterion="Content" option="Bad" />
</example>
<example>
<answer>Roy Russell Dowling was born on 28 May 1901 in Condong, a township on the Tweed River in northern New South Wales. His parents were sugar cane inspector Russell Dowling and his wife Lily. The youth entered the Royal Australian Naval College (RANC) at Jervis Bay, Federal Capital Territory, in 1915. An underachiever academically, he excelled at sports, and became chief cadet captain before graduating in 1918 with the King's Medal, awarded for "gentlemanly bearing, character, good influence among his fellows and officer-like qualities".[1][2] The following year he was posted to Britain as a midshipman, undergoing training with the Royal Navy and seeing service on HMS Ramillies and HMS Venturous.[3] By January 1923 he was back in Australia, serving aboard the cruiser HMAS Adelaide. He was promoted to lieutenant in March.[4] In April 1924, Adelaide joined the Royal Navy's Special Service Squadron on its worldwide cruise, taking in New Zealand, Canada, the United States, Panama, and the West Indies, before docking in September at Portsmouth, England. There Dowling left the ship for his next appointment, training as a gunnery officer and serving in that capacity at HMS Excellent.
</answer>
<select criterion="Ideas" option="Good" />
<select criterion="Content" option="Bad" />
</example>
<example>
<answer>After his return to Australia in December 1926, Dowling spent eighteen months on HMAS Platypus and HMAS Anzac, where he continued to specialise in gunnery. In July 1928, he took on an instructional role at the gunnery school in Flinders Naval Depot on Western Port Bay, Victoria. He married Jessie Blanch in Melbourne on 8 May 1930; the couple had two sons and three daughters.[1][6] Jessie accompanied him on his next posting to Britain commencing in January 1931.</answer>
<select criterion="Ideas" option="Bad" />
<select criterion="Content" option="Good" />
</example>
<example>
<answer>He was promoted to lieutenant commander on 15 March, and was appointed gunnery officer on the light cruiser HMS Colombo in May. Dowling returned to Australia in January 1933, and was appointed squadron gunnery officer aboard the heavy cruiser HMAS Canberra that April.[1][4] The ship operated mainly within Australian waters over the next two years.[7] In July 1935, Dowling took charge of the gunnery school at Flinders Naval Depot. He was promoted to commander on 31 December 1936.[1][4] The following month, he assumed command of the newly commissioned Grimsby-class sloop HMAS Swan, carrying out duties in the South West Pacific.[8] Completing his tenure on Swan in January 1939, he was briefly assigned to the Navy Office, Melbourne, before returning to Britain in March for duty at HMS Pembroke, where he awaited posting aboard the yet-to-be-commissioned anti-aircraft cruiser, HMS Naiad.</answer>
<select criterion="Ideas" option="Good" />
<select criterion="Content" option="Good" />
</example>
</assessment>
</assessments>
<rubric>
<prompt>
Censorship in the Libraries
'All of us can think of a book that we hope none of our children or any other children have taken off the shelf. But if I have the right to remove that book from the shelf -- that work I abhor -- then you also have exactly the same right and so does everyone else. And then we have no books left on the shelf for any of us.' --Katherine Paterson, Author
Write a persuasive essay to a newspaper reflecting your views on censorship in libraries. Do you believe that certain materials, such as books, music, movies, magazines, etc., should be removed from the shelves if they are found offensive? Support your position with convincing arguments from your own experience, observations, and/or reading.
Read for conciseness, clarity of thought, and form.
</prompt>
<criterion feedback="optional">
<name>Ideas</name>
<prompt>Determine if there is a unifying theme or main idea.</prompt>
<option points="0">
<name>Bad</name>
<explanation>Difficult for the reader to discern the main idea. Too brief or too repetitive to establish or maintain a focus.</explanation>
</option>
<option points="3">
<name>Good</name>
<explanation>Presents a unifying theme or main idea, but may include minor tangents. Stays somewhat focused on topic and task.</explanation>
</option>
</criterion>
<criterion>
<name>Content</name>
<prompt>Assess the content of the submission</prompt>
<option points="0">
<name>Bad</name>
<explanation>Includes little information with few or no details or unrelated details. Unsuccessful in attempts to explore any facets of the topic.</explanation>
</option>
<option points="1">
<name>Good</name>
<explanation>Includes little information and few or no details. Explores only one or two facets of the topic.</explanation>
</option>
</criterion>
<feedbackprompt>
(Optional) What aspects of this response stood out to you? What did it do well? How could it improve?
</feedbackprompt>
<feedback_default_text>
I noticed that this response...
</feedback_default_text>
</rubric>
</openassessment>
<openassessment>
<title>Open Assessment Test</title>
<prompts>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat poverty?</description>
</prompt>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat pollution?</description>
</prompt>
</prompts>
<rubric>
<criterion>
<name>Ideas</name>
<prompt>How good are the ideas?</prompt>
<option points="0">
<name>Poor</name>
<explanation>Poor job!</explanation>
</option>
<option points="1">
<name>Fair</name>
<explanation>Fair job</explanation>
</option>
<option points="3">
<name>Good</name>
<explanation>Good job</explanation>
</option>
</criterion>
<criterion>
<name>Content</name>
<prompt>How good is the content?</prompt>
<option points="0">
<name>Poor</name>
<explanation>Poor job!</explanation>
</option>
<option points="1">
<name>Fair</name>
<explanation>Fair job</explanation>
</option>
<option points="3">
<name>Good</name>
<explanation>Good job</explanation>
</option>
</criterion>
</rubric>
<assessments>
<assessment name="example-based-assessment" algorithm_id="fake">
<example>
<answer>Example Answer One</answer>
<select criterion="Ideas" option="Poor" />
<select criterion="Content" option="Poor" />
</example>
<example>
<answer>Example Answer Two</answer>
<select criterion="Ideas" option="Fair" />
<select criterion="Content" option="Fair" />
</example>
<example>
<answer>Example Answer Three</answer>
<select criterion="Ideas" option="Fair" />
<select criterion="Content" option="Good" />
</example>
<example>
<answer>Example Answer Four</answer>
<select criterion="Ideas" option="Poor" />
<select criterion="Content" option="Good" />
</example>
</assessment>
<assessment name="peer-assessment" must_grade="5" must_be_graded_by="3" />
<assessment name="self-assessment" />
</assessments>
</openassessment>
<openassessment>
<title>Open Assessment Test</title>
<prompts>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat poverty?</description>
</prompt>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat pollution?</description>
</prompt>
</prompts>
<rubric>
<criterion>
<name>Ideas</name>
<prompt>How good are the ideas?</prompt>
<option points="0">
<name>Poor</name>
<explanation>Poor job!</explanation>
</option>
<option points="1">
<name>Fair</name>
<explanation>Fair job</explanation>
</option>
<option points="3">
<name>Good</name>
<explanation>Good job</explanation>
</option>
</criterion>
<criterion>
<name>Content</name>
<prompt>How good is the content?</prompt>
<option points="0">
<name>Poor</name>
<explanation>Poor job!</explanation>
</option>
<option points="1">
<name>Fair</name>
<explanation>Fair job</explanation>
</option>
<option points="3">
<name>Good</name>
<explanation>Good job</explanation>
</option>
</criterion>
</rubric>
<assessments>
<assessment name="example-based-assessment" algorithm_id="fake">
<example>
<answer>Example Answer One</answer>
<select criterion="Ideas" option="Poor" />
<select criterion="Content" option="Poor" />
</example>
<example>
<answer>Example Answer Two</answer>
<select criterion="Ideas" option="Fair" />
<select criterion="Content" option="Fair" />
</example>
<example>
<answer>Example Answer Three</answer>
<select criterion="Ideas" option="Fair" />
<select criterion="Content" option="Good" />
</example>
<example>
<answer>Example Answer Four</answer>
<select criterion="Ideas" option="Poor" />
<select criterion="Content" option="Good" />
</example>
</assessment>
</assessments>
</openassessment>
<openassessment>
<title>Feedback only criterion</title>
<prompts>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat poverty?</description>
</prompt>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat pollution?</description>
</prompt>
</prompts>
<rubric>
<criterion>
<name>vocabulary</name>
<prompt>How good is the vocabulary?</prompt>
<option points="0">
<name>bad</name>
<explanation>bad</explanation>
</option>
<option points="1">
<name>good</name>
<explanation>good</explanation>
</option>
</criterion>
<criterion feedback="required">
<name>𝖋𝖊𝖊𝖉𝖇𝖆𝖈𝖐 𝖔𝖓𝖑𝖞</name>
<prompt>This criterion accepts only written feedback, so it has no options</prompt>
</criterion>
</rubric>
<assessments>
<assessment name="example-based-assessment" algorithm_id="fake">
<example>
<answer>This is my answer.</answer>
<select criterion="vocabulary" option="good" />
</example>
<example>
<answer>тєѕт αηѕωєя</answer>
<select criterion="vocabulary" option="bad" />
</example>
</assessment>
</assessments>
</openassessment>
<openassessment>
<title>Open Assessment Test</title>
<prompts>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat poverty?</description>
</prompt>
<prompt>
<description>Given the state of the world today, what do you think should be done to combat pollution?</description>
</prompt>
</prompts>
<rubric>
<criterion>
<name>𝓒𝓸𝓷𝓬𝓲𝓼𝓮</name>
<prompt>How concise is it?</prompt>
<option points="3">
<name>ﻉซƈﻉɭɭﻉกՇ</name>
<explanation>Extremely concise</explanation>
</option>
<option points="2">
<name>Ġööḋ</name>
<explanation>Concise</explanation>
</option>
<option points="1">
<name>ק๏๏г</name>
<explanation>Wordy</explanation>
</option>
</criterion>
<criterion>
<name>Form</name>
<prompt>How well-formed is it?</prompt>
<option points="3">
<name>Good</name>
<explanation>Good</explanation>
</option>
<option points="2">
<name>Fair</name>
<explanation>Fair</explanation>
</option>
<option points="1">
<name>Poor</name>
<explanation>Poor</explanation>
</option>
</criterion>
</rubric>
<assessments>
<assessment name="example-based-assessment" algorithm_id="fake">
<example>
<answer>Example Answer One</answer>
<select criterion="𝓒𝓸𝓷𝓬𝓲𝓼𝓮" option="Ġööḋ" />
<select criterion="Form" option="Poor" />
</example>
<example>
<answer>Example Answer Two</answer>
<select criterion="𝓒𝓸𝓷𝓬𝓲𝓼𝓮" option="ﻉซƈﻉɭɭﻉกՇ" />
<select criterion="Form" option="Fair" />
</example>
<example>
<answer>Example Answer Three</answer>
<select criterion="𝓒𝓸𝓷𝓬𝓲𝓼𝓮" option="Ġööḋ" />
<select criterion="Form" option="Good" />
</example>
<example>
<answer>Example Answer Four</answer>
<select criterion="𝓒𝓸𝓷𝓬𝓲𝓼𝓮" option="ﻉซƈﻉɭɭﻉกՇ" />
<select criterion="Form" option="Good" />
</example>
</assessment>
</assessments>
</openassessment>
"""
Integration test for example-based assessment (AI).
"""
import json
import mock
from django.test.utils import override_settings
from submissions import api as sub_api
from openassessment.xblock.openassessmentblock import OpenAssessmentBlock
from .base import XBlockHandlerTestCase, scenario
class AIAssessmentIntegrationTest(XBlockHandlerTestCase):
"""
Integration test for example-based assessment (AI).
"""
SUBMISSION = json.dumps({'submission': ('This is submission part 1!', 'This is submission part 2!')})
AI_ALGORITHMS = {
'fake': 'openassessment.assessment.worker.algorithm.FakeAIAlgorithm'
}
@mock.patch.object(OpenAssessmentBlock, 'is_admin', new_callable=mock.PropertyMock)
@override_settings(ORA2_AI_ALGORITHMS=AI_ALGORITHMS)
@scenario('data/example_based_only.xml', user_id='Bob')
def test_asynch_generate_score(self, xblock, mock_is_admin):
# Test that AI grading, which creates assessments asynchronously,
# updates the workflow so students can receive a score.
mock_is_admin.return_value = True
# Train classifiers for the problem
self.request(xblock, 'schedule_training', json.dumps({}), response_format='json')
# Submit a response
self.request(xblock, 'submit', self.SUBMISSION, response_format='json')
# BEFORE viewing the grade page, check that we get a score
score = sub_api.get_score(xblock.get_student_item_dict())
self.assertIsNot(score, None)
self.assertEqual(score['submission_uuid'], xblock.submission_uuid)
@mock.patch.object(OpenAssessmentBlock, 'is_admin', new_callable=mock.PropertyMock)
@override_settings(ORA2_AI_ALGORITHMS=AI_ALGORITHMS)
@scenario('data/feedback_only_criterion_ai.xml', user_id='Bob')
def test_feedback_only_criterion(self, xblock, mock_is_admin):
# Test that AI grading, which creates assessments asynchronously,
# updates the workflow so students can receive a score.
mock_is_admin.return_value = True
# Train classifiers for the problem and submit a response
self.request(xblock, 'schedule_training', json.dumps({}), response_format='json')
self.request(xblock, 'submit', self.SUBMISSION, response_format='json')
# Render the grade page
resp = self.request(xblock, 'render_grade', json.dumps({}))
self.assertIn('example-based', resp.lower())
[
{
"text": "Food is any substance[1] consumed to provide nutritional support for the body. It is usually of plant or animal origin, and contains essential nutrients, such as carbohydrates, fats, proteins, vitamins, or minerals. The substance is ingested by an organism and assimilated by the organism's cells in an effort to produce energy, maintain life, or stimulate growth. Historically, people secured food through two methods: hunting and gathering, and agriculture. Today, most of the food energy consumed by the world population is supplied by the food industry. Food safety and food security are monitored by agencies like the International Association for Food Protection, World Resources Institute, World Food Programme, Food and Agriculture Organization, and International Food Information Council. They address issues such as sustainability, biological diversity, climate change, nutritional economics, population growth, water supply, and access to food.",
"score": 0
},
{
"text": "Most food has its origin in plants. Some food is obtained directly from plants; but even animals that are used as food sources are raised by feeding them food derived from plants. Cereal grain is a staple food that provides more food energy worldwide than any other type of crop. Maize, wheat, and rice – in all of their varieties – account for 87% of all grain production worldwide.[2] Most of the grain that is produced worldwide is fed to livestock. Some foods not from animal or plant sources include various edible fungi, especially mushrooms. Fungi and ambient bacteria are used in the preparation of fermented and pickled foods like leavened bread, alcoholic drinks, cheese, pickles, kombucha, and yogurt. Another example is blue-green algae such as Spirulina.[3] Inorganic substances such as salt, baking soda and cream of tartar are used to preserve or chemically alter an ingredient.",
"score": 1
},
{
"text": "Many plants or plant parts are eaten as food. There are around 2,000 plant species which are cultivated for food, and many have several distinct cultivars.[4] Seeds of plants are a good source of food for animals, including humans, because they contain the nutrients necessary for the plant's initial growth, including many healthful fats, such as Omega fats. In fact, the majority of food consumed by human beings are seed-based foods. Edible seeds include cereals (maize, wheat, rice, et cetera), legumes (beans, peas, lentils, et cetera), and nuts. Oilseeds are often pressed to produce rich oils - sunflower, flaxseed, rapeseed (including canola oil), sesame, et cetera.[5] Seeds are typically high in unsaturated fats and, in moderation, are considered a health food, although not all seeds are edible. Large seeds, such as those from a lemon, pose a choking hazard, while seeds from cherries and apples contain cyanide which could be poisonous only if consumed in large volumes.[6] Fruits are the ripened ovaries of plants, including the seeds within. Many plants and animals have coevolved such that the fruits of the former are an attractive food source to the latter, because animals that eat the fruits may excrete the seeds some distance away. Fruits, therefore, make up a significant part of the diets of most cultures. Some botanical fruits, such as tomatoes, pumpkins, and eggplants, are eaten as vegetables.[7] (For more information, see list of fruits.) Vegetables are a second type of plant matter that is commonly eaten as food. These include root vegetables (potatoes and carrots), bulbs (onion family), leaf vegetables (spinach and lettuce), stem vegetables (bamboo shoots and asparagus), and inflorescence vegetables (globe artichokes and broccoli and other vegetables such as cabbage or cauliflower).[8]",
"score": 0
},
{
"text": "Animals are used as food either directly or indirectly by the products they produce. Meat is an example of a direct product taken from an animal, which comes from muscle systems or from organs. Various raw meats Food products produced by animals include milk produced by mammary glands, which in many cultures is drunk or processed into dairy products (cheese, butter, etc.). In addition, birds and other animals lay eggs, which are often eaten, and bees produce honey, a reduced nectar from flowers, which is a popular sweetener in many cultures. Some cultures consume blood, sometimes in the form of blood sausage, as a thickener for sauces, or in a cured, salted form for times of food scarcity, and others use blood in stews such as jugged hare.[9] Some cultures and people do not consume meat or animal food products for cultural, dietary, health, ethical, or ideological reasons. Vegetarians choose to forgo food from animal sources to varying degrees. Vegans do not consume any foods that are or contain ingredients from an animal source.",
"score": 2
},
{
"text": "Most food has always been obtained through agriculture. With increasing concern over both the methods and products of modern industrial agriculture, there has been a growing trend toward sustainable agricultural practices. This approach, partly fueled by consumer demand, encourages biodiversity, local self-reliance and organic farming methods.[10] Major influences on food production include international organizations (e.g. the World Trade Organization and Common Agricultural Policy), national government policy (or law), and war.[11] In popular culture, the mass production of food, specifically meats such as chicken and beef, has come under fire from various documentaries, most recently Food, Inc, documenting the mass slaughter and poor treatment of animals, often for easier revenues from large corporations. Along with a current trend towards environmentalism, people in Western culture have had an increasing trend towards the use of herbal supplements, foods for a specific group of person (such as dieters, women, or athletes), functional foods (fortified foods, such as omega-3 eggs), and a more ethnically diverse diet.[12] Several organisations have begun calling for a new kind of agriculture in which agroecosystems provide food but also support vital ecosystem services so that soil fertility and biodiversity are maintained rather than compromised. According to the International Water Management Institute and UNEP, well-managed agroecosystems not only provide food, fiber and animal products, they also provide services such as flood mitigation, groundwater recharge, erosion control and habitats for plants, birds fish and other animals.[13]",
"score": 3
},
{
"text": "Generally regarded as the most pleasant taste, sweetness is almost always caused by a type of simple sugar such as glucose or fructose, or disaccharides such as sucrose, a molecule combining glucose and fructose.[16] Complex carbohydrates are long chains and thus do not have the sweet taste. Artificial sweeteners such as sucralose are used to mimic the sugar molecule, creating the sensation of sweet, without the calories. Other types of sugar include raw sugar, which is known for its amber color, as it is unprocessed. As sugar is vital for energy and survival, the taste of sugar is pleasant. The stevia plant contains a compound known as steviol which, when extracted, has 300 times the sweetness of sugar while having minimal impact on blood sugar.[17] Sour Sourness is caused by the taste of acids, such as vinegar in alcoholic beverages. Sour foods include citrus, specifically lemons, limes, and to a lesser degree oranges. Sour is evolutionarily significant as it is a sign for a food that may have gone rancid due to bacteria.[18] Many foods, however, are slightly acidic, and help stimulate the taste buds and enhance flavor.",
"score": 1
},
{
"text": "Saltiness is the taste of alkali metal ions such as sodium and potassium. It is found in almost every food in low to moderate proportions to enhance flavor, although to eat pure salt is regarded as highly unpleasant. There are many different types of salt, with each having a different degree of saltiness, including sea salt, fleur de sel, kosher salt, mined salt, and grey salt. Other than enhancing flavor, its significance is that the body needs and maintains a delicate electrolyte balance, which is the kidney's function. Salt may be iodized, meaning iodine has been added to it, a necessary nutrient that promotes thyroid function. Some canned foods, notably soups or packaged broths, tend to be high in salt as a means of preserving the food longer. Historically speaking, salt has been used as a meat preservative as salt promotes water excretion, thus working as a preservative. Similarly, dried foods also promote food safety.[19] Bitter Bitterness is a sensation often considered unpleasant characterized by having a sharp, pungent taste. Dark, unsweetened chocolate, caffeine, lemon rind, and some types of fruit are known to be bitter. Umami Also named as Savoury. Umami, the Japanese word for delicious, is the least known in Western popular culture but has a long tradition in Asian cuisine. Umami is the taste of glutamates, especially monosodium glutamate (MSG).[16] It is characterized as savory, meaty, and rich in flavor. Salmon and mushrooms are foods high in umami. Meat and other animal byproducts are described as having this taste.[citation needed]",
"score": 2
}
]
#!/usr/bin/env bash
PYTHON=`which python`
$PYTHON -m nltk.downloader stopwords maxent_treebank_pos_tagger wordnet --quiet
Performance Tests
=================
1. Install performance test requirements:
.. code:: bash
cd ora2
pip install -r requirements/perf.txt
2. Import ``course.tar.gz`` into Studio:
* Course ID: 1
* Course Org: ora2
* Course Run: 1
3. Enable ``auto_auth`` in the LMS feature flags:
.. code:: javascript
{
"FEATURES": {
"AUTOMATIC_AUTH_FOR_TESTING": true
}
}
4. Log in as a staff user and schedule a training task in the Course Staff Debug of the example-based assessment problem.
5. **Optional**: Increase open file limit:
.. code:: bash
ulimit -n 2048
6. Start the Locust server, and point it at the test server. **NOTE**: You *must* include the trailing slash in the host URL.
.. code:: bash
cd performance
locust --host=http://example.com/
If your server has basic auth enabled, provide credentials with environment vars:
.. code:: bash
cd performance
BASIC_AUTH_USER=foo BASIC_AUTH_PASSWORD=bar locust --host=http://example.com/
7. Visit the `Locust web UI <http://localhost:8089>`_ to start the test.
"""
Performance tests for the OpenAssessment XBlock.
"""
import os
import json
import random
from collections import namedtuple
import gevent
import loremipsum
from locust import HttpLocust, TaskSet, task
class OpenAssessmentPage(object):
"""
Encapsulate interactions with the OpenAssessment XBlock's pages.
"""
# These assume that the course fixture has been installed
ProblemFixture = namedtuple('ProblemFixture', [
'course_id', 'base_url', 'base_handler_url',
'rubric_options', 'render_step_handlers'
])
PROBLEMS = {
'peer_then_self': ProblemFixture(
course_id="ora2/1/1",
base_url= "courses/ora2/1/1/courseware/efa85eb090164a208d772a344df7181d/69f15a02c5af4e95b9c5525771b8f4ee/",
base_handler_url="courses/ora2/1/1/xblock/i4x:;_;_ora2;_1;_openassessment;_0e2bbf6cc89e45d98b028fa4e2d46314/handler/",
rubric_options={
'Ideas': ['Poor', 'Fair', 'Good'],
'Content': ['Poor', 'Fair', 'Good', 'Excellent']
},
render_step_handlers=[
'render_submission', 'render_peer_assessment',
'render_self_assessment', 'render_grade',
]
),
'example_based': ProblemFixture(
course_id="ora2/1/1",
base_url="courses/ora2/1/1/courseware/efa85eb090164a208d772a344df7181d/fb039ef8a34641509190918ada79122a/",
base_handler_url="courses/ora2/1/1/xblock/i4x:;_;_ora2;_1;_openassessment;_8df3fa4de26747e0ad99b4157e45f5e5/handler/",
rubric_options={
'Ideas': ['Bad', 'Good'],
'Content': ['Bad', 'Good']
},
render_step_handlers=['render_submission', 'render_grade']
)
}
def __init__(self, hostname, client, problem_name):
"""
Initialize the page to use specified HTTP client.
Args:
hostname (unicode): The hostname (used for the referer HTTP header)
client (HttpSession): The HTTP client to use.
problem_name (unicode): Name of the problem (one of the keys in `OpenAssessmentPage.PROBLEMS`)
"""
self.hostname = hostname
self.client = client
self.problem_fixture = self.PROBLEMS[problem_name]
self.logged_in = False
# Configure basic auth
if 'BASIC_AUTH_USER' in os.environ and 'BASIC_AUTH_PASSWORD' in os.environ:
self.client.auth = (os.environ['BASIC_AUTH_USER'], os.environ['BASIC_AUTH_PASSWORD'])
def log_in(self):
"""
Log in as a unique user with access to the XBlock(s) under test.
"""
resp = self.client.get(
"auto_auth",
params={'course_id': self.problem_fixture.course_id},
verify=False,
timeout=120
)
self.logged_in = (resp.status_code == 200)
return self
def load_steps(self):
"""
Load all steps in the OpenAssessment flow.
"""
# Load the container page
self.client.get(self.problem_fixture.base_url, verify=False)
# Load each of the steps in parallel
get_unverified = lambda url: self.client.get(url, verify=False)
gevent.joinall([
gevent.spawn(get_unverified, url) for url in [
self.handler_url(handler)
for handler in self.problem_fixture.render_step_handlers
]
], timeout=0.5)
return self
def submit_response(self):
"""
Submit a response.
"""
payload = json.dumps({
'submission': u' '.join(loremipsum.get_paragraphs(random.randint(1, 10))),
})
self.client.post(self.handler_url('submit'), data=payload, headers=self._post_headers, verify=False)
def peer_assess(self, continue_grading=False):
"""
Assess a peer.
Kwargs:
continue_grading (bool): If true, simulate "continued grading"
in which a student asks to assess peers in addition to the required number.
"""
params = {
'options_selected': self._select_random_options(),
'overall_feedback': loremipsum.get_paragraphs(random.randint(1, 3)),
'criterion_feedback': {}
}
if continue_grading:
params['continue_grading'] = True
payload = json.dumps(params)
self.client.post(self.handler_url('peer_assess'), data=payload, headers=self._post_headers, verify=False)
def self_assess(self):
"""
Complete a self-assessment.
"""
payload = json.dumps({
'options_selected': self._select_random_options()
})
self.client.post(self.handler_url('self_assess'), data=payload, headers=self._post_headers, verify=False)
def handler_url(self, handler_name):
"""
Return the full URL for an XBlock handler.
Args:
handler_name (str): The name of the XBlock handler method.
Returns:
str
"""
return "{base}{handler}".format(base=self.problem_fixture.base_handler_url, handler=handler_name)
def _select_random_options(self):
"""
Select random options for each criterion in the rubric.
"""
return {
criterion: random.choice(options)
for criterion, options in self.problem_fixture.rubric_options.iteritems()
}
@property
def _post_headers(self):
"""
Headers for a POST request, including the CSRF token.
"""
return {
'Content-type': 'application/json',
'Accept': 'application/json',
'X-CSRFToken': self.client.cookies.get('csrftoken', ''),
'Referer': self.hostname
}
class OpenAssessmentTasks(TaskSet):
"""
Virtual user interactions with the OpenAssessment XBlock.
"""
def __init__(self, *args, **kwargs): # pylint: disable=W0613
"""
Initialize the task set.
"""
super(OpenAssessmentTasks, self).__init__(*args, **kwargs)
self.hostname = self.locust.host
self.page = None
@task
def peer_and_self(self):
"""
Test the peer-->self workflow.
"""
if self.page is None:
self.page = OpenAssessmentPage(self.hostname, self.client, 'peer_then_self') # pylint: disable=E1101
self.page.log_in()
if not self.page.logged_in:
self.page.log_in()
else:
self._submit_response()
# Randomly peer/self assess or log in as a new user.
# This should be sufficient to get students through
# the entire flow (satisfying the requirements for peer assessment).
action = random.randint(0, 100)
if action <= 80:
continue_grading = random.randint(0, 10) < 4
self.page.peer_assess(continue_grading=continue_grading)
self.page.self_assess()
else:
self.page.log_in()
@task
def example_based(self):
"""
Test example-based assessment only.
"""
if self.page is None:
self.page = OpenAssessmentPage(self.hostname, self.client, 'example_based') # pylint: disable=E1101
self.page.log_in()
if not self.page.logged_in:
self.page.log_in()
else:
self._submit_response()
if random.randint(0, 100) < 50:
self.page.log_in()
def _submit_response(self):
"""
Simulate the user loading the page, submitting a response,
then reloading the steps (usually triggered by AJAX).
If the user has already submitted, the handler will return
an error message in the JSON, but the HTTP status will still be 200.
"""
self.page.load_steps()
self.page.submit_response()
self.page.load_steps()
class OpenAssessmentLocust(HttpLocust):
"""
Performance test definition for the OpenAssessment XBlock.
"""
task_set = OpenAssessmentTasks
min_wait = 10000
max_wait = 15000