From 4050d75eb889bdae93c6ff7f962fff818f161cd2 Mon Sep 17 00:00:00 2001
From: Phill Conrad as submit admin <pconrad@cs.ucsb.edu>
Date: Wed, 30 May 2018 13:24:36 -0700
Subject: [PATCH] ground truth May 30 2018

---
 submit/__init__.py             |   4 +-
 submit/helpers.py              |  16 +-
 submit/models.py               |   2 +-
 submit/views.py                |   4 +
 submit/workers/proxy.py        |  59 ++++++-
 submit/workers/proxy.py.backup | 293 +++++++++++++++++++++++++++++++++
 submit/workers/worker.py       |  26 ++-
 7 files changed, 377 insertions(+), 27 deletions(-)
 create mode 100644 submit/workers/proxy.py.backup

diff --git a/submit/__init__.py b/submit/__init__.py
index bf30fb3..3ed9c5a 100644
--- a/submit/__init__.py
+++ b/submit/__init__.py
@@ -8,7 +8,7 @@
 from .models import configure_sql, create_schema, populate_database
 from .security import get_user, group_finder
 
-__version__ = '1.2.0'
+__version__ = '1.0.3'
 
 
 class Root(object):
@@ -79,7 +79,7 @@ def main(global_config, **settings):
     engine = engine_from_config(settings, 'sqlalchemy.')
     configure_sql(engine)
 
-    secure_cookies = settings.get('secure_cookies') != 'false'
+    secure_cookies = True
     if 'pyramid_debugtoolbar' in settings['pyramid.includes']:
         create_schema(global_config['__file__'])
         populate_database()
diff --git a/submit/helpers.py b/submit/helpers.py
index 6ceee12..5683a85 100644
--- a/submit/helpers.py
+++ b/submit/helpers.py
@@ -71,9 +71,8 @@ class UmailAddress(EmailAddress):
 
     """A validator to verify that a umail address is correct."""
 
-    def run(self, value, errors, request, *args):
-        retval = super(UmailAddress, self).run(value.lower(), errors, request,
-                                               *args)
+    def run(self, value, errors, *args):
+        retval = super(UmailAddress, self).run(value.lower(), errors, *args)
         if errors:
             return retval
         if not retval.endswith('@umail.ucsb.edu'):
@@ -81,7 +80,7 @@ def run(self, value, errors, request, *args):
             return retval
         # Fetch name
         try:
-            name = fetch_name_by_umail(retval, request)
+            name = fetch_name_by_umail(retval)
         except Exception as exc:
             self.add_error(errors, exc.message)
             return retval
@@ -274,7 +273,7 @@ def fetch_request_ids(item_ids, cls, attr_name, verification_list=None):
     return items
 
 
-def fetch_name_by_umail(umail, request):
+def fetch_name_by_umail(umail):
     def extract(item):
         if len(data[item]) == 1:
             return data[item][0]
@@ -282,13 +281,8 @@ def extract(item):
 
     uid = umail.split('@')[0]
 
-    # Return the portion before @umail.ucsb.edu if ldap_uri is not provided
-    ldap_uri = request.registry.settings.get('ldap_uri')
-    if not ldap_uri:
-        return uid
-
     # connect to ldap
-    ldap_conn = ldap.initialize(ldap_uri)
+    ldap_conn = ldap.initialize('ldaps://directory.ucsb.edu')
     ldap_conn.protocol_version = ldap.VERSION3
     results = ldap_conn.search_s(
         'o=ucsb', ldap.SCOPE_ONELEVEL, filterstr='uid={}'.format(uid),
diff --git a/submit/models.py b/submit/models.py
index 4a4d5da..ddcc47d 100644
--- a/submit/models.py
+++ b/submit/models.py
@@ -407,7 +407,7 @@ class Project(BasicBase, Base):
     makefile = relationship(File, backref='makefile_for_projects')
     makefile_id = Column(Integer, ForeignKey('file.id'), nullable=True)
     name = Column(Unicode, nullable=False)
-    status = Column(Enum('locked', 'notready', 'ready', name='proj_status'),
+    status = Column(Enum('locked', 'notready', 'ready', name='status'),
                     nullable=False, server_default='notready')
     submissions = relationship('Submission', backref='project',
                                cascade='all, delete-orphan')
diff --git a/submit/views.py b/submit/views.py
index 1e6ab89..d3a6575 100644
--- a/submit/views.py
+++ b/submit/views.py
@@ -1071,6 +1071,10 @@ def submission_view(request, submission, as_user):
     else:
         prev_group = next_group = None
 
+
+    if not submission_admin and submission.project.name[0:4]=="EXAM":
+       files = {}
+
     return {'diff_table': diff_table,
             'extra_files': extra_files,
             'files': files,
diff --git a/submit/workers/proxy.py b/submit/workers/proxy.py
index 297de94..791117a 100644
--- a/submit/workers/proxy.py
+++ b/submit/workers/proxy.py
@@ -1,3 +1,4 @@
+import time
 import amqp_worker
 import json
 import os
@@ -57,6 +58,11 @@ def __init__(self):
 
         self.base_file_path = settings['file_directory']
         self.private_key_file = settings['ssh_priv_key']
+        self.sleep_short_min = int(settings['sleep_short_min'])
+        self.sleep_short_max = int(settings['sleep_short_max'])
+        self.sleep_long_min = int(settings['sleep_long_min'])
+        self.sleep_long_max = int(settings['sleep_long_max'])
+
         self.account = args.worker_account
         machines = settings['worker_machines']
         if isinstance(machines, basestring):
@@ -78,6 +84,15 @@ def __init__(self):
 
         worker.handle_command(args.command)
 
+
+    def get_short_sleep(self):
+       return random.uniform(self.sleep_short_min,self.sleep_short_max) 
+
+    def get_long_sleep(self):
+        return random.uniform(self.sleep_long_min,self.sleep_long_max) 
+
+
+
     @workers.wrapper
     def do_work(self, submission_id, testable_id, update_project=False):
         # Verify job
@@ -100,8 +115,11 @@ def do_work(self, submission_id, testable_id, update_project=False):
             # Fetch the best machine
             priority, machine = heappop(self.machines)
             # Log the start of the job
-            workers.log_msg('{}.{} begin ({})'
-                            .format(submission_id, testable_id, machine))
+            start_time = time.time()
+            workers.log_msg('{}.{} begin ({}) {} {} {} {}'
+                            .format(submission_id, testable_id, machine,
+                                    submission.project.class_.name,submission.project.name,submission.created_by.name,testable.name ))
+
             log_type = 'unhandled'
             try:
                 # Kill any processes on the worker
@@ -109,6 +127,7 @@ def do_work(self, submission_id, testable_id, update_project=False):
                 # Copy the files to the worker (and remove existing files)
                 self.push_files(machine, submission, testable)
                 # Run the remote worker
+
                 self.ssh(machine, 'python worker.py')
                 # Fetch and generate the results
                 self.fetch_results(machine, submission, testable,
@@ -119,21 +138,35 @@ def do_work(self, submission_id, testable_id, update_project=False):
                 attempt += 1
                 log_type = 'timeout'
                 priority += 10
-            except Exception:  # Increase priority and rereaise the exception
+            except Exception:  # Increase priority and re-raise the exception
                 log_type = 'exception'
                 priority += 5
+                sleep_time = self.get_long_sleep()
+                workers.log_msg('{}.{} {}  ({}) ({} sleep) {} {} {} {}'.format(submission_id,
+                                    testable_id, 'exception_sleep', sleep_time,
+                                    machine, 
+                                    submission.project.class_.name,submission.project.name,submission.created_by.name,testable.name ))
+                time.sleep(sleep_time)
                 raise
             finally:
                 # Add the machine back to the queue
                 heappush(self.machines, (priority, machine))
                 # Log the end of the job
-                workers.log_msg('{}.{} {} ({})'.format(submission_id,
-                                                       testable_id, log_type,
-                                                       machine))
+                elapsed_time = time.time() - start_time
+                workers.log_msg('{}.{} {} ({}) ({} sec) {} {} {} {}'.format(submission_id,
+                                    testable_id, log_type,
+                                    machine, elapsed_time,
+                                    submission.project.class_.name,submission.project.name,submission.created_by.name,testable.name ))
         raise Exception('{}.{} timed out 16 times.'
                         .format(submission_id, testable_id))
 
     def fetch_results(self, machine, submission, testable, update_project):
+
+        workers.log_msg('{}.{} {} ({}) {} {} {} {}'.format(submission.id,
+                                    testable.id, 'fetch_results',
+                                    machine, 
+                                    submission.project.class_.name,submission.project.name,submission.created_by.name,testable.name ))
+
         # Rsync to retrieve results
         self.rsync(machine)
         os.chdir('results')
@@ -193,6 +226,9 @@ def kill_processes(self, machine):
             raise Exception('killall did not work as expected')
         except subprocess.CalledProcessError as exc:
             if exc.returncode != 255 or exc.output.strip() != expected:
+                sleep_time = self.get_short_sleep()
+                workers.log_msg('kill_processes exc.returncode={} sleep={} output={}'.format(exc.returncode,sleep_time,exc.output.strip()))
+                time.sleep(sleep_time)
                 raise Exception('killall status: {} ({})'
                                 .format(exc.returncode, exc.output.strip()))
         return time.time() - start
@@ -265,6 +301,12 @@ def push_files(self, machine, submission, testable):
         self.rsync(machine, from_local=True)
 
     def rsync(self, machine, from_local=False):
+
+        sleep_time = self.get_short_sleep()
+        time.sleep(sleep_time)
+        workers.log_msg('rsync machine={} sleep={}'.format(machine,sleep_time))
+
+
         src = '{}@{}:working/'.format(self.account, machine)
         dst = '.'
         if from_local:
@@ -274,6 +316,11 @@ def rsync(self, machine, from_local=False):
         subprocess.check_call(cmd, stdout=open(os.devnull, 'w'), shell=True)
 
     def ssh(self, machine, command, timeout=None):
+
+        sleep_time = self.get_short_sleep()
+        time.sleep(sleep_time)
+        workers.log_msg('ssh machine={} command={} sleep={}'.format(machine,command,sleep_time))
+
         options = '-o ConnectTimeout={}'.format(timeout) if timeout else ''
         cmd = 'ssh -i {key} {options} {user}@{host} {command}'.format(
             key=self.private_key_file, user=self.account, host=machine,
diff --git a/submit/workers/proxy.py.backup b/submit/workers/proxy.py.backup
new file mode 100644
index 0000000..efd44d4
--- /dev/null
+++ b/submit/workers/proxy.py.backup
@@ -0,0 +1,293 @@
+import amqp_worker
+import json
+import os
+import pickle
+import random
+import subprocess
+import time
+from heapq import heappop, heappush
+from sqlalchemy import engine_from_config
+from .exceptions import HandledError, SSHConnectTimeout
+from .. import workers
+from ..diff_unit import Diff
+from ..models import (File, Session, Submission, TestCaseResult, Testable,
+                      TestableResult, configure_sql)
+
+
+def set_expected_files(testable, results, base_file_path):
+    # Update the expected output of each test case
+    for test_case in testable.test_cases:
+        if test_case.id not in results:
+            raise Exception('Missing test case result in project update: {0}'
+                            .format(test_case.id))
+        if test_case.output_type == 'diff':
+            output_file = 'tc_{0}'.format(test_case.id)
+            test_case.expected = File.fetch_or_create(
+                open(output_file).read(), base_file_path)
+    testable.is_locked = False
+    if not any(x.is_locked for x in testable.project.testables):
+        testable.project.status = u'notready'
+
+
+def compute_diff(test_case, test_case_result, output_file, base_file_path):
+    """Associate the diff (if exists) with the TestCaseResult.
+
+    Return whether or not the outputs match.
+
+    """
+    with open(File.file_path(base_file_path, test_case.expected.sha1)) as fp:
+        expected_output = fp.read()
+    actual_output = ''
+    if os.path.isfile(output_file):
+        with open('tc_{0}'.format(test_case.id)) as fp:
+            actual_output = fp.read()
+    unit = Diff(expected_output, actual_output)
+    if not unit.outputs_match():
+        test_case_result.diff = File.fetch_or_create(pickle.dumps(unit),
+                                                     base_file_path)
+        return False
+    return True
+
+
+class WorkerProxy():
+    def __init__(self):
+        parser = amqp_worker.base_argument_parser()
+        parser.add_argument('worker_account', type=str)
+        args, settings = amqp_worker.parse_base_args(parser, 'app:main')
+
+        self.base_file_path = settings['file_directory']
+        self.private_key_file = settings['ssh_priv_key']
+        self.account = args.worker_account
+        machines = settings['worker_machines']
+        if isinstance(machines, basestring):
+            machines = [machines]
+        random.shuffle(machines)
+        self.machines = [(5., x) for x in machines]
+        engine = engine_from_config(settings, 'sqlalchemy.')
+        configure_sql(engine)
+
+        worker = amqp_worker.AMQPWorker(
+            settings['queue_server'], settings['queue_tell_worker'],
+            self.do_work, is_daemon=args.daemon,
+            error_queue=settings.get('queue_tell_worker_error'),
+            log_file=settings['worker_proxy_log_file'].format(self.account),
+            pid_file=settings['worker_proxy_pid_file'].format(self.account),
+            email_subject='WorkerProxy {} Exception'.format(self.account),
+            email_from=settings['exc_mail_from'],
+            email_to=settings['exc_mail_to'])
+
+        worker.handle_command(args.command)
+
+    @workers.wrapper
+    def do_work(self, submission_id, testable_id, update_project=False):
+        # Verify job
+        submission = Submission.fetch_by_id(submission_id)
+        if not submission:
+            raise HandledError('Invalid submission id: {0}'.format(submission_id))
+
+        testable = Testable.fetch_by_id(testable_id)
+        if not testable:
+            raise HandledError('Invalid testable id: {0}'.format(testable_id))
+        if update_project and submission.project.status != u'locked':
+            raise HandledError('Rejecting update to unlocked project: {0}'
+                               .format(submission.project.id))
+        if update_project and not testable.is_locked:
+            raise HandledError('Rejecting update to unlocked testable: {0}'
+                               .format(testable_id))
+
+        attempt = 0
+        while attempt < 16:
+            # Fetch the best machine
+            priority, machine = heappop(self.machines)
+            # Log the start of the job
+            workers.log_msg('{}.{} begin ({})'
+                            .format(submission_id, testable_id, machine))
+            log_type = 'unhandled'
+            try:
+                # Kill any processes on the worker
+                priority = self.kill_processes(machine)
+                # Copy the files to the worker (and remove existing files)
+                self.push_files(machine, submission, testable)
+                # Run the remote worker
+                self.ssh(machine, 'python worker.py')
+                # Fetch and generate the results
+                self.fetch_results(machine, submission, testable,
+                                   update_project)
+                log_type = 'success'
+                return
+            except SSHConnectTimeout:  # Retry with a different host
+                attempt += 1
+                log_type = 'timeout'
+                priority += 10
+            except Exception:  # Increase priority and rereaise the exception
+                log_type = 'exception'
+                priority += 5
+                raise
+            finally:
+                # Add the machine back to the queue
+                heappush(self.machines, (priority, machine))
+                # Log the end of the job
+                workers.log_msg('{}.{} {} ({})'.format(submission_id,
+                                                       testable_id, log_type,
+                                                       machine))
+        raise Exception('{}.{} timed out 16 times.'
+                        .format(submission_id, testable_id))
+
+    def fetch_results(self, machine, submission, testable, update_project):
+        # Rsync to retrieve results
+        self.rsync(machine)
+        os.chdir('results')
+
+        # Create dictionary of completed test_cases
+        if os.path.isfile('test_cases'):
+            with open('test_cases') as fp:
+                results = {int(x[0]): x[1] for x in json.load(fp).items()}
+        else:
+            results = {}
+
+        if update_project:
+            set_expected_files(testable, results, self.base_file_path)
+            return
+
+        points = 0
+
+        # Set or update relevant test case results
+        for test_case in testable.test_cases:
+            test_case_result = TestCaseResult.fetch_by_ids(submission.id,
+                                                           test_case.id)
+            if test_case.id not in results:
+                if test_case_result:  # Delete existing result
+                    Session.delete(test_case_result)
+            else:
+                if test_case_result:
+                    test_case_result.update(results[test_case.id])
+                else:
+                    results[test_case.id]['submission_id'] = submission.id
+                    results[test_case.id]['test_case_id'] = test_case.id
+                    test_case_result = TestCaseResult(**results[test_case.id])
+                    Session.add(test_case_result)
+                output_file = 'tc_{0}'.format(test_case.id)
+                if test_case.output_type == 'diff':
+                    matches = compute_diff(test_case, test_case_result,
+                                           output_file, self.base_file_path)
+                    if matches and test_case_result.status == 'success':
+                        points += test_case.points
+                else:
+                    if os.path.isfile(output_file):  # Store file as the diff
+                        test_case_result.diff = File.fetch_or_create(
+                            open(output_file).read(), self.base_file_path)
+
+        # Create or update Testable
+        testable_data = json.load(open('testable'))
+        TestableResult.fetch_or_create(
+            make_results=testable_data.get('make'), points=points,
+            status=testable_data['status'], testable=testable,
+            submission=submission)
+
+    def kill_processes(self, machine):
+        expected = 'Connection to {} closed by remote host.'.format(machine)
+        start = time.time()
+        try:
+            self.ssh(machine, 'killall -9 -u {}'.format(self.account),
+                     timeout=1)
+            raise Exception('killall did not work as expected')
+        except subprocess.CalledProcessError as exc:
+            if exc.returncode != 255 or exc.output.strip() != expected:
+                raise Exception('killall status: {} ({})'
+                                .format(exc.returncode, exc.output.strip()))
+        return time.time() - start
+
+    def push_files(self, machine, submission, testable):
+        submitted = {x.filename: x.file.sha1 for x in submission.files}
+        build_files = {x.filename: x.file.sha1 for x in testable.build_files}
+
+        # Prepare build directory by symlinking the relevant submission files
+        os.mkdir('src')
+        for filev in testable.file_verifiers:
+            if filev.filename in submitted:
+                source = File.file_path(self.base_file_path,
+                                        submitted[filev.filename])
+                os.symlink(source, os.path.join('src', filev.filename))
+                if filev.filename in build_files:
+                    del build_files[filev.filename]
+            elif not filev.optional:
+                raise HandledError('File verifier not satisfied: {0}'
+                                   .format(filev.filename))
+        for name, sha1 in build_files.items():  # Symlink remaining build files
+            source = File.file_path(self.base_file_path, sha1)
+            os.symlink(source, os.path.join('src', name))
+
+        # Symlink Makefile to current directory if necessary
+        if submission.project.makefile and testable.make_target:
+            source = File.file_path(self.base_file_path,
+                                    submission.project.makefile.sha1)
+            os.symlink(source, 'Makefile')
+
+        # Symlink test inputs and copy build test case specifications
+        os.mkdir('inputs')
+        test_cases = []
+        for test_case in testable.test_cases:
+            test_cases.append(test_case.serialize())
+            if test_case.stdin:
+                destination = os.path.join('inputs', test_case.stdin.sha1)
+                if not os.path.isfile(destination):
+                    source = File.file_path(self.base_file_path,
+                                            test_case.stdin.sha1)
+                    os.symlink(source, destination)
+
+        # Copy execution files
+        os.mkdir('execution_files')
+        for execution_file in testable.execution_files:
+            destination = os.path.join('execution_files',
+                                       execution_file.filename)
+            source = File.file_path(self.base_file_path,
+                                    execution_file.file.sha1)
+            os.symlink(source, destination)
+        # Symlink sumbitted files that should be in the execution environment
+        for filev in testable.file_verifiers:
+            if filev.copy_to_execution and filev.filename in submitted:
+                destination = os.path.join('execution_files', filev.filename)
+                source = File.file_path(self.base_file_path,
+                                        submitted[filev.filename])
+                os.symlink(source, destination)
+
+        # Generate data dictionary
+        data = {'executable': testable.executable,
+                'key': '{}.{}'.format(submission.id, testable.id),
+                'make_target': testable.make_target,
+                'test_cases': test_cases}
+
+        # Save data specification
+        with open('data.json', 'w') as fp:
+            json.dump(data, fp)
+
+        # Rsync files
+        self.rsync(machine, from_local=True)
+
+    def rsync(self, machine, from_local=False):
+        src = '{}@{}:working/'.format(self.account, machine)
+        dst = '.'
+        if from_local:
+            src, dst = dst, src
+        cmd = ('rsync -e \'ssh -i {}\' --timeout=16 --delete -rLpv {} {}'
+               .format(self.private_key_file, src, dst))
+        subprocess.check_call(cmd, stdout=open(os.devnull, 'w'), shell=True)
+
+    def ssh(self, machine, command, timeout=None):
+        options = '-o ConnectTimeout={}'.format(timeout) if timeout else ''
+        cmd = 'ssh -i {key} {options} {user}@{host} {command}'.format(
+            key=self.private_key_file, user=self.account, host=machine,
+            command=command, options=options)
+        proc = subprocess.Popen(cmd, shell=True, stderr=subprocess.PIPE,
+                                stdout=subprocess.PIPE)
+        stdout, stderr = proc.communicate()
+        if proc.returncode != 0:
+            if stderr.strip().endswith('Connection timed out'):
+                raise SSHConnectTimeout()
+            output = stdout + '\n' + stderr if stdout else stderr
+            raise subprocess.CalledProcessError(proc.returncode, cmd,
+                                                output=output)
+
+
+def main():
+    WorkerProxy()
diff --git a/submit/workers/worker.py b/submit/workers/worker.py
index 6e02998..7e44300 100644
--- a/submit/workers/worker.py
+++ b/submit/workers/worker.py
@@ -21,7 +21,7 @@
 EXECUTION_FILES_PATH = 'execution_files'
 
 MAX_FILE_SIZE = 81920
-TIME_LIMIT = 4
+TIME_LIMIT = 8
 
 # Prepare Child Environemtn to disable CCACHE
 CHILD_ENV = os.environ.copy()
@@ -29,7 +29,7 @@
 
 
 def log_msg(msg):
-    print('{} {}'.format(datetime.now(), msg))
+    print('{} {} TIME_LIMIT={}'.format(datetime.now(), msg, TIME_LIMIT))
 
 
 class TimeoutAlarm(Exception):
@@ -43,7 +43,7 @@ def alarm_handler(_, _a):
 class Worker(object):
     @staticmethod
     def execute(command, stderr=None, stdin=None, stdout=None, files=None,
-                save=None):
+                save=None, log=None):
         if not stderr:
             stderr = open('/dev/null', 'w')
         if not stdout:
@@ -73,11 +73,18 @@ def execute(command, stderr=None, stdin=None, stdout=None, files=None,
 
         # Hacks to give more time to some scripts:
         time_limit = TIME_LIMIT
+
         if args[0] in ('valgrind',):
             time_limit *= 2
+        elif args[0]=='./kos':
+            time_limit = 60
         elif len(args) > 2 and args[1] == 'turtle_capture.sh':
             time_limit *= 4  # How can we run this faster?
 
+        if (log):
+            log.write('worker.execute: {date} args[0]={args0} time_limit={time_limit}\n'
+                     .format(date=datetime.now(), args0=args[0], time_limit=time_limit))
+
         # Run command with a timelimit
         # TODO: Do we only get partial output with stdout?
         try:
@@ -124,13 +131,18 @@ def execute(command, stderr=None, stdin=None, stdout=None, files=None,
                     shutil.copy(src, save[1])
             shutil.rmtree(tmp_dir)
 
-    def __init__(self):
+    def __init__(self, log):
+        self.log = log
         # Load testable information
         os.chdir('working')
         with open('data.json') as fp:
             self.data = json.load(fp)
 
     def run(self):
+
+        self.log.write('worker.run: {date} {key} executable={executable}\n'
+                     .format(date=datetime.now(), key=self.data['key'], executable=self.data['executable']))
+
         # Build and run tests
         os.mkdir(RESULTS_PATH)
         result = {}
@@ -196,9 +208,9 @@ def execute(*args, **kwargs):
                         stdout = None
                         stderr = output
                     execute(tc['args'], stderr=stderr, stdin=stdin,
-                            stdout=stdout)
+                            stdout=stdout, log=self.log)
             else:
-                execute(tc['args'], save=(tc['output_filename'], output_file))
+                execute(tc['args'], save=(tc['output_filename'], output_file), log=self.log)
                 if tc['output_filename'].endswith('.png'):
                     max_file_size = 131072  # Avoid truncating images
 
@@ -241,7 +253,7 @@ class TimeoutException(Exception):
 
 def main():
     with open('worker.log', 'a') as fp:
-        wp = Worker()
+        wp = Worker(fp)
         status = 'failed'
         start = time.time()
         try: