diff testcases.py @ 50:4ea7133ac25c

Converted 2.00 into the default branch
author Oleg Oshmyan <chortos@inbox.lv>
date Sun, 19 Dec 2010 23:25:13 +0200
parents 2.00/testcases.py@81f58c938ec5
children 1914ae9cfdce
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/testcases.py	Sun Dec 19 23:25:13 2010 +0200
@@ -0,0 +1,549 @@
+#! /usr/bin/env python
+# Copyright (c) 2010 Chortos-2 <chortos@inbox.lv>
+
+# TODO: copy the ansfile if not options.erase even if no validator is used
+
+from __future__ import division, with_statement
+
+try:
+	from compat import *
+	import files, problem, config
+except ImportError:
+	import __main__
+	__main__.import_error(sys.exc_info()[1])
+else:
+	from __main__ import clock, options
+
+import glob, re, sys, tempfile, time
+from subprocess import Popen, PIPE, STDOUT
+
+import os
+devnull = open(os.path.devnull, 'w+')
+
+try:
+	from signal import SIGTERM, SIGKILL
+except ImportError:
+	SIGTERM = 15
+	SIGKILL = 9
+
+try:
+	from _subprocess import TerminateProcess
+except ImportError:
+	# CPython 2.5 does define _subprocess.TerminateProcess even though it is
+	# not used in the subprocess module, but maybe something else does not
+	try:
+		import ctypes
+		TerminateProcess = ctypes.windll.kernel32.TerminateProcess
+	except (ImportError, AttributeError):
+		TerminateProcess = None
+
+
+# Do the hacky-wacky dark magic needed to catch presses of the Escape button.
+# If only Python supported forcible termination of threads...
+if not sys.stdin.isatty():
+	canceled = init_canceled = lambda: False
+	pause = None
+else:
+	try:
+		# Windows has select() too, but it is not the select() we want
+		import msvcrt
+	except ImportError:
+		try:
+			import select, termios, tty, atexit
+		except ImportError:
+			# It cannot be helped!
+			# Silently disable support for killing the program being tested
+			canceled = init_canceled = lambda: False
+			pause = None
+		else:
+			def cleanup(old=termios.tcgetattr(sys.stdin.fileno())):
+				termios.tcsetattr(sys.stdin.fileno(), termios.TCSAFLUSH, old)
+			atexit.register(cleanup)
+			del cleanup
+			tty.setcbreak(sys.stdin.fileno())
+			def canceled(select=select.select, stdin=sys.stdin, read=sys.stdin.read):
+				while select((stdin,), (), (), 0)[0]:
+					if read(1) == '\33':
+						return True
+				return False
+			def init_canceled():
+				while select.select((sys.stdin,), (), (), 0)[0]:
+					sys.stdin.read(1)
+			def pause():
+				sys.stdin.read(1)
+	else:
+		def canceled(kbhit=msvcrt.kbhit, getch=msvcrt.getch):
+			while kbhit():
+				c = getch()
+				if c == '\33':
+					return True
+				elif c == '\0':
+					# Let's hope no-one is fiddling with this
+					getch()
+			return False
+		def init_canceled():
+			while msvcrt.kbhit():
+				msvcrt.getch()
+		def pause():
+			msvcrt.getch()
+
+
+__all__ = ('TestCase', 'load_problem', 'TestCaseNotPassed',
+           'TimeLimitExceeded', 'CanceledByUser', 'WrongAnswer',
+           'NonZeroExitCode', 'CannotStartTestee',
+           'CannotStartValidator', 'CannotReadOutputFile',
+           'CannotReadInputFile', 'CannotReadAnswerFile')
+
+
+
+# Exceptions
+
+class TestCaseNotPassed(Exception): __slots__ = ()
+class TimeLimitExceeded(TestCaseNotPassed): __slots__ = ()
+class CanceledByUser(TestCaseNotPassed): __slots__ = ()
+
+class WrongAnswer(TestCaseNotPassed):
+	__slots__ = 'comment'
+	def __init__(self, comment=''):
+		self.comment = comment
+
+class NonZeroExitCode(TestCaseNotPassed):
+	__slots__ = 'exitcode'
+	def __init__(self, exitcode):
+		self.exitcode = exitcode
+
+class ExceptionWrapper(TestCaseNotPassed):
+	__slots__ = 'upstream'
+	def __init__(self, upstream):
+		self.upstream = upstream
+
+class CannotStartTestee(ExceptionWrapper): __slots__ = ()
+class CannotStartValidator(ExceptionWrapper): __slots__ = ()
+class CannotReadOutputFile(ExceptionWrapper): __slots__ = ()
+class CannotReadInputFile(ExceptionWrapper): __slots__ = ()
+class CannotReadAnswerFile(ExceptionWrapper): __slots__ = ()
+
+
+
+# Helper context managers
+
+class CopyDeleting(object):
+	__slots__ = 'case', 'file', 'name'
+	
+	def __init__(self, case, file, name):
+		self.case = case
+		self.file = file
+		self.name = name
+	
+	def __enter__(self):
+		if self.name:
+			try:
+				self.file.copy(self.name)
+			except:
+				try:
+					self.__exit__(None, None, None)
+				except:
+					pass
+				raise
+	
+	def __exit__(self, exc_type, exc_val, exc_tb):
+		if self.name:
+			self.case.files_to_delete.append(self.name)
+
+
+class Copying(object):
+	__slots__ = 'file', 'name'
+	
+	def __init__(self, file, name):
+		self.file = file
+		self.name = name
+	
+	def __enter__(self):
+		if self.name:
+			self.file.copy(self.name)
+	
+	def __exit__(self, exc_type, exc_val, exc_tb):
+		pass
+
+
+
+# Test case types
+
+class TestCase(object):
+	__slots__ = ('problem', 'id', 'isdummy', 'infile', 'outfile', 'points',
+	             'process', 'time_started', 'time_stopped', 'time_limit_string',
+	             'realinname', 'realoutname', 'maxtime', 'maxmemory',
+	             'has_called_back', 'files_to_delete')
+	
+	if ABCMeta:
+		__metaclass__ = ABCMeta
+	
+	def __init__(case, prob, id, isdummy, points):
+		case.problem = prob
+		case.id = id
+		case.isdummy = isdummy
+		case.points = points
+		case.maxtime = case.problem.config.maxtime
+		case.maxmemory = case.problem.config.maxmemory
+		if case.maxtime:
+			case.time_limit_string = '/%.3f' % case.maxtime
+		else:
+			case.time_limit_string = ''
+		if not isdummy:
+			case.realinname = case.problem.config.testcaseinname
+			case.realoutname = case.problem.config.testcaseoutname
+		else:
+			case.realinname = case.problem.config.dummyinname
+			case.realoutname = case.problem.config.dummyoutname
+	
+	@abstractmethod
+	def test(case): raise NotImplementedError
+	
+	def __call__(case, callback):
+		case.has_called_back = False
+		case.files_to_delete = []
+		try:
+			return case.test(callback)
+		finally:
+			now = clock()
+			if not getattr(case, 'time_started', None):
+				case.time_started = case.time_stopped = now
+			elif not getattr(case, 'time_stopped', None):
+				case.time_stopped = now
+			if not case.has_called_back:
+				callback()
+			case.cleanup()
+	
+	def cleanup(case):
+		#if getattr(case, 'infile', None):
+		#	case.infile.close()
+		#if getattr(case, 'outfile', None):
+		#	case.outfile.close()
+		if getattr(case, 'process', None):
+			# Try killing after three unsuccessful TERM attempts in a row
+			# (except on Windows, where TERMing is killing)
+			for i in range(3):
+				try:
+					try:
+						case.process.terminate()
+					except AttributeError:
+						# Python 2.5
+						if TerminateProcess and hasattr(proc, '_handle'):
+							# Windows API
+							TerminateProcess(proc._handle, 1)
+						else:
+							# POSIX
+							os.kill(proc.pid, SIGTERM)
+				except Exception:
+					time.sleep(0)
+					case.process.poll()
+				else:
+					case.process.wait()
+					break
+			else:
+				# If killing the process is unsuccessful three times in a row,
+				# just silently stop trying
+				for i in range(3):
+					try:
+						try:
+							case.process.kill()
+						except AttributeError:
+							# Python 2.5
+							if TerminateProcess and hasattr(proc, '_handle'):
+								# Windows API
+								TerminateProcess(proc._handle, 1)
+							else:
+								# POSIX
+								os.kill(proc.pid, SIGKILL)
+					except Exception:
+						time.sleep(0)
+						case.process.poll()
+					else:
+						case.process.wait()
+						break
+		if case.files_to_delete:
+			for name in case.files_to_delete:
+				try:
+					os.remove(name)
+				except Exception:
+					# It can't be helped
+					pass
+	
+	def open_infile(case):
+		try:
+			case.infile = files.File('/'.join((case.problem.name, case.realinname.replace('$', case.id))))
+		except IOError:
+			e = sys.exc_info()[1]
+			raise CannotReadInputFile(e)
+	
+	def open_outfile(case):
+		try:
+			case.outfile = files.File('/'.join((case.problem.name, case.realoutname.replace('$', case.id))))
+		except IOError:
+			e = sys.exc_info()[1]
+			raise CannotReadAnswerFile(e)
+
+
+class ValidatedTestCase(TestCase):
+	__slots__ = 'validator'
+	
+	def __init__(case, *args):
+		TestCase.__init__(case, *args)
+		if not case.problem.config.tester:
+			case.validator = None
+		else:
+			case.validator = case.problem.config.tester
+	
+	def validate(case, output):
+		if not case.validator:
+			# Compare the output with the reference output
+			case.open_outfile()
+			with case.outfile.open() as refoutput:
+				for line, refline in zip_longest(output, refoutput):
+					if refline is not None and not isinstance(refline, basestring):
+						line = bytes(line, sys.getdefaultencoding())
+					if line != refline:
+						raise WrongAnswer
+			return 1
+		elif callable(case.validator):
+			return case.validator(output)
+		else:                 
+			# Call the validator program
+			output.close()
+			if case.problem.config.ansname:
+				case.open_outfile()
+				case.outfile.copy(case.problem.config.ansname)
+			try:
+				case.process = Popen(case.validator, stdin=devnull, stdout=PIPE, stderr=STDOUT, universal_newlines=True, bufsize=-1)
+			except OSError:
+				raise CannotStartValidator(sys.exc_info()[1])
+			comment = case.process.communicate()[0].strip()
+			match = re.match(r'(?i)(ok|(?:correct|wrong)(?:(?:\s|_)*answer)?)(?:$|\s+|[.,!:]+\s*)', comment)
+			if match:
+				comment = comment[match.end():]
+			if not case.problem.config.maxexitcode:
+				if case.process.returncode:
+					raise WrongAnswer(comment)
+				else:
+					return 1, comment
+			else:
+				return case.process.returncode / case.problem.config.maxexitcode, comment
+
+
+class BatchTestCase(ValidatedTestCase):
+	__slots__ = ()
+	
+	def test(case, callback):
+		init_canceled()
+		if sys.platform == 'win32' or not case.maxmemory:
+			preexec_fn = None
+		else:
+			def preexec_fn():
+				try:
+					import resource
+					maxmemory = int(case.maxmemory * 1048576)
+					resource.setrlimit(resource.RLIMIT_AS, (maxmemory, maxmemory))
+					# I would also set a CPU time limit but I do not want the time
+					# that passes between the calls to fork and exec to be counted in
+				except MemoryError:
+					# We do not have enough memory for ourselves;
+					# let the parent know about this
+					raise
+				except Exception:
+					# Well, at least we tried
+					pass
+		case.open_infile()
+		case.time_started = None
+		if case.problem.config.stdio:
+			if options.erase and not case.validator and case.problem.config.inname:
+				# TODO: re-use the same file name if possible
+				# FIXME: 2.5 lacks the delete parameter
+				with tempfile.NamedTemporaryFile(delete=False) as f:
+					inputdatafname = f.name
+				contextmgr = CopyDeleting(case, case.infile, inputdatafname)
+			else:
+				inputdatafname = case.problem.config.inname
+				contextmgr = Copying(case.infile, inputdatafname)
+			with contextmgr:
+				# FIXME: this U doesn't do anything good for the child process, does it?
+				with open(inputdatafname, 'rU') as infile:
+					with tempfile.TemporaryFile('w+') if options.erase and not case.validator else open(case.problem.config.outname, 'w+') as outfile:
+						try:
+							try:
+								case.process = Popen(case.problem.config.path, stdin=infile, stdout=outfile, stderr=devnull, universal_newlines=True, bufsize=-1, preexec_fn=preexec_fn)
+							except MemoryError:
+								# If there is not enough memory for the forked test.py,
+								# opt for silent dropping of the limit
+								# TODO: show a warning somewhere
+								case.process = Popen(case.problem.config.path, stdin=infile, stdout=outfile, stderr=devnull, universal_newlines=True, bufsize=-1)
+						except OSError:
+							raise CannotStartTestee(sys.exc_info()[1])
+						case.time_started = clock()
+						time_next_check = case.time_started + .15
+						if not case.maxtime:
+							while True:
+								exitcode, now = case.process.poll(), clock()
+								if exitcode is not None:
+									case.time_stopped = now
+									break
+								# For some reason (probably Microsoft's fault),
+								# msvcrt.kbhit() is slow as hell
+								else:
+									if now >= time_next_check:
+										if canceled():
+											raise CanceledByUser
+										else:
+											time_next_check = now + .15
+									time.sleep(0)
+						else:
+							time_end = case.time_started + case.maxtime
+							while True:
+								exitcode, now = case.process.poll(), clock()
+								if exitcode is not None:
+									case.time_stopped = now
+									break
+								elif now >= time_end:
+									raise TimeLimitExceeded
+								else:
+									if now >= time_next_check:
+										if canceled():
+											raise CanceledByUser
+										else:
+											time_next_check = now + .15
+									time.sleep(0)
+						if config.globalconf.force_zero_exitcode and case.process.returncode:
+							raise NonZeroExitCode(case.process.returncode)
+						callback()
+						case.has_called_back = True
+						outfile.seek(0)
+						return case.validate(outfile)
+		else:
+			case.infile.copy(case.problem.config.inname)
+			try:
+				try:
+					case.process = Popen(case.problem.config.path, stdin=devnull, stdout=devnull, stderr=STDOUT, preexec_fn=preexec_fn)
+				except MemoryError:
+					# If there is not enough memory for the forked test.py,
+					# opt for silent dropping of the limit
+					# TODO: show a warning somewhere
+					case.process = Popen(case.problem.config.path, stdin=devnull, stdout=devnull, stderr=STDOUT)
+			except OSError:
+				raise CannotStartTestee(sys.exc_info()[1])
+			case.time_started = clock()
+			time_next_check = case.time_started + .15
+			if not case.maxtime:
+				while True:
+					exitcode, now = case.process.poll(), clock()
+					if exitcode is not None:
+						case.time_stopped = now
+						break
+					else:
+						if now >= time_next_check:
+							if canceled():
+								raise CanceledByUser
+							else:
+								time_next_check = now + .15
+						time.sleep(0)
+			else:
+				time_end = case.time_started + case.maxtime
+				while True:
+					exitcode, now = case.process.poll(), clock()
+					if exitcode is not None:
+						case.time_stopped = now
+						break
+					elif now >= time_end:
+						raise TimeLimitExceeded
+					else:
+						if now >= time_next_check:
+							if canceled():
+								raise CanceledByUser
+							else:
+								time_next_check = now + .15
+						time.sleep(0)
+			if config.globalconf.force_zero_exitcode and case.process.returncode:
+				raise NonZeroExitCode(case.process.returncode)
+			callback()
+			case.has_called_back = True
+			with open(case.problem.config.outname, 'rU') as output:
+				return case.validate(output)
+
+
+# This is the only test case type not executing any programs to be tested
+class OutputOnlyTestCase(ValidatedTestCase):
+	__slots__ = ()
+	def cleanup(case): pass
+
+class BestOutputTestCase(ValidatedTestCase):
+	__slots__ = ()
+
+# This is the only test case type executing two programs simultaneously
+class ReactiveTestCase(TestCase):
+	__slots__ = ()
+	# The basic idea is to launch the program to be tested and the grader
+	# and to pipe their standard I/O from and to each other,
+	# and then to capture the grader's exit code and use it
+	# like the exit code of an output validator is used.
+
+
+def load_problem(prob, _types={'batch'   : BatchTestCase,
+                               'outonly' : OutputOnlyTestCase,
+                               'bestout' : BestOutputTestCase,
+                               'reactive': ReactiveTestCase}):
+	# We will need to iterate over these configuration variables twice
+	try:
+		len(prob.config.dummies)
+	except Exception:
+		prob.config.dummies = tuple(prob.config.dummies)
+	try:
+		len(prob.config.tests)
+	except Exception:
+		prob.config.tests = tuple(prob.config.tests)
+	
+	if options.legacy:
+		prob.config.usegroups = False
+		prob.config.tests = list(prob.config.tests)
+		for i, name in enumerate(prob.config.tests):
+			# Same here; we'll need to iterate over them twice
+			try:
+				l = len(name)
+			except Exception:
+				try:
+					name = tuple(name)
+				except TypeError:
+					name = (name,)
+				l = len(name)
+			if len(name) > 1:
+				prob.config.usegroups = True
+				break
+			elif not len(name):
+				prob.config.tests[i] = (name,)
+	
+	# First get prob.cache.padoutput right,
+	# then yield the actual test cases
+	for i in prob.config.dummies:
+		s = 'sample ' + str(i).zfill(prob.config.paddummies)
+		prob.cache.padoutput = max(prob.cache.padoutput, len(s))
+	if prob.config.usegroups:
+		for group in prob.config.tests:
+			for i in group:
+				s = str(i).zfill(prob.config.padtests)
+				prob.cache.padoutput = max(prob.cache.padoutput, len(s))
+		for i in prob.config.dummies:
+			s = str(i).zfill(prob.config.paddummies)
+			yield _types[prob.config.kind](prob, s, True, 0)
+		for group in prob.config.tests:
+			yield problem.TestGroup()
+			for i in group:
+				s = str(i).zfill(prob.config.padtests)
+				yield _types[prob.config.kind](prob, s, False, prob.config.pointmap.get(i, prob.config.pointmap.get(None, prob.config.maxexitcode if prob.config.maxexitcode else 1)))
+			yield problem.test_context_end
+	else:
+		for i in prob.config.tests:
+			s = str(i).zfill(prob.config.padtests)
+			prob.cache.padoutput = max(prob.cache.padoutput, len(s))
+		for i in prob.config.dummies:
+			s = str(i).zfill(prob.config.paddummies)
+			yield _types[prob.config.kind](prob, s, True, 0)
+		for i in prob.config.tests:
+			s = str(i).zfill(prob.config.padtests)
+			yield _types[prob.config.kind](prob, s, False, prob.config.pointmap.get(i, prob.config.pointmap.get(None, prob.config.maxexitcode if prob.config.maxexitcode else 1)))
\ No newline at end of file