mirror of
https://github.com/QingdaoU/OnlineJudge.git
synced 2024-09-21 08:23:20 +00:00
ae931b4dba
我一定是sb了,使用Python的多线程跑cpu密集型的应用。 由于Python的GIL的存在,导致在cpu上每次只能有一个线程在运行。如果一个线程运行,而且cpu时间是3秒的话,那实际运行时间将大约3秒。如果两个线程同时在进行,那总运行时间几乎要翻倍。 而换用多进程之后,单个进行运行实际时间只是稍微大于cpu时间,两个进程同时运行的时候,总的时间也是cpu时间稍微增加。 同时Python2在多进程之间运行类方法的时候存在bug,使用了 http://stackoverflow.com/questions/1816958/cant-pickle-type-instancemethod-when-using-pythons-multiprocessing-pool-ma/7309686#7309686 的方法进行patch。然后不同进程之间共享的时候,要防止循环依赖,参考 http://stackoverflow.com/questions/25382455/python-notimplementederror-pool-objects-cannot-be-passed-between-processes
206 lines
7.5 KiB
Python
206 lines
7.5 KiB
Python
# coding=utf-8
|
||
import json
|
||
import time
|
||
import commands
|
||
from multiprocessing import Pool
|
||
from settings import max_running_number, lrun_gid, lrun_uid, use_tmpfs
|
||
from consts import Language, Result
|
||
|
||
from copy_reg import pickle
|
||
from types import MethodType
|
||
|
||
|
||
# 下面两个函数告诉Python怎么pickle类实例中的方法,否则Python2会报错,是Python2的已知bug
|
||
def _pickle_method(method):
|
||
func_name = method.im_func.__name__
|
||
obj = method.im_self
|
||
cls = method.im_class
|
||
return _unpickle_method, (func_name, obj, cls)
|
||
|
||
|
||
def _unpickle_method(func_name, obj, cls):
|
||
for cls in cls.mro():
|
||
try:
|
||
func = cls.__dict__[func_name]
|
||
except KeyError:
|
||
pass
|
||
else:
|
||
break
|
||
return func.__get__(obj, cls)
|
||
|
||
|
||
class JudgeClientException(Exception):
|
||
pass
|
||
|
||
|
||
class JudgeClient(object):
|
||
def __init__(self, language, exec_file_path, max_cpu_time,
|
||
max_real_time, max_memory, test_case_dir):
|
||
"""
|
||
:param language: 语言,见consts.py
|
||
:param exec_file_path: 可执行文件路径
|
||
:param max_cpu_time: 最大cpu时间,单位ms
|
||
:param max_real_time: 最大执行时间,单位ms
|
||
:param max_memory: 最大内存,单位MB
|
||
:param test_case_dir: 测试用户文件夹路径
|
||
:return:返回结果list
|
||
"""
|
||
self.language = language
|
||
self.exec_file_path = exec_file_path
|
||
self.max_cpu_time = max_cpu_time
|
||
self.max_real_time = max_real_time
|
||
self.max_memory = max_memory
|
||
self.test_case_dir = test_case_dir
|
||
# 进程池
|
||
self.pool = Pool(processes=max_running_number)
|
||
# 结果数组
|
||
self.results = []
|
||
# 测试用例配置项
|
||
self.test_case_info = self.load_test_case_info()
|
||
|
||
def load_test_case_info(self):
|
||
# 读取测试用例信息 转换为dict
|
||
# try:
|
||
# f = open(self.test_case_dir + "info")
|
||
# return json.loads(f.read())
|
||
# except IOError:
|
||
# raise JudgeClientException("Test case config file not found")
|
||
# except ValueError:
|
||
# raise JudgeClientException("Test case config file format error")
|
||
return {"test_case_number": 2,
|
||
"test_cases":
|
||
{
|
||
"1": {"input_name": "1.in",
|
||
"output_name": "1.out",
|
||
"output_md5": "yyy",
|
||
"output_size": 100},
|
||
|
||
"2": {"input_name": "2.in",
|
||
"output_name": "2.out",
|
||
"output_md5": "yyy",
|
||
"output_size": 100}
|
||
}
|
||
}
|
||
|
||
def generate_command(self, test_case_id):
|
||
"""
|
||
设置相关运行限制 进制访问网络 如果启用tmpfs 就把代码输出写入tmpfs,否则写入硬盘
|
||
"""
|
||
# todo 系统调用白名单 chroot等参数
|
||
# fixme 时间的单位问题
|
||
command = "lrun" + \
|
||
" --max-cpu-time " + str(self.max_cpu_time / 1000.0) + \
|
||
" --max-real-time " + str(self.max_real_time / 1000.0) + \
|
||
" --max-memory " + str(self.max_memory * 1000 * 1000) + \
|
||
" --network false" + \
|
||
" --uid " + str(lrun_uid) + \
|
||
" --gid " + str(lrun_gid)
|
||
#if use_tmpfs:
|
||
# command += (" --tmpfs /var " +
|
||
# str(int(self.test_case_info["test_cases"][str(test_case_id)]["output_size"] * 1.2)))
|
||
|
||
if self.language == Language.JAVA:
|
||
command += (" java " + self.exec_file_path)
|
||
else:
|
||
command += (" " + self.exec_file_path)
|
||
# fixme 输出路径
|
||
command += (" 0<" + self.test_case_dir + str(test_case_id) + ".in" +
|
||
" 1>" + "/var/judge/" + str(test_case_id) + ".out" +
|
||
" 3>&2")
|
||
return command
|
||
|
||
def parse_lrun_output(self, output):
|
||
lines = output.split("\n")
|
||
if len(lines) != 7:
|
||
raise JudgeClientException("Lrun result parse error")
|
||
result = {}
|
||
# 将lrun输出的各种带下划线 不带下划线的字符串统一处理
|
||
translate = {"MEMORY": "memory",
|
||
"CPUTIME": "cpu_time",
|
||
"CPU_TIME": "cpu_time",
|
||
"REALTIME": "real_time",
|
||
"REAL_TIME": "real_time",
|
||
"TERMSIG": "term_sig",
|
||
"SIGNALED": "siginaled",
|
||
"EXITCODE": "exit_code",
|
||
"EXCEED": "exceed"}
|
||
for line in lines:
|
||
name = line[:9].strip(" ")
|
||
value = line[9:]
|
||
print name, value
|
||
if name == "MEMORY":
|
||
result[translate[name]] = int(value)
|
||
elif name == "CPUTIME":
|
||
result[translate[name]] = float(value) * 1000
|
||
elif name == "REALTIME":
|
||
result[translate[name]] = float(value) * 1000
|
||
elif name == "EXITCODE":
|
||
result[translate[name]] = int(value)
|
||
elif name == "TERMSIG":
|
||
result[translate[name]] = int(value)
|
||
elif name == "SIGNALED":
|
||
result[translate[name]] = int(value)
|
||
elif name == "EXCEED":
|
||
if value == "none":
|
||
result[translate[name]] = None
|
||
else:
|
||
result[translate[name]] = translate[value]
|
||
return result
|
||
|
||
def judge_one(self, test_case_id):
|
||
# 运行lrun程序 接收返回值
|
||
command = self.generate_command(test_case_id)
|
||
status_code, output = commands.getstatusoutput(command)
|
||
if status_code:
|
||
raise JudgeClientException(output)
|
||
run_result = self.parse_lrun_output(output)
|
||
|
||
run_result["test_case_id"] = test_case_id
|
||
|
||
# 如果返回值非0,代表非正常结束
|
||
if run_result["exit_code"] or run_result["term_sig"] or run_result["siginaled"]:
|
||
run_result["result"] = Result.RUNTIME_ERROR
|
||
return run_result
|
||
|
||
# 代表内存或者时间超过限制了
|
||
if run_result["exceed"]:
|
||
if run_result["exceed"] == "memory":
|
||
run_result["result"] = Result.MEMORY_LIMIT_EXCEEDED
|
||
elif run_result["exceed"] in ["cpu_time", "real_time"]:
|
||
run_result["result"] = Result.TIME_LIMIT_EXCEEDED
|
||
else:
|
||
run_result["result"] = Result.SYSTEM_ERROR
|
||
return run_result
|
||
|
||
# 下面就是代码正常运行了
|
||
run_result["result"] = Result.ACCEPTED
|
||
return run_result
|
||
|
||
def collect_result(self, result):
|
||
self.results.append(result)
|
||
|
||
def run(self):
|
||
# 添加到任务队列
|
||
for i in range(self.test_case_info["test_case_number"]):
|
||
self.pool.apply_async(self.judge_one, args=(i + 1, ),
|
||
callback=self.collect_result)
|
||
self.pool.close()
|
||
self.pool.join()
|
||
print self.results
|
||
|
||
def __getstate__(self):
|
||
# 不同的pool之间进行pickle的时候要排除自己,否则报错
|
||
self_dict = self.__dict__.copy()
|
||
del self_dict['pool']
|
||
return self_dict
|
||
|
||
|
||
pickle(MethodType, _pickle_method, _unpickle_method)
|
||
client = JudgeClient(language=Language.C,
|
||
exec_file_path="/var/judge/a.out",
|
||
max_cpu_time=1000000,
|
||
max_real_time=200000,
|
||
max_memory=1,
|
||
test_case_dir="/var/test_case/1/")
|
||
client.run()
|