import asyncio
import json
import logging
import os
import time
import traceback
from asyncio import Queue
from datetime import datetime
from typing import AsyncGenerator, List, Optional

from fastapi import APIRouter, Query, Response
from fastapi.responses import StreamingResponse
from pydantic import BaseModel, Field, PrivateAttr

from aworld.models.model_response import ModelResponse
from aworld.utils.common import get_local_ip
from aworldspace.db.db import AworldTaskDB, PostgresTaskDB, SqliteTaskDB
from aworldspace.utils.job import call_pipeline, generate_openai_chat_completion
from aworldspace.utils.log import task_logger
from base import AworldTask, AworldTaskForm, AworldTaskResult, OpenAIChatCompletionForm, OpenAIChatMessage
from config import ROOT_DIR
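# Sentinel enqueued by `stop()`; the executor loop compares it by identity, so a
# bare `object()` is enough to signal shutdown without colliding with real tasks.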
__STOP_TASK__ = object()


class AworldTaskExecutor(BaseModel):
    """
    Task executor.

    - Loads tasks from the DB and executes them in a loop.
    - Uses a bounded semaphore to limit concurrent tasks.
    """
    _task_db: AworldTaskDB = PrivateAttr()
    _tasks: Queue = PrivateAttr()
    # declared as a private attribute so pydantic accepts the assignment in __init__
    _semaphore: asyncio.BoundedSemaphore = PrivateAttr()
    # env vars are strings, so cast before pydantic validates the field
    max_concurrent: int = Field(
        default=int(os.environ.get("AWORLD_MAX_CONCURRENT_TASKS", 2)),
        description="max concurrent tasks",
    )

    def __init__(self, task_db: AworldTaskDB):
        super().__init__()
        self._task_db = task_db
        self._tasks = Queue()
        self._semaphore = asyncio.BoundedSemaphore(self.max_concurrent)
    async def start(self):
        """
        Execute tasks in a loop.
        """
        await asyncio.sleep(5)
        logging.info(f"[task executor] start, max concurrent is {self.max_concurrent}")
        while True:
            # load more tasks whenever the queue runs dry
            if self._tasks.empty():
                await self.load_task()
            task = await self._tasks.get()
            if not task:
                logging.info("task is none")
                continue
            if task is __STOP_TASK__:
                logging.info("[task executor] stop, all tasks finished")
                break
            # acquire a concurrency slot, then run the task in the background
            await self._semaphore.acquire()
            asyncio.create_task(self._run_task_and_release_semaphore(task))
    async def stop(self):
        logging.info("task executor stop, wait for all tasks to finish")
        await self._tasks.put(__STOP_TASK__)

    async def _run_task_and_release_semaphore(self, task: AworldTask):
        """
        Execute the task and release the semaphore when done.
        """
        start_time = time.time()
        logging.info(f"[task executor] execute task#{task.task_id} start, lock acquired")
        try:
            await self.execute_task(task)
        finally:
            # this block also runs when the task failed, so release the slot
            # unconditionally and log "finished" rather than "success"
            self._semaphore.release()
            logging.info(f"[task executor] execute task#{task.task_id} finished, use time {time.time() - start_time:.2f}s")
    async def load_task(self):
        # env vars are strings; asyncio.sleep needs a number
        interval = int(os.environ.get("AWORLD_TASK_LOAD_INTERVAL", 10))
        # poll in a loop rather than recursing, so long idle periods cannot
        # grow the call stack
        while True:
            # free execution slots, read from the semaphore's internal counter
            need_load = self._semaphore._value
            if need_load <= 0:
                logging.info(f"[task executor] runner is busy, wait {interval}s and retry")
                await asyncio.sleep(interval)
                continue
            tasks = await self._task_db.query_tasks_by_status(status="INIT", nums=need_load)
            logging.info(f"[task executor] load {len(tasks)} tasks from db (need {need_load})")
            if not tasks:
                logging.info(f"[task executor] no task to load, wait {interval}s and retry")
                await asyncio.sleep(interval)
                continue
            for task in tasks:
                task.mark_running()
                await self._task_db.update_task(task)
                await self._tasks.put(task)
            return True
    async def execute_task(self, task: AworldTask):
        """
        Execute the task and persist either its result or its failure state.
        """
        try:
            result = await self._execute_task(task)
            task.mark_success()
            await self._task_db.update_task(task)
            await self._task_db.save_task_result(result)
            task_logger.log_task_submission(task, "execute_finished", task_result=result)
        except Exception as err:
            task.mark_failed()
            await self._task_db.update_task(task)
            traceback.print_exc()
            task_logger.log_task_submission(task, "execute_failed", details=f"err is {err}")
    async def _execute_task(self, task: AworldTask):
        # build the chat-completion request for the agent
        messages = [
            OpenAIChatMessage(role="user", content=task.agent_input)
        ]
        form_data = OpenAIChatCompletionForm(
            model=task.agent_id,
            messages=messages,
            stream=True,
            user={
                "user_id": task.user_id,
                "session_id": task.session_id,
                "task_id": task.task_id,
                "aworld_task": task.model_dump_json()
            }
        )
        data = await generate_openai_chat_completion(form_data)
        task_result = {}
        task.node_id = get_local_ip()
        items = []
        md_file = ""

        def parse_item(item_content: str) -> Optional[ModelResponse]:
            # SSE lines look like "data: {...}"; "data: [DONE]" ends the stream
            if item_content == "data: [DONE]":
                return None
            return ModelResponse.from_openai_stream_chunk(json.loads(item_content.replace("data:", "")))

        if data.body_iterator and isinstance(data.body_iterator, AsyncGenerator):
            async for item_content in data.body_iterator:
                item = parse_item(item_content)
                items.append(item)
                if not item:
                    continue
                if item.content:
                    md_file = task_logger.log_task_result(task, item)
                logging.info(f"task#{task.task_id} response data chunk is: {item}"[:500])
                if isinstance(item.raw_response, dict) and item.raw_response.get('task_output_meta'):
                    task_result = item.raw_response.get('task_output_meta')
        data = {
            "task_result": task_result,
            "md_file": md_file,
            "replays_file": f"trace_data/{datetime.now().strftime('%Y%m%d')}/{get_local_ip()}/replays/task_replay_{task.task_id}.json"
        }
        return AworldTaskResult(task=task, server_host=get_local_ip(), data=data)
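# A minimal sketch of driving the executor directly (not part of the original
# module). It uses only names imported above; the sqlite URL is an example
# value, not the repository's default.
#
#   async def _demo_run_executor():
#       db = SqliteTaskDB(db_path="sqlite:///./aworld.db")   # hypothetical path
#       executor = AworldTaskExecutor(task_db=db)
#       loop_task = asyncio.create_task(executor.start())
#       await executor.stop()      # enqueue __STOP_TASK__
#       await loop_task            # the loop exits once the sentinel is consumed
#
#   asyncio.run(_demo_run_executor())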
class AworldTaskManager(BaseModel):
    _task_db: AworldTaskDB = PrivateAttr()
    _task_executor: AworldTaskExecutor = PrivateAttr()

    def __init__(self, task_db: AworldTaskDB):
        super().__init__()
        self._task_db = task_db
        self._task_executor = AworldTaskExecutor(task_db=self._task_db)

    async def start_task_executor(self):
        asyncio.create_task(self._task_executor.start())

    async def stop_task_executor(self):
        # delegate to the executor so the proper stop sentinel is enqueued;
        # putting None on the queue would just be skipped by the loop
        await self._task_executor.stop()
    async def submit_task(self, task: AworldTask):
        # save to db, then log the submission
        await self._task_db.insert_task(task)
        task_logger.log_task_submission(task, status="init")
        return AworldTaskResult(task=task)

    async def load_one_unfinished_task(self) -> Optional[AworldTask]:
        # load one INIT task from the db and mark it running
        tasks = await self._task_db.query_tasks_by_status(status="INIT", nums=1)
        if not tasks:
            return None
        cur_task = tasks[0]
        cur_task.mark_running()
        await self._task_db.update_task(cur_task)
        return cur_task
    async def get_task_result(self, task_id: str) -> Optional[AworldTaskResult]:
        task = await self._task_db.query_task_by_id(task_id)
        if task:
            task_result = await self._task_db.query_latest_task_result_by_id(task_id)
            if task_result:
                return task_result
            return AworldTaskResult(task=task)

    async def get_batch_task_results(self, task_ids: List[str]) -> List[dict]:
        """
        Batch-retrieve task results in dictionary form.
        Each dict contains: task (required) and task_result (may be None).
        """
        results = []
        for task_id in task_ids:
            task = await self._task_db.query_task_by_id(task_id)
            if task:
                task_result = await self._task_db.query_latest_task_result_by_id(task_id)
                results.append({
                    "task": task,
                    "task_result": task_result  # may be None
                })
        return results
    async def query_and_download_task_results(
        self,
        start_time: Optional[datetime] = None,
        end_time: Optional[datetime] = None,
        task_id: Optional[str] = None,
        page_size: int = 100
    ) -> List[dict]:
        """
        Query tasks and fetch their results, filtered by time range and/or task_id.
        """
        # build the query filter once; it does not change between pages
        filter_dict = {}
        if start_time:
            filter_dict['start_time'] = start_time
        if end_time:
            filter_dict['end_time'] = end_time
        if task_id:
            filter_dict['task_id'] = task_id

        all_results = []
        page_num = 1
        while True:
            # page through matching tasks
            page_result = await self._task_db.page_query_tasks(
                filter=filter_dict,
                page_size=page_size,
                page_num=page_num
            )
            if not page_result['items']:
                break
            for task in page_result['items']:
                # the task result may not exist yet
                task_result = await self._task_db.query_latest_task_result_by_id(task.task_id)
                result_data = {
                    "task_id": task.task_id,
                    "agent_id": task.agent_id,
                    "status": task.status,
                    "created_at": task.created_at.isoformat() if task.created_at else None,
                    "updated_at": task.updated_at.isoformat() if task.updated_at else None,
                    "user_id": task.user_id,
                    "session_id": task.session_id,
                    "node_id": task.node_id,
                    "client_id": task.client_id,
                    "task_data": task.model_dump(mode='json'),
                    "has_result": task_result is not None,
                    "server_host": task_result.server_host if task_result else None,
                    "result_data": task_result.data if task_result else None,
                }
                all_results.append(result_data)
            if len(page_result['items']) < page_size:
                break
            page_num += 1
        return all_results
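# A minimal usage sketch for the manager (illustrative only; the AworldTask
# fields shown are assumptions, not the actual schema from `base`):
#
#   async def _demo_submit_and_poll(manager: AworldTaskManager):
#       task = AworldTask(task_id="t-1", agent_id="my_agent",   # hypothetical fields
#                         agent_input="hello", user_id="u-1")
#       await manager.submit_task(task)
#       await manager.start_task_executor()
#       result = await manager.get_task_result("t-1")
#       print(result)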
########################################################################################
# API
########################################################################################

router = APIRouter()

task_db_path = os.environ.get("AWORLD_TASK_DB_PATH", f"sqlite:///{ROOT_DIR}/db/aworld.db")
if task_db_path.startswith("sqlite://"):
    task_db = SqliteTaskDB(db_path=task_db_path)
elif task_db_path.startswith("mysql://"):
    # todo: add mysql task db; fail fast instead of passing None downstream
    raise NotImplementedError("mysql task db is not supported yet")
elif task_db_path.startswith("postgresql://") or task_db_path.startswith("postgresql+"):
    task_db = PostgresTaskDB(db_url=task_db_path)
else:
    raise ValueError("task_db_path is not a valid sqlite, mysql or postgresql path")

task_manager = AworldTaskManager(task_db)
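# Example environment configuration (the variable names are the ones this module
# reads; the values are illustrative):
#
#   export AWORLD_TASK_DB_PATH="postgresql://user:pass@localhost:5432/aworld"
#   export AWORLD_MAX_CONCURRENT_TASKS=4
#   export AWORLD_TASK_LOAD_INTERVAL=10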
async def submit_task(form_data: AworldTaskForm) -> Optional[AworldTaskResult]:
    # validate before logging: form_data.task may be None
    if not form_data.task:
        raise ValueError("task is empty")
    logging.info(f"submit task#{form_data.task.task_id} start")
    try:
        task_result = await task_manager.submit_task(form_data.task)
        logging.info(f"submit task#{form_data.task.task_id} success")
        return task_result
    except Exception as err:
        traceback.print_exc()
        logging.error(f"submit task#{form_data.task.task_id} failed, err is {err}")
        raise ValueError("submit task failed, please see logs for details")
async def get_task_result(task_id: str) -> Optional[AworldTaskResult]:
    if not task_id:
        raise ValueError("task_id is empty")
    logging.info(f"get task result#{task_id} start")
    try:
        task_result = await task_manager.get_task_result(task_id)
        logging.info(f"get task result#{task_id} success, task result is {task_result}")
        return task_result
    except Exception as err:
        traceback.print_exc()
        logging.error(f"get task result#{task_id} failed, err is {err}")
        raise ValueError("get task result failed, please see logs for details")
async def get_batch_task_results(task_ids: List[str]) -> List[dict]:
    if not task_ids:
        raise ValueError("task_ids is empty")
    logging.info(f"get batch task results start, task_ids: {task_ids}")
    try:
        batch_results = await task_manager.get_batch_task_results(task_ids)
        logging.info(f"get batch task results success, found {len(batch_results)} results")
        return batch_results
    except Exception as err:
        traceback.print_exc()
        logging.error(f"get batch task results failed, err is {err}")
        raise ValueError("get batch task results failed, please see logs for details")
async def download_task_results(
    start_time: Optional[str] = Query(None, description="Start time, format: YYYY-MM-DD HH:MM:SS"),
    end_time: Optional[str] = Query(None, description="End time, format: YYYY-MM-DD HH:MM:SS"),
    task_id: Optional[str] = Query(None, description="Task ID"),
    page_size: int = Query(100, ge=1, le=1000, description="Page size")
) -> StreamingResponse:
    """
    Download task results as a jsonl file.
    Supported query parameters: time range (based on creation time) and task_id.
    """
    logging.info(f"download task results start, start_time: {start_time}, end_time: {end_time}, task_id: {task_id}")
    try:
        start_datetime = None
        end_datetime = None
        if start_time:
            try:
                start_datetime = datetime.strptime(start_time, "%Y-%m-%d %H:%M:%S")
            except ValueError:
                raise ValueError("start_time format is invalid, please use the YYYY-MM-DD HH:MM:SS format")
        if end_time:
            try:
                end_datetime = datetime.strptime(end_time, "%Y-%m-%d %H:%M:%S")
            except ValueError:
                raise ValueError("end_time format is invalid, please use the YYYY-MM-DD HH:MM:SS format")
        results = await task_manager.query_and_download_task_results(
            start_time=start_datetime,
            end_time=end_datetime,
            task_id=task_id,
            page_size=page_size
        )
        if not results:
            logging.info("no task results found")

            def generate_empty():
                yield ""

            return StreamingResponse(
                generate_empty(),
                media_type="application/jsonl",
                headers={"Content-Disposition": "attachment; filename=task_results_empty.jsonl"}
            )

        # stream jsonl content, one result per line
        def generate_jsonl():
            for result in results:
                yield json.dumps(result, ensure_ascii=False) + "\n"

        timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
        filename = f"task_results_{timestamp}.jsonl"
        logging.info(f"download task results success, total: {len(results)} results")
        return StreamingResponse(
            generate_jsonl(),
            media_type="application/jsonl",
            headers={"Content-Disposition": f"attachment; filename={filename}"}
        )
    except Exception as err:
        traceback.print_exc()
        logging.error(f"download task results failed, err is {err}")
        raise ValueError(f"download task results failed: {str(err)}")
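# The @router decorators for these handlers are not part of this excerpt.
# A hypothetical wiring (the paths are assumptions, not the repository's
# actual routes) could look like:
#
#   router.post("/tasks")(submit_task)
#   router.get("/tasks/{task_id}")(get_task_result)
#   router.post("/tasks/batch")(get_batch_task_results)
#   router.get("/tasks/download")(download_task_results)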