[bug?] shall we use specific_trace replacing trace for experiment_list? · Issue #1244 · microsoft/RD-Agent

RD-Agent/rdagent/scenarios/qlib/proposal/model_proposal.py

Lines 86 to 127 in 59af538

    
           if len(trace.hist) == 0: 
        
               hypothesis_and_feedback = "No previous hypothesis and feedback available since it's the first round." 
        
           else: 
        
               specific_trace = Trace(trace.scen) 
        
               for i in range(len(trace.hist) - 1, -1, -1):  # Reverse iteration 
        
                   if not hasattr(trace.hist[i][0].hypothesis, "action") or trace.hist[i][0].hypothesis.action == "model": 
        
                       if last_experiment is None: 
        
                           last_experiment = trace.hist[i][0] 
        
                           last_feedback = trace.hist[i][1] 
        
                       if trace.hist[i][1].decision is True and sota_experiment is None: 
        
                           sota_experiment = trace.hist[i][0] 
        
                           sota_feedback = trace.hist[i][1] 
        
                       specific_trace.hist.insert(0, trace.hist[i]) 
        
               if len(specific_trace.hist) > 0: 
        
                   specific_trace.hist.reverse() 
        
                   hypothesis_and_feedback = T("scenarios.qlib.prompts:hypothesis_and_feedback").r( 
        
                       trace=specific_trace, 
        
                   ) 
        
               else: 
        
                   hypothesis_and_feedback = "No previous hypothesis and feedback available." 
        
           last_hypothesis_and_feedback = ( 
        
               T("scenarios.qlib.prompts:last_hypothesis_and_feedback").r( 
        
                   experiment=last_experiment, feedback=last_feedback 
        
               ) 
        
               if last_experiment is not None 
        
               else "No previous hypothesis and feedback available since it's the first round." 
        
           ) 
        
           sota_hypothesis_and_feedback = ( 
        
               T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r( 
        
                   experiment=sota_experiment, feedback=sota_feedback 
        
               ) 
        
               if sota_experiment is not None 
        
               else "No SOTA hypothesis and feedback available since previous experiments were not accepted." 
        
           ) 
        
           experiment_list: List[ModelExperiment] = [t[0] for t in trace.hist] 
        
           model_list = [] 
        
           for experiment in experiment_list: 
        
               model_list.extend(experiment.sub_tasks)

for fin_quant scenarios, there may both factor experiment and model experiment be in the trace, so if we want to gather all of model tasks, we need to list all the model experiments, shall we?

May be like that:

experiment_list: List[FactorExperiment] = [
t[0] for t in trace.hist
if isinstance(t[0], FactorExperiment)
]

Same problem is in convert_response func and also in factor_proposal.py

RD-Agent/rdagent/scenarios/qlib/proposal/model_proposal.py

Lines 40 to 165 in 59af538

    
                           if trace.hist[i][1].decision: 
        
                               sota_hypothesis_and_feedback = T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r( 
        
                                   experiment=trace.hist[i][0], feedback=trace.hist[i][1] 
        
                               ) 
        
                               break 
        
                       else: 
        
                           sota_hypothesis_and_feedback = ( 
        
                               "No SOTA hypothesis and feedback available since previous experiments were not accepted." 
        
                           ) 
        
                   context_dict = { 
        
                       "hypothesis_and_feedback": hypothesis_and_feedback, 
        
                       "last_hypothesis_and_feedback": last_hypothesis_and_feedback, 
        
                       "SOTA_hypothesis_and_feedback": sota_hypothesis_and_feedback, 
        
                       "RAG": "1. In Quantitative Finance, market data could be time-series, and GRU model/LSTM model are suitable for them. Do not generate GNN model as for now.\n2. The training data consists of less than 1 million samples for the training set and approximately 250,000 samples for the validation set. Please design the hyperparameters accordingly and control the model size. This has a significant impact on the training results. If you believe that the previous model itself is good but the training hyperparameters or model hyperparameters are not optimal, you can return the same model and adjust these parameters instead.", 
        
                       "hypothesis_output_format": T("scenarios.qlib.prompts:hypothesis_output_format").r(), 
        
                       "hypothesis_specification": T("scenarios.qlib.prompts:model_hypothesis_specification").r(), 
        
                   } 
        
                   return context_dict, True 
        
               def convert_response(self, response: str) -> Hypothesis: 
        
                   response_dict = json.loads(response) 
        
                   hypothesis = QlibModelHypothesis( 
        
                       hypothesis=response_dict.get("hypothesis"), 
        
                       reason=response_dict.get("reason"), 
        
                       concise_reason=response_dict.get("concise_reason"), 
        
                       concise_observation=response_dict.get("concise_observation"), 
        
                       concise_justification=response_dict.get("concise_justification"), 
        
                       concise_knowledge=response_dict.get("concise_knowledge"), 
        
                   ) 
        
                   return hypothesis 
        
           class QlibModelHypothesis2Experiment(ModelHypothesis2Experiment): 
        
               def prepare_context(self, hypothesis: Hypothesis, trace: Trace) -> Tuple[dict, bool]: 
        
                   if isinstance(trace.scen, QlibQuantScenario): 
        
                       scenario = trace.scen.get_scenario_all_desc(action="model") 
        
                   else: 
        
                       scenario = trace.scen.get_scenario_all_desc() 
        
                   experiment_output_format = T("scenarios.qlib.prompts:model_experiment_output_format").r() 
        
                   last_experiment = None 
        
                   last_feedback = None 
        
                   sota_experiment = None 
        
                   sota_feedback = None 
        
                   if len(trace.hist) == 0: 
        
                       hypothesis_and_feedback = "No previous hypothesis and feedback available since it's the first round." 
        
                   else: 
        
                       specific_trace = Trace(trace.scen) 
        
                       for i in range(len(trace.hist) - 1, -1, -1):  # Reverse iteration 
        
                           if not hasattr(trace.hist[i][0].hypothesis, "action") or trace.hist[i][0].hypothesis.action == "model": 
        
                               if last_experiment is None: 
        
                                   last_experiment = trace.hist[i][0] 
        
                                   last_feedback = trace.hist[i][1] 
        
                               if trace.hist[i][1].decision is True and sota_experiment is None: 
        
                                   sota_experiment = trace.hist[i][0] 
        
                                   sota_feedback = trace.hist[i][1] 
        
                               specific_trace.hist.insert(0, trace.hist[i]) 
        
                       if len(specific_trace.hist) > 0: 
        
                           specific_trace.hist.reverse() 
        
                           hypothesis_and_feedback = T("scenarios.qlib.prompts:hypothesis_and_feedback").r( 
        
                               trace=specific_trace, 
        
                           ) 
        
                       else: 
        
                           hypothesis_and_feedback = "No previous hypothesis and feedback available." 
        
                   last_hypothesis_and_feedback = ( 
        
                       T("scenarios.qlib.prompts:last_hypothesis_and_feedback").r( 
        
                           experiment=last_experiment, feedback=last_feedback 
        
                       ) 
        
                       if last_experiment is not None 
        
                       else "No previous hypothesis and feedback available since it's the first round." 
        
                   ) 
        
                   sota_hypothesis_and_feedback = ( 
        
                       T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r( 
        
                           experiment=sota_experiment, feedback=sota_feedback 
        
                       ) 
        
                       if sota_experiment is not None 
        
                       else "No SOTA hypothesis and feedback available since previous experiments were not accepted." 
        
                   ) 
        
                   experiment_list: List[ModelExperiment] = [t[0] for t in trace.hist] 
        
                   model_list = [] 
        
                   for experiment in experiment_list: 
        
                       model_list.extend(experiment.sub_tasks) 
        
                   return { 
        
                       "target_hypothesis": str(hypothesis), 
        
                       "scenario": scenario, 
        
                       "hypothesis_and_feedback": hypothesis_and_feedback, 
        
                       "last_hypothesis_and_feedback": last_hypothesis_and_feedback, 
        
                       "SOTA_hypothesis_and_feedback": sota_hypothesis_and_feedback, 
        
                       "experiment_output_format": experiment_output_format, 
        
                       "target_list": model_list, 
        
                       "RAG": "Note, the training data consists of less than 1 million samples for the training set and approximately 250,000 samples for the validation set. Please design the hyperparameters accordingly and control the model size. This has a significant impact on the training results. If you believe that the previous model itself is good but the training hyperparameters or model hyperparameters are not optimal, you can return the same model and adjust these parameters instead.", 
        
                   }, True 
        
               def convert_response(self, response: str, hypothesis: Hypothesis, trace: Trace) -> ModelExperiment: 
        
                   response_dict = json.loads(response) 
        
                   tasks = [] 
        
                   for model_name in response_dict: 
        
                       description = response_dict[model_name]["description"] 
        
                       formulation = response_dict[model_name]["formulation"] 
        
                       architecture = response_dict[model_name]["architecture"] 
        
                       variables = response_dict[model_name]["variables"] 
        
                       hyperparameters = response_dict[model_name]["hyperparameters"] 
        
                       training_hyperparameters = response_dict[model_name]["training_hyperparameters"] 
        
                       model_type = response_dict[model_name]["model_type"] 
        
                       tasks.append( 
        
                           ModelTask( 
        
                               name=model_name, 
        
                               description=description, 
        
                               formulation=formulation, 
        
                               architecture=architecture, 
        
                               variables=variables, 
        
                               hyperparameters=hyperparameters, 
        
                               training_hyperparameters=training_hyperparameters, 
        
                               model_type=model_type, 
        
                           ) 
        
                       ) 
        
                   exp = QlibModelExperiment(tasks, hypothesis=hypothesis) 
        
                   exp.based_experiments = [t[0] for t in trace.hist if t[1]] 
        
                   return exp

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

Uh oh!

Uh oh!

[bug?] shall we use specific_trace replacing trace for experiment_list? #1244

Metadata

Assignees

Labels

Type

Projects

Milestone

Relationships

Development

	if len(trace.hist) == 0:
	hypothesis_and_feedback = "No previous hypothesis and feedback available since it's the first round."
	else:
	specific_trace = Trace(trace.scen)
	for i in range(len(trace.hist) - 1, -1, -1): # Reverse iteration
	if not hasattr(trace.hist[i][0].hypothesis, "action") or trace.hist[i][0].hypothesis.action == "model":
	if last_experiment is None:
	last_experiment = trace.hist[i][0]
	last_feedback = trace.hist[i][1]
	if trace.hist[i][1].decision is True and sota_experiment is None:
	sota_experiment = trace.hist[i][0]
	sota_feedback = trace.hist[i][1]
	specific_trace.hist.insert(0, trace.hist[i])
	if len(specific_trace.hist) > 0:
	specific_trace.hist.reverse()
	hypothesis_and_feedback = T("scenarios.qlib.prompts:hypothesis_and_feedback").r(
	trace=specific_trace,
	)
	else:
	hypothesis_and_feedback = "No previous hypothesis and feedback available."

	last_hypothesis_and_feedback = (
	T("scenarios.qlib.prompts:last_hypothesis_and_feedback").r(
	experiment=last_experiment, feedback=last_feedback
	)
	if last_experiment is not None
	else "No previous hypothesis and feedback available since it's the first round."
	)

	sota_hypothesis_and_feedback = (
	T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r(
	experiment=sota_experiment, feedback=sota_feedback
	)
	if sota_experiment is not None
	else "No SOTA hypothesis and feedback available since previous experiments were not accepted."
	)

	experiment_list: List[ModelExperiment] = [t[0] for t in trace.hist]

	model_list = []
	for experiment in experiment_list:
	model_list.extend(experiment.sub_tasks)

	if trace.hist[i][1].decision:
	sota_hypothesis_and_feedback = T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r(
	experiment=trace.hist[i][0], feedback=trace.hist[i][1]
	)
	break
	else:
	sota_hypothesis_and_feedback = (
	"No SOTA hypothesis and feedback available since previous experiments were not accepted."
	)

	context_dict = {
	"hypothesis_and_feedback": hypothesis_and_feedback,
	"last_hypothesis_and_feedback": last_hypothesis_and_feedback,
	"SOTA_hypothesis_and_feedback": sota_hypothesis_and_feedback,
	"RAG": "1. In Quantitative Finance, market data could be time-series, and GRU model/LSTM model are suitable for them. Do not generate GNN model as for now.\n2. The training data consists of less than 1 million samples for the training set and approximately 250,000 samples for the validation set. Please design the hyperparameters accordingly and control the model size. This has a significant impact on the training results. If you believe that the previous model itself is good but the training hyperparameters or model hyperparameters are not optimal, you can return the same model and adjust these parameters instead.",
	"hypothesis_output_format": T("scenarios.qlib.prompts:hypothesis_output_format").r(),
	"hypothesis_specification": T("scenarios.qlib.prompts:model_hypothesis_specification").r(),
	}
	return context_dict, True

	def convert_response(self, response: str) -> Hypothesis:
	response_dict = json.loads(response)
	hypothesis = QlibModelHypothesis(
	hypothesis=response_dict.get("hypothesis"),
	reason=response_dict.get("reason"),
	concise_reason=response_dict.get("concise_reason"),
	concise_observation=response_dict.get("concise_observation"),
	concise_justification=response_dict.get("concise_justification"),
	concise_knowledge=response_dict.get("concise_knowledge"),
	)
	return hypothesis


	class QlibModelHypothesis2Experiment(ModelHypothesis2Experiment):
	def prepare_context(self, hypothesis: Hypothesis, trace: Trace) -> Tuple[dict, bool]:
	if isinstance(trace.scen, QlibQuantScenario):
	scenario = trace.scen.get_scenario_all_desc(action="model")
	else:
	scenario = trace.scen.get_scenario_all_desc()
	experiment_output_format = T("scenarios.qlib.prompts:model_experiment_output_format").r()

	last_experiment = None
	last_feedback = None
	sota_experiment = None
	sota_feedback = None

	if len(trace.hist) == 0:
	hypothesis_and_feedback = "No previous hypothesis and feedback available since it's the first round."
	else:
	specific_trace = Trace(trace.scen)
	for i in range(len(trace.hist) - 1, -1, -1): # Reverse iteration
	if not hasattr(trace.hist[i][0].hypothesis, "action") or trace.hist[i][0].hypothesis.action == "model":
	if last_experiment is None:
	last_experiment = trace.hist[i][0]
	last_feedback = trace.hist[i][1]
	if trace.hist[i][1].decision is True and sota_experiment is None:
	sota_experiment = trace.hist[i][0]
	sota_feedback = trace.hist[i][1]
	specific_trace.hist.insert(0, trace.hist[i])
	if len(specific_trace.hist) > 0:
	specific_trace.hist.reverse()
	hypothesis_and_feedback = T("scenarios.qlib.prompts:hypothesis_and_feedback").r(
	trace=specific_trace,
	)
	else:
	hypothesis_and_feedback = "No previous hypothesis and feedback available."

	last_hypothesis_and_feedback = (
	T("scenarios.qlib.prompts:last_hypothesis_and_feedback").r(
	experiment=last_experiment, feedback=last_feedback
	)
	if last_experiment is not None
	else "No previous hypothesis and feedback available since it's the first round."
	)

	sota_hypothesis_and_feedback = (
	T("scenarios.qlib.prompts:sota_hypothesis_and_feedback").r(
	experiment=sota_experiment, feedback=sota_feedback
	)
	if sota_experiment is not None
	else "No SOTA hypothesis and feedback available since previous experiments were not accepted."
	)

	experiment_list: List[ModelExperiment] = [t[0] for t in trace.hist]

	model_list = []
	for experiment in experiment_list:
	model_list.extend(experiment.sub_tasks)

	return {
	"target_hypothesis": str(hypothesis),
	"scenario": scenario,
	"hypothesis_and_feedback": hypothesis_and_feedback,
	"last_hypothesis_and_feedback": last_hypothesis_and_feedback,
	"SOTA_hypothesis_and_feedback": sota_hypothesis_and_feedback,
	"experiment_output_format": experiment_output_format,
	"target_list": model_list,
	"RAG": "Note, the training data consists of less than 1 million samples for the training set and approximately 250,000 samples for the validation set. Please design the hyperparameters accordingly and control the model size. This has a significant impact on the training results. If you believe that the previous model itself is good but the training hyperparameters or model hyperparameters are not optimal, you can return the same model and adjust these parameters instead.",
	}, True

	def convert_response(self, response: str, hypothesis: Hypothesis, trace: Trace) -> ModelExperiment:
	response_dict = json.loads(response)
	tasks = []
	for model_name in response_dict:
	description = response_dict[model_name]["description"]
	formulation = response_dict[model_name]["formulation"]
	architecture = response_dict[model_name]["architecture"]
	variables = response_dict[model_name]["variables"]
	hyperparameters = response_dict[model_name]["hyperparameters"]
	training_hyperparameters = response_dict[model_name]["training_hyperparameters"]
	model_type = response_dict[model_name]["model_type"]
	tasks.append(
	ModelTask(
	name=model_name,
	description=description,
	formulation=formulation,
	architecture=architecture,
	variables=variables,
	hyperparameters=hyperparameters,
	training_hyperparameters=training_hyperparameters,
	model_type=model_type,
	)
	)
	exp = QlibModelExperiment(tasks, hypothesis=hypothesis)
	exp.based_experiments = [t[0] for t in trace.hist if t[1]]
	return exp

Uh oh!

[bug?] shall we use specific_trace replacing trace for experiment_list? #1244

Description

Metadata

Metadata

Assignees

Labels

Type

Projects

Milestone

Relationships

Development

Issue actions