|
36 | 36 | "outputs": [], |
37 | 37 | "source": [ |
38 | 38 | "def setup_data_analysis_env(\n", |
39 | | - " query: str, dataset_folder: Path, language: NBLanguage = NBLanguage.PYTHON\n", |
| 39 | + " query: str, dataset: Path, language: NBLanguage = NBLanguage.PYTHON\n", |
40 | 40 | "):\n", |
41 | 41 | " # Hash the task to get a unique identifier\n", |
42 | 42 | " task_hash = hashlib.sha256(query.encode()).hexdigest()\n", |
|
46 | 46 | " trajectory_path.mkdir(parents=True, exist_ok=True)\n", |
47 | 47 | " nb_path = trajectory_path / NBEnvironment.NOTEBOOK_NAME\n", |
48 | 48 | " # Copy task data to trajectory path\n", |
49 | | - " for item in dataset_folder.iterdir():\n", |
50 | | - " if item.is_file():\n", |
51 | | - " shutil.copy2(item, trajectory_path)\n", |
52 | | - " elif item.is_dir():\n", |
53 | | - " shutil.copytree(item, trajectory_path / item.name, dirs_exist_ok=True)\n", |
| 49 | + " if dataset.is_dir():\n", |
| 50 | + " for item in dataset.iterdir():\n", |
| 51 | + " if item.is_file():\n", |
| 52 | + " shutil.copy2(item, trajectory_path)\n", |
| 53 | + " elif item.is_dir():\n", |
| 54 | + " shutil.copytree(item, trajectory_path / item.name, dirs_exist_ok=True)\n", |
| 55 | + " else:\n", |
| 56 | + " shutil.copy2(dataset, trajectory_path)\n", |
54 | 57 | " # Augment incoming task with CoT instructions\n", |
55 | 58 | " augmented_task = f\"\"\"\\\n", |
56 | 59 | " Here is the user query to address:\n", |
|
96 | 99 | "# This image includes many bioinformatics and data science packages\n", |
97 | 100 | "cfg.USE_DOCKER = False\n", |
98 | 101 | "# This can be R or PYTHON in Docker or with a local kernel if you have R installed\n", |
99 | | - "LANGUAGE = NBLanguage.R\n", |
| 102 | + "LANGUAGE = NBLanguage.PYTHON\n", |
100 | 103 | "MAX_STEPS = 3\n", |
101 | 104 | "MODEL_NAME = \"claude-3-7-sonnet-latest\"" |
102 | 105 | ] |
|
115 | 118 | "logger = logging.getLogger(__name__)\n", |
116 | 119 | "logger.info(\"Setting up data analysis environment\")\n", |
117 | 120 | "\n", |
118 | | - "dataset_folder = Path(\"dataset\")\n", |
| 121 | + "dataset = Path(\"datasets/brain_size_data.csv\")\n", |
119 | 122 | "query = \"Analyze the dataset and give me an in depth analysis using pretty plots. I am particularly interested in crows.\"\n", |
120 | | - "environment = setup_data_analysis_env(query, dataset_folder, LANGUAGE)\n", |
| 123 | + "environment = setup_data_analysis_env(query, dataset, LANGUAGE)\n", |
121 | 124 | "\n", |
122 | 125 | "agent = AgentConfig(\n", |
123 | 126 | " agent_type=\"ReActAgent\",\n", |
|
0 commit comments