fix(worker) : un dictionnaire de conf venant du client est passé à l'initial...
5f3160c2
hugo.roussaffa
committed
3 changed files
create_indicator.ipynb
/examples/create_indicator.ipynb-12+213
/examples/create_indicator.ipynb
Add comment 2 "cells": [
Add comment 3 {
Add comment 4 "cell_type": "code",
Add comment 5 Minus   "execution_count": null,
Add comment 5 Plus   "execution_count": 1,
Add comment 6 "metadata": {},
Add comment 7 "outputs": [],
Add comment 8 "source": [
Add comment 23 },
Add comment 24 {
Add comment 25 "cell_type": "code",
Add comment 26 Minus   "execution_count": null,
Add comment 26 Plus   "execution_count": 2,
Add comment 27 "metadata": {},
Add comment 28 "outputs": [],
Add comment 29 "source": [
Add comment 72 },
Add comment 73 {
Add comment 74 "cell_type": "code",
Add comment 75 Minus   "execution_count": null,
Add comment 75 Plus   "execution_count": 3,
Add comment 76 "metadata": {},
Add comment 77 "outputs": [],
Add comment 78 "source": [
Add comment 96 },
Add comment 97 {
Add comment 98 "cell_type": "code",
Add comment 99 Minus   "execution_count": null,
Add comment 99 Plus   "execution_count": 4,
Add comment 100 "metadata": {},
Add comment 101 Minus   "outputs": [],
Add comment 101 Plus   "outputs": [
Add comment 102 Plus   {
Add comment 103 Plus   "name": "stderr",
Add comment 104 Plus   "output_type": "stream",
Add comment 105 Plus   "text": [
Add comment 106 Plus   "20/02/2024 17:38:00 - INFO - Config - Settings Imported\n",
Add comment 107 Plus   "20/02/2024 17:38:00 - WARNING - The following variables are null: commun_path, project_dir, data_catalog_dir, data_output_dir, sig_data_path, project_db_schema\n",
Add comment 108 Plus   "20/02/2024 17:38:01 - INFO - Utils - Connection Imported\n",
Add comment 109 Plus   "20/02/2024 17:38:01 - INFO - Utils - Dataframe Imported\n",
Add comment 110 Plus   "20/02/2024 17:38:01 - INFO - Utils - Geometry Imported\n",
Add comment 111 Plus   "20/02/2024 17:38:01 - DEBUG - Could not import boto3, continuing with reduced functionality.\n",
Add comment 112 Plus   "20/02/2024 17:38:01 - INFO - Utils - Raster Imported\n",
Add comment 113 Plus   "20/02/2024 17:38:02 - DEBUG - Could not import boto3, continuing with reduced functionality.\n",
Add comment 114 Plus   "20/02/2024 17:38:02 - DEBUG - GDAL_DATA found in environment.\n",
Add comment 115 Plus   "20/02/2024 17:38:02 - DEBUG - PROJ_DATA found in environment.\n",
Add comment 116 Plus   "20/02/2024 17:38:02 - INFO - GeoIndicator - Gee Imported\n",
Add comment 117 Plus   "20/02/2024 17:38:02 - INFO - Utils - Interpolation Imported\n",
Add comment 118 Plus   "20/02/2024 17:38:02 - INFO - GeoIndicator - Distribution Imported\n",
Add comment 119 Plus   "20/02/2024 17:38:02 - INFO - GeoIndicator - Raster Imported\n",
Add comment 120 Plus   "20/02/2024 17:38:02 - INFO - GeoIndicator - Calculation Imported\n"
Add comment 121 Plus   ]
Add comment 122 Plus   }
Add comment 123 Plus   ],
Add comment 102 124 "source": [
Add comment 103 125 "%load_ext autoreload\n",
Add comment 104 126 "%autoreload 2\n",
Add comment 114 136 },
Add comment 115 137 {
Add comment 116 138 "cell_type": "code",
Add comment 117 Minus   "execution_count": null,
Add comment 139 Plus   "execution_count": 5,
Add comment 118 140 "metadata": {},
Add comment 119 Minus   "outputs": [],
Add comment 141 Plus   "outputs": [
Add comment 142 Plus   {
Add comment 143 Plus   "data": {
Add comment 144 Plus   "text/html": [
Add comment 145 Plus   "\n",
Add comment 146 Plus   " <style>\n",
Add comment 147 Plus   " .geemap-dark {\n",
Add comment 148 Plus   " --jp-widgets-color: white;\n",
Add comment 149 Plus   " --jp-widgets-label-color: white;\n",
Add comment 150 Plus   " --jp-ui-font-color1: white;\n",
Add comment 151 Plus   " --jp-layout-color2: #454545;\n",
Add comment 152 Plus   " background-color: #383838;\n",
Add comment 153 Plus   " }\n",
Add comment 154 Plus   " \n",
Add comment 155 Plus   " .geemap-dark .jupyter-button {\n",
Add comment 156 Plus   " --jp-layout-color3: #383838;\n",
Add comment 157 Plus   " }\n",
Add comment 158 Plus   " \n",
Add comment 159 Plus   " .geemap-colab {\n",
Add comment 160 Plus   " background-color: var(--colab-primary-surface-color, white);\n",
Add comment 161 Plus   " }\n",
Add comment 162 Plus   " \n",
Add comment 163 Plus   " .geemap-colab .jupyter-button {\n",
Add comment 164 Plus   " --jp-layout-color3: var(--colab-primary-surface-color, white);\n",
Add comment 165 Plus   " }\n",
Add comment 166 Plus   " </style>\n",
Add comment 167 Plus   " "
Add comment 168 Plus   ],
Add comment 169 Plus   "text/plain": [
Add comment 170 Plus   "<IPython.core.display.HTML object>"
Add comment 171 Plus   ]
Add comment 172 Plus   },
Add comment 173 Plus   "metadata": {},
Add comment 174 Plus   "output_type": "display_data"
Add comment 175 Plus   },
Add comment 176 Plus   {
Add comment 177 Plus   "name": "stderr",
Add comment 178 Plus   "output_type": "stream",
Add comment 179 Plus   "text": [
Add comment 180 Plus   "20/02/2024 17:38:02 - WARNING - La variable d'environnement SCHEDULER_IP doit être renseignée pour effectuer les traitements de manière distribuée\n",
Add comment 181 Plus   "20/02/2024 17:38:02 - INFO - on applique cette ip par défaut : 172.20.12.13:9786\n",
Add comment 182 Plus   "20/02/2024 17:38:02 - DEBUG - Using selector: EpollSelector\n"
Add comment 183 Plus   ]
Add comment 184 Plus   },
Add comment 185 Plus   {
Add comment 186 Plus   "data": {
Add comment 187 Plus   "text/plain": [
Add comment 188 Plus   "{'tcp://172.20.10.112:40691': None}"
Add comment 189 Plus   ]
Add comment 190 Plus   },
Add comment 191 Plus   "execution_count": 5,
Add comment 192 Plus   "metadata": {},
Add comment 193 Plus   "output_type": "execute_result"
Add comment 194 Plus   }
Add comment 195 Plus   ],
Add comment 120 196 "source": [
Add comment 121 197 "client = settings.getDaskClient()\n",
Add comment 198 Plus   "config = settings.initializeBilboProject(dotenvPath='.dev_env')\n",
Add comment 199 Plus   "client.run(settings.initializeWorkers, config)\n",
Add comment 122 200 "\n",
Add comment 123 Minus   "client.run(settings.initializeWorkers)\n",
Add comment 124 201 "\n",
Add comment 125 Minus   "config = settings.initializeBilboProject(dotenvPath='.dev_env')\n",
Add comment 126 Minus   "config"
Add comment 202 Plus   "\n"
Add comment 127 203 ]
Add comment 128 204 },
Add comment 129 205 {
Add comment 130 206 "cell_type": "code",
Add comment 131 Minus   "execution_count": null,
Add comment 207 Plus   "execution_count": 6,
Add comment 208 Plus   "metadata": {},
Add comment 209 Plus   "outputs": [
Add comment 210 Plus   {
Add comment 211 Plus   "data": {
Add comment 212 Plus   "text/html": [
Add comment 213 Plus   "\n",
Add comment 214 Plus   " <style>\n",
Add comment 215 Plus   " .geemap-dark {\n",
Add comment 216 Plus   " --jp-widgets-color: white;\n",
Add comment 217 Plus   " --jp-widgets-label-color: white;\n",
Add comment 218 Plus   " --jp-ui-font-color1: white;\n",
Add comment 219 Plus   " --jp-layout-color2: #454545;\n",
Add comment 220 Plus   " background-color: #383838;\n",
Add comment 221 Plus   " }\n",
Add comment 222 Plus   " \n",
Add comment 223 Plus   " .geemap-dark .jupyter-button {\n",
Add comment 224 Plus   " --jp-layout-color3: #383838;\n",
Add comment 225 Plus   " }\n",
Add comment 226 Plus   " \n",
Add comment 227 Plus   " .geemap-colab {\n",
Add comment 228 Plus   " background-color: var(--colab-primary-surface-color, white);\n",
Add comment 229 Plus   " }\n",
Add comment 230 Plus   " \n",
Add comment 231 Plus   " .geemap-colab .jupyter-button {\n",
Add comment 232 Plus   " --jp-layout-color3: var(--colab-primary-surface-color, white);\n",
Add comment 233 Plus   " }\n",
Add comment 234 Plus   " </style>\n",
Add comment 235 Plus   " "
Add comment 236 Plus   ],
Add comment 237 Plus   "text/plain": [
Add comment 238 Plus   "<IPython.core.display.HTML object>"
Add comment 239 Plus   ]
Add comment 240 Plus   },
Add comment 132 241 "metadata": {},
Add comment 133 Minus   "outputs": [],
Add comment 242 Plus   "output_type": "display_data"
Add comment 243 Plus   },
Add comment 244 Plus   {
Add comment 245 Plus   "name": "stderr",
Add comment 246 Plus   "output_type": "stream",
Add comment 247 Plus   "text": [
Add comment 248 Plus   "20/02/2024 17:38:07 - DEBUG - open file: /media/commun/commun/Informatique/SIG/Application/Jupyterhub/projets/catalogFiles/DWH_Dimensions.yaml\n",
Add comment 249 Plus   "20/02/2024 17:38:07 - INFO - step list : {steplist}\n",
Add comment 250 Plus   "20/02/2024 17:38:07 - INFO - Initial offset : 0 , limit : 10000\n",
Add comment 251 Plus   "20/02/2024 17:38:07 - INFO - Id Spatial qui seront calculés : ['0', 'C', 'F', 'G', 'B', 'D', 'A', 'E', '1', '2', '3', '98827', '98817', '98813', '98826', '98819', '98816', '98828', '98824', '98832', '98821', '98831', '98818', '98804', '98822', '98814', '98815', '98806', '98809', '98820', '98811', '98807', '98805', '98803', '98823', '98810', '98812', '98833', '98808', '98825', '98801', '98830', '98802', '98829']\n",
Add comment 252 Plus   "20/02/2024 17:38:07 - INFO - individu: H3_6_NC\n",
Add comment 253 Plus   "20/02/2024 17:38:07 - INFO - indicateur: KBA\n",
Add comment 254 Plus   "20/02/2024 17:38:07 - INFO - le nom de la table de faits en base de donnée en sortie de traitement répond au pré-requis : faits_kba_h3_nc_6\n",
Add comment 255 Plus   "20/02/2024 17:38:07 - INFO - nbchuncks: 300\n",
Add comment 256 Plus   "20/02/2024 17:38:07 - DEBUG - open file: /home/hugo/projets/bilbo-packages/examples/../test_catalog_file/h3.yaml\n",
Add comment 257 Plus   "20/02/2024 17:38:07 - INFO - {'sources': {'compte_entites': {'driver': 'sql', 'metadata': {}, 'args': {'uri': 'postgresql://{{env(\"DB_USER\")}}:{{env(\"DB_PWD\")}}@{{env(\"DB_HOST\")}}:{{env(\"DB_PORT\")}}/oeil_traitement', 'sql_expr': 'SELECT COUNT(*) as nb FROM bilbo.h3_nc_6;'}, 'description': 'Compter le nombre d’entités sans charger les géométries'}}}\n",
Add comment 258 Plus   "20/02/2024 17:38:07 - DEBUG - open file: /home/hugo/projets/bilbo-packages/examples/tmp.yaml\n",
Add comment 259 Plus   "20/02/2024 17:38:07 - INFO - bilbo.h3_nc_6 nblignes : 759\n",
Add comment 260 Plus   "20/02/2024 17:38:07 - INFO - sql_pagination : order by hex_id limit 10000 offset 0\n",
Add comment 261 Plus   "20/02/2024 17:38:07 - INFO - Settings - getPaths data_config_file ../test_catalog_file/config/ \n",
Add comment 262 Plus   "20/02/2024 17:38:07 - DEBUG - Settings - getPaths - config {'commun_path': '/media/commun/commun/', 'project_dir': '/media/commun/commun/Informatique/SIG/Application/Jupyterhub/projets/stac/', 'data_catalog_dir': '../test_catalog_file/', 'data_output_dir': '../target/', 'sig_data_path': '/media/commun/commun/Informatique/SIG/Donnees/', 'project_db_schema': 'bilbo', 'data_config_file': '../test_catalog_file/config/', 'dimension_catalog_dir': '/media/commun/commun/Informatique/SIG/Application/Jupyterhub/projets/catalogFiles/'}\n",
Add comment 263 Plus   "20/02/2024 17:38:07 - INFO - create_indicator: Etape 1\n",
Add comment 264 Plus   "20/02/2024 17:38:07 - DEBUG - open file: /home/hugo/projets/bilbo-packages/examples/../test_catalog_file/h3.yaml\n",
Add comment 265 Plus   "20/02/2024 17:38:07 - INFO - create_indicator: Etape 1 sans bbox\n",
Add comment 266 Plus   "20/02/2024 17:38:07 - INFO - create_indicator: Etape 1 --> indicateurSpec.get('catalogUri') and indicateurSpec.get('dataName') is not None\n",
Add comment 267 Plus   "20/02/2024 17:38:07 - INFO - create_indicator: Etape 1 --> sourceType : None\n",
Add comment 268 Plus   "20/02/2024 17:38:07 - INFO - source Type OTHER : ex . VECTOR \n",
Add comment 269 Plus   "20/02/2024 17:38:07 - DEBUG - open file: /home/hugo/projets/bilbo-packages/examples/../test_catalog_file/data_reference.yaml\n",
Add comment 270 Plus   "20/02/2024 17:38:07 - INFO - Calculation ...\n",
Add comment 271 Plus   "20/02/2024 17:38:07 - INFO - with Dask - metaModelList : ' ['hex_id', 'kba', 'geometry', 'id_split']\n",
Add comment 272 Plus   "20/02/2024 17:38:07 - INFO - reading intake source sources:\n",
Add comment 273 Plus   " h3_nc_6:\n",
Add comment 274 Plus   " args:\n",
Add comment 275 Plus   " geopandas_kwargs:\n",
Add comment 276 Plus   " crs: 3163\n",
Add comment 277 Plus   " geom_col: geometry\n",
Add comment 278 Plus   " sql_expr: select hex_id, geometry from bilbo.h3_nc_6 order by hex_id limit\n",
Add comment 279 Plus   " 10000 offset 0\n",
Add comment 280 Plus   " table: bilbo.h3_nc_6\n",
Add comment 281 Plus   " uri: postgresql://hroussaffa:mcot@172.20.12.13:5432/oeil_traitement\n",
Add comment 282 Plus   " description: \"Maille H3 niveau 6 sur les terres emerg\\xE9es de NC\"\n",
Add comment 283 Plus   " driver: intake_geopandas.geopandas.PostGISSource\n",
Add comment 284 Plus   " metadata:\n",
Add comment 285 Plus   " catalog_dir: /home/hugo/projets/bilbo-packages/examples/../test_catalog_file/\n",
Add comment 286 Plus   "...\n"
Add comment 287 Plus   ]
Add comment 288 Plus   },
Add comment 289 Plus   {
Add comment 290 Plus   "name": "stdout",
Add comment 291 Plus   "output_type": "stream",
Add comment 292 Plus   "text": [
Add comment 293 Plus   "sources:\n",
Add comment 294 Plus   " h3_nc_6:\n",
Add comment 295 Plus   " args:\n",
Add comment 296 Plus   " geopandas_kwargs:\n",
Add comment 297 Plus   " crs: 3163\n",
Add comment 298 Plus   " geom_col: geometry\n",
Add comment 299 Plus   " sql_expr: select hex_id, geometry from bilbo.h3_nc_6\n",
Add comment 300 Plus   " table: bilbo.h3_nc_6\n",
Add comment 301 Plus   " uri: postgresql://hroussaffa:mcot@172.20.12.13:5432/oeil_traitement\n",
Add comment 302 Plus   " description: \"Maille H3 niveau 6 sur les terres emerg\\xE9es de NC\"\n",
Add comment 303 Plus   " driver: intake_geopandas.geopandas.PostGISSource\n",
Add comment 304 Plus   " metadata:\n",
Add comment 305 Plus   " catalog_dir: /home/hugo/projets/bilbo-packages/examples/../test_catalog_file/\n",
Add comment 306 Plus   "\n"
Add comment 307 Plus   ]
Add comment 308 Plus   },
Add comment 309 Plus   {
Add comment 310 Plus   "name": "stderr",
Add comment 311 Plus   "output_type": "stream",
Add comment 312 Plus   "text": [
Add comment 313 Plus   "20/02/2024 17:38:07 - DEBUG - df: 759\n",
Add comment 314 Plus   "20/02/2024 17:38:07 - DEBUG - metaModelList ['hex_id', 'kba', 'geometry', 'id_split']\n",
Add comment 315 Plus   "20/02/2024 17:38:07 - DEBUG - Load data in memory (759, 2)\n",
Add comment 316 Plus   "20/02/2024 17:38:07 - DEBUG - converting to dask with chunksize 300\n",
Add comment 317 Plus   "20/02/2024 17:38:08 - DEBUG - PROJ_ERROR: proj_create: unrecognized format / unknown name\n",
Add comment 318 Plus   "20/02/2024 17:38:08 - DEBUG - data : Dask GeoDataFrame Structure:\n",
Add comment 319 Plus   " hex_id geometry\n",
Add comment 320 Plus   "npartitions=300 \n",
Add comment 321 Plus   "0 string geometry\n",
Add comment 322 Plus   "3 ... ...\n",
Add comment 323 Plus   "... ... ...\n",
Add comment 324 Plus   "757 ... ...\n",
Add comment 325 Plus   "758 ... ...\n",
Add comment 326 Plus   "Dask Name: to_pyarrow_string, 2 graph layers\n",
Add comment 327 Plus   "20/02/2024 17:38:08 - DEBUG - func : <function generateIndicateur_parallel_v2 at 0x7f58ac352ca0>\n",
Add comment 328 Plus   "20/02/2024 17:38:08 - INFO - Etape 1 - Result: <class 'dask_geopandas.core.GeoDataFrame'>\n",
Add comment 329 Plus   "20/02/2024 17:38:08 - INFO - create_indicator: Etape 2\n",
Add comment 330 Plus   "20/02/2024 17:38:08 - INFO - indexListIndicator None\n",
Add comment 331 Plus   "20/02/2024 17:38:08 - INFO - create_indicator: Etape 2 --> pas de indexListIndicator\n"
Add comment 332 Plus   ]
Add comment 333 Plus   }
Add comment 334 Plus   ],
Add comment 134 335 "source": [
Add comment 135 336 "%%time\n",
Add comment 136 337 "\n",
settings.py
/oeilnc_config/settings.py-46+21
/oeilnc_config/settings.py
Add comment 47 if null_variables:
Add comment 48 logging.warning("The following variables are null: {}".format(", ".join(null_variables)))
Add comment 49
Add comment 50 Minus  def initializeWorkers(dotenvPath='.env'):
Add comment 50 Plus  def initializeWorkers(config_dict: dict):
Add comment 51
Add comment 52 Minus  
Add comment 53 Minus  
Add comment 54 Minus   load_dotenv(dotenv_path=dotenvPath)
Add comment 55 Minus  
Add comment 56 52 global commun_path
Add comment 57 53 global data_catalog_dir
Add comment 58 54 global project_dir
Add comment 65 61 global pswd
Add comment 66 62 global host
Add comment 67 63 global port
Add comment 64 Plus   global home
Add comment 65 Plus   global db_traitement
Add comment 66 Plus   global db_ref
Add comment 67 Plus   global db_externe
Add comment 68
Add comment 69 Minus   commun_path = getenv("COMMUN_PATH")
Add comment 70 Minus   project_dir = getenv("PROJECT_PATH")
Add comment 71 Minus   data_catalog_dir = getenv("DATA_CATALOG_DIR")
Add comment 72 Minus   data_output_dir = getenv("DATA_OUTPUT_DIR")
Add comment 73 Minus   sig_data_path = getenv("SIG_DATA_PATH")
Add comment 74 Minus   project_db_schema = getenv("PROJECT_DB_SCHEMA")
Add comment 75 Minus   data_config_file = getenv("DATA_CONFIG_DIR")
Add comment 76 Minus   dimension_catalog_dir = getenv("DIM_CATALOG_DIR")
Add comment 77 Minus  
Add comment 78 Minus  
Add comment 79 Minus   user = getenv("DB_USER")
Add comment 80 Minus   pswd = getenv("DB_PWD")
Add comment 81 Minus   host = getenv("DB_HOST")
Add comment 82 Minus   port = getenv("DB_PORT")
Add comment 83 Minus  
Add comment 84 Minus   home = getenv("HOME_PATH")
Add comment 85 Minus   db_traitement = getenv("DB_WORKSPACE")
Add comment 86 Minus   db_ref = getenv("DB_REF")
Add comment 87 Minus   db_externe = getenv("DB_EXT")
Add comment 88 Minus  
Add comment 89 Minus  
Add comment 90 Minus   config_dict = {
Add comment 91 Minus   "user": user,
Add comment 92 Minus   "pswd": pswd,
Add comment 93 Minus   "host": host,
Add comment 94 Minus   "port": port,
Add comment 95 Minus   "home": home,
Add comment 96 Minus   "db_traitement": db_traitement,
Add comment 97 Minus   "db_ref": db_ref,
Add comment 98 Minus   "db_externe": db_externe,
Add comment 99 Minus   "commun_path": commun_path,
Add comment 100 Minus   "project_dir": project_dir,
Add comment 101 Minus   "data_catalog_dir": data_catalog_dir,
Add comment 102 Minus   "data_output_dir": data_output_dir,
Add comment 103 Minus   "sig_data_path": sig_data_path,
Add comment 104 Minus   "project_db_schema": project_db_schema,
Add comment 105 Minus   "data_config_file": data_config_file,
Add comment 106 Minus   "dimension_catalog_dir": dimension_catalog_dir
Add comment 107 Minus   }
Add comment 108 Minus  
Add comment 109 Minus   logging.debug(f'Workers Settings - getPaths - config {config_dict}')
Add comment 69 Plus   user = config_dict.get("user")
Add comment 70 Plus   pswd = config_dict.get("pswd")
Add comment 71 Plus   host = config_dict.get("host")
Add comment 72 Plus   port = config_dict.get("port")
Add comment 73 Plus   home = config_dict.get("home")
Add comment 74 Plus   db_traitement = config_dict.get("db_traitement")
Add comment 75 Plus   db_ref = config_dict.get("db_ref")
Add comment 76 Plus   db_externe = config_dict.get("db_externe")
Add comment 77 Plus   commun_path = config_dict.get("commun_path")
Add comment 78 Plus   project_dir = config_dict.get("project_dir")
Add comment 79 Plus   data_catalog_dir = config_dict.get("data_catalog_dir")
Add comment 80 Plus   data_output_dir = config_dict.get("data_output_dir")
Add comment 81 Plus   sig_data_path = config_dict.get("sig_data_path")
Add comment 82 Plus   project_db_schema = config_dict.get("project_db_schema")
Add comment 83 Plus   data_config_file = config_dict.get("data_config_file")
Add comment 84 Plus   dimension_catalog_dir = config_dict.get("dimension_catalog_dir")
Add comment 110 85
Add comment 111 86 return
Add comment 112 87
H3_6_NC.yaml
/test_catalog_file/config/H3_6_NC.yaml-2+2
/test_catalog_file/config/H3_6_NC.yaml
Add comment 22 dataName: h3_nc_6
Add comment 23 indexRef: hex_id
Add comment 24 nbchuncks: 300
Add comment 25 Minus  limit: 100
Add comment 26 Minus  offset: 600
Add comment 25 Plus  limit: 10000
Add comment 26 Plus  offset: 0
Add comment 27 epsg: EPSG:3163
Add comment 28 overlayHow: intersection
Add comment 29