I'm using Azure ML jobs to run an experiment using python sdk-v2, and I haven't be able to access into the run logs after the run is completed. I'm not sure what is happening, if I'm missing some permission or a previous step. It just says "run 'xxxx' not found
from mlflow.tracking import MlflowClient
# Use MlFlow to retrieve the job that was just completed
run_id = 'musing_steelpan_xxxx'
finished_mlflow_run = MlflowClient().get_run(run_id)
. The run_id actually exist, I'm the owner of the worspace and cluster.
MlflowException Traceback (most recent call last)
Cell In [5], line 6
3 # Use MlFlow to retrieve the job that was just completed
4 run_id = 'musing_steelpan_hnlbhxf9qy'
----> 6 finished_mlflow_run = MlflowClient().get_run(run_id)
File /miniconda/envs/benchmark/lib/python3.8/site-packages/mlflow/tracking/client.py:150, in MlflowClient.get_run(self, run_id)
112 def get_run(self, run_id: str) -> Run:
113 """
114 Fetch the run from backend store. The resulting :py:class:`Run <mlflow.entities.Run>`
115 contains a collection of run metadata -- :py:class:`RunInfo <mlflow.entities.RunInfo>`,
(...)
148 status: FINISHED
149 """
--> 150 return self._tracking_client.get_run(run_id)
File /miniconda/envs/benchmark/lib/python3.8/site-packages/mlflow/tracking/_tracking_service/client.py:72, in TrackingServiceClient.get_run(self, run_id)
58 """
59 Fetch the run from backend store. The resulting :py:class:`Run <mlflow.entities.Run>`
60 contains a collection of run metadata -- :py:class:`RunInfo <mlflow.entities.RunInfo>`,
(...)
69 raises an exception.
70 """
71 _validate_run_id(run_id)
...
648 )
649 run_info = self._get_run_info_from_dir(run_dir)
650 if run_info.experiment_id != exp_id:
MlflowException: Run 'musing_steelpan_xxxx' not found