I’ve created a Vertex AI Workbench instance and done some work on it: installed Python libraries, run my model training, etc. But after the second or third startup, the system gets stuck at “Provisioning”. This has now happened to me 3 times: each time I’ve set up a new workbench, and after a few startups it can no longer boot and gets stuck at “Provisioning”.
In the Health tab, the System Health Status says Unhealthy, but all of the other statuses show Healthy. I checked the logs, and the entry below is the only error I’ve found. However, I haven’t changed the configuration of the workbench since I started it, and the principal does have the Compute Admin (v1) and Compute Admin roles. So I don’t understand why this is breaking.
{
"protoPayload": {
"@type": "type.googleapis.com/google.cloud.audit.AuditLog",
"status": {
"code": 7,
"message": "Required 'Current principal doesn't have permission to mutate this resource!' permission for '[INSTANCE-NAME-REDACTED]'"
},
"authenticationInfo": {
"principalEmail": "-----------------------------@---------------com",
"serviceAccountDelegationInfo": [
{
"firstPartyPrincipal": {
"principalEmail": "service----------------@--------------com"
}
}
],
"principalSubject": "serviceAccount:------------------------------@---------------com"
},
"requestMetadata": {
"callerIp": "##.##.###.###",
"callerSuppliedUserAgent": "google-cloud-sdk gcloud/469.0.0 command/gcloud.compute.instances.remove-metadata invocation-id/####################### environment/GCE environment-version/None client-os/LINUX client-os-ver/5.10.0 client-pltf-arch/x86_64 interactive/False from-script/True python/3.11.8 term/ (Linux 5.10.0-28-cloud-amd64),gzip(gfe)",
"callerNetwork": "//############com/projects/-----------------------------/global/networks/__unknown__",
"requestAttributes": {
"time": "2024-04-11T21:21:11.897314Z",
"auth": {}
},
"destinationAttributes": {}
},
"serviceName": "############com",
"methodName": "v1.compute.instances.setMetadata",
"authorizationInfo": [
{
"resource": "projects/-----------------------------/zones/us-west1-a/instances/[INSTANCE-NAME-REDACTED]",
"permission": "compute.instances.setMetadata",
"granted": true,
"resourceAttributes": {
"service": "compute",
"name": "projects/-----------------------------/zones/us-west1-a/instances/[INSTANCE-NAME-REDACTED]",
"type": "compute.instances"
}
}
],
"resourceName": "projects/-----------------------------/zones/us-west1-a/instances/[INSTANCE-NAME-REDACTED]",
"request": {
"@type": "type.googleapis.com/compute.instances.setMetadata"
},
"response": {
"error": {
"errors": [
{
"domain": "global",
"reason": "forbidden",
"message": "Required 'Current principal doesn't have permission to mutate this resource!' permission for '[INSTANCE-NAME-REDACTED]'"
}
],
"code": 403,
"message": "Required 'Current principal doesn't have permission to mutate this resource!' permission for '[INSTANCE-NAME-REDACTED]'"
},
"@type": "##########com/error"
},
"resourceLocation": {
"currentLocations": [
"us-west1-a"
]
}
},
"insertId": "-###########",
"resource": {
"type": "gce_instance",
"labels": {
"instance_id": "##################",
"zone": "us-west1-a",
"project_id": "-----------------------------"
}
},
"timestamp": "2024-04-11T21:21:11.514971Z",
"severity": "ERROR",
"labels": {
"############com/root_trigger_id": "######################################"
},
"logName": "projects/-----------------------------/logs/############com%2Factivity",
"receiveTimestamp": "2024-04-11T21:21:12.788839353Z"
}