VOL-3557: OLT delete is causing the openolt adapter to panic sometimes - Do not update the core about OLT device connection and operation status on OLT delete - Immediately return if GetDevice call fails towards core in updateStateUnreachable routine Change-Id: I7f81d59ab9823c464c2066fb85b0d61c5a20749a

commit: b1caa44d8d1e7158265dfd449960f5986c9aab93 [log] [tgz]
author: Girish Gowdra <girish@opennetworking.org> Mon Oct 19 12:24:39 2020 -0700
committer: Girish Gowdra <girish@opennetworking.org> Mon Oct 19 12:37:01 2020 -0700
tree: f9d114ea33019a3f704d7a11d8e0bf40201f4320
parent: e8f473bb140acd45190fe6097f750140177519ac [diff]
diff --git a/internal/pkg/core/device_handler.go b/internal/pkg/core/device_handler.go
index 3be60ec..b87ca12 100644
--- a/internal/pkg/core/device_handler.go
+++ b/internal/pkg/core/device_handler.go

@@ -1657,15 +1657,10 @@
 			return olterrors.NewErrAdapter("olt-reboot-failed", log.Fields{"device-id": dh.device.Id}, err).Log()
 		}
 	}
-	cloned := proto.Clone(device).(*voltha.Device)
-	cloned.OperStatus = voltha.OperStatus_UNKNOWN
-	cloned.ConnectStatus = voltha.ConnectStatus_UNREACHABLE
-	if err := dh.coreProxy.DeviceStateUpdate(ctx, cloned.Id, cloned.ConnectStatus, cloned.OperStatus); err != nil {
-		return olterrors.NewErrAdapter("device-state-update-failed", log.Fields{
-			"device-id":      device.Id,
-			"connect-status": cloned.ConnectStatus,
-			"oper-status":    cloned.OperStatus}, err).Log()
-	}
+	// There is no need to update the core about operation status and connection status of the OLT.
+	// The OLT is getting deleted anyway and the core might have already cleared the OLT device from its DB.
+	// So any attempt to update the operation status and connection status of the OLT will result in core throwing an error back,
+	// because the device does not exist in DB.
 	return nil
 }
 func (dh *DeviceHandler) cleanupDeviceResources(ctx context.Context) {
@@ -1935,7 +1930,14 @@
 func (dh *DeviceHandler) updateStateUnreachable(ctx context.Context) {
 	device, err := dh.coreProxy.GetDevice(ctx, dh.device.Id, dh.device.Id)
 	if err != nil || device == nil {
+		// One case where we have seen core returning an error for GetDevice call is after OLT device delete.
+		// After OLT delete, the adapter asks for OLT to reboot. When OLT is rebooted, shortly we loose heartbeat.
+		// The 'startHeartbeatCheck' then asks the device to be marked unreachable towards the core, but the core
+		// has already deleted the device and returns error. In this particular scenario, it is Ok because any necessary
+		// cleanup in the adapter was already done during DeleteDevice API handler routine.
 		_ = olterrors.NewErrNotFound("device", log.Fields{"device-id": dh.device.Id}, err).Log()
+		// Immediately return, otherwise accessing a null 'device' struct would cause panic
+		return
 	}
 
 	if device.ConnectStatus == voltha.ConnectStatus_REACHABLE {
commit	b1caa44d8d1e7158265dfd449960f5986c9aab93	[log] [tgz]
author	Girish Gowdra <girish@opennetworking.org>	Mon Oct 19 12:24:39 2020 -0700
committer	Girish Gowdra <girish@opennetworking.org>	Mon Oct 19 12:37:01 2020 -0700
tree	f9d114ea33019a3f704d7a11d8e0bf40201f4320
parent	e8f473bb140acd45190fe6097f750140177519ac [diff]