• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

kubeovn / kube-ovn / 18705377874

22 Oct 2025 04:28AM UTC coverage: 21.149% (-0.009%) from 21.158%
18705377874

push

github

web-flow
fix: prevent GC from deleting KubeVirt VM interfaces (#5814)

The garbage collector introduced in PR #5789 incorrectly identifies
KubeVirt VM interfaces as 'lost' and deletes them, breaking network
connectivity for VMs within ~60 seconds of creation.

Root cause: For KubeVirt VMs, the pod_name in OVS external_ids is set
to the VM name (e.g., 'ubuntu-vm-br'), not the launcher pod name
(e.g., 'virt-launcher-ubuntu-vm-br-xyz'). When gcInterfaces() tries
to look up the pod by the VM name, it fails and incorrectly deletes
the interface.

Solution: When a pod is not found by direct lookup, check if it might
be a KubeVirt VM by searching for launcher pods with the label
'vm.kubevirt.io/name' matching the pod_name from OVS. If a matching
launcher pod exists, keep the interface instead of deleting it.

This fix maintains backward compatibility with non-KubeVirt pods
while preventing false-positive deletions for KubeVirt VMs.

Signed-off-by: dnugmanov <damir_nug@mail.ru>

0 of 17 new or added lines in 1 file covered. (0.0%)

3 existing lines in 2 files now uncovered.

10735 of 50758 relevant lines covered (21.15%)

0.25 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

0.0
/pkg/daemon/controller.go
1
package daemon
2

3
import (
4
        "bytes"
5
        "context"
6
        "fmt"
7
        "maps"
8
        "os/exec"
9
        "slices"
10
        "strconv"
11
        "strings"
12
        "time"
13

14
        nadutils "github.com/k8snetworkplumbingwg/network-attachment-definition-client/pkg/utils"
15
        "github.com/scylladb/go-set/strset"
16
        v1 "k8s.io/api/core/v1"
17
        k8serrors "k8s.io/apimachinery/pkg/api/errors"
18
        metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
19
        "k8s.io/apimachinery/pkg/labels"
20
        utilruntime "k8s.io/apimachinery/pkg/util/runtime"
21
        "k8s.io/apimachinery/pkg/util/wait"
22
        "k8s.io/client-go/informers"
23
        "k8s.io/client-go/kubernetes/scheme"
24
        typedcorev1 "k8s.io/client-go/kubernetes/typed/core/v1"
25
        listerv1 "k8s.io/client-go/listers/core/v1"
26
        "k8s.io/client-go/tools/cache"
27
        "k8s.io/client-go/tools/record"
28
        "k8s.io/client-go/util/workqueue"
29
        "k8s.io/klog/v2"
30
        k8sexec "k8s.io/utils/exec"
31

32
        kubeovnv1 "github.com/kubeovn/kube-ovn/pkg/apis/kubeovn/v1"
33
        kubeovninformer "github.com/kubeovn/kube-ovn/pkg/client/informers/externalversions"
34
        kubeovnlister "github.com/kubeovn/kube-ovn/pkg/client/listers/kubeovn/v1"
35
        "github.com/kubeovn/kube-ovn/pkg/ovs"
36
        "github.com/kubeovn/kube-ovn/pkg/util"
37
)
38

39
// Controller watch pod and namespace changes to update iptables, ipset and ovs qos
40
type Controller struct {
41
        config *Configuration
42

43
        providerNetworksLister          kubeovnlister.ProviderNetworkLister
44
        providerNetworksSynced          cache.InformerSynced
45
        addOrUpdateProviderNetworkQueue workqueue.TypedRateLimitingInterface[string]
46
        deleteProviderNetworkQueue      workqueue.TypedRateLimitingInterface[*kubeovnv1.ProviderNetwork]
47

48
        vlansLister kubeovnlister.VlanLister
49
        vlansSynced cache.InformerSynced
50

51
        subnetsLister kubeovnlister.SubnetLister
52
        subnetsSynced cache.InformerSynced
53
        subnetQueue   workqueue.TypedRateLimitingInterface[*subnetEvent]
54

55
        ovnEipsLister kubeovnlister.OvnEipLister
56
        ovnEipsSynced cache.InformerSynced
57

58
        podsLister     listerv1.PodLister
59
        podsSynced     cache.InformerSynced
60
        updatePodQueue workqueue.TypedRateLimitingInterface[string]
61
        deletePodQueue workqueue.TypedRateLimitingInterface[*podEvent]
62

63
        nodesLister listerv1.NodeLister
64
        nodesSynced cache.InformerSynced
65

66
        servicesLister listerv1.ServiceLister
67
        servicesSynced cache.InformerSynced
68
        serviceQueue   workqueue.TypedRateLimitingInterface[*serviceEvent]
69

70
        caSecretLister listerv1.SecretLister
71
        caSecretSynced cache.InformerSynced
72
        ipsecQueue     workqueue.TypedRateLimitingInterface[string]
73

74
        recorder record.EventRecorder
75

76
        protocol string
77

78
        ControllerRuntime
79
        localPodName   string
80
        localNamespace string
81

82
        k8sExec k8sexec.Interface
83
}
84

85
func newTypedRateLimitingQueue[T comparable](name string, rateLimiter workqueue.TypedRateLimiter[T]) workqueue.TypedRateLimitingInterface[T] {
×
86
        if rateLimiter == nil {
×
87
                rateLimiter = workqueue.DefaultTypedControllerRateLimiter[T]()
×
88
        }
×
89
        return workqueue.NewTypedRateLimitingQueueWithConfig(rateLimiter, workqueue.TypedRateLimitingQueueConfig[T]{Name: name})
×
90
}
91

92
// NewController init a daemon controller
93
func NewController(config *Configuration,
94
        stopCh <-chan struct{},
95
        podInformerFactory, nodeInformerFactory, caSecretInformerFactory informers.SharedInformerFactory,
96
        kubeovnInformerFactory kubeovninformer.SharedInformerFactory,
97
) (*Controller, error) {
×
98
        eventBroadcaster := record.NewBroadcaster()
×
99
        eventBroadcaster.StartLogging(klog.Infof)
×
100
        eventBroadcaster.StartRecordingToSink(&typedcorev1.EventSinkImpl{Interface: config.KubeClient.CoreV1().Events(v1.NamespaceAll)})
×
101
        recorder := eventBroadcaster.NewRecorder(scheme.Scheme, v1.EventSource{Component: config.NodeName})
×
102
        providerNetworkInformer := kubeovnInformerFactory.Kubeovn().V1().ProviderNetworks()
×
103
        vlanInformer := kubeovnInformerFactory.Kubeovn().V1().Vlans()
×
104
        subnetInformer := kubeovnInformerFactory.Kubeovn().V1().Subnets()
×
105
        ovnEipInformer := kubeovnInformerFactory.Kubeovn().V1().OvnEips()
×
106
        podInformer := podInformerFactory.Core().V1().Pods()
×
107
        nodeInformer := nodeInformerFactory.Core().V1().Nodes()
×
108
        servicesInformer := nodeInformerFactory.Core().V1().Services()
×
109
        caSecretInformer := caSecretInformerFactory.Core().V1().Secrets()
×
110

×
111
        controller := &Controller{
×
112
                config: config,
×
113

×
114
                providerNetworksLister:          providerNetworkInformer.Lister(),
×
115
                providerNetworksSynced:          providerNetworkInformer.Informer().HasSynced,
×
116
                addOrUpdateProviderNetworkQueue: newTypedRateLimitingQueue[string]("AddOrUpdateProviderNetwork", nil),
×
117
                deleteProviderNetworkQueue:      newTypedRateLimitingQueue[*kubeovnv1.ProviderNetwork]("DeleteProviderNetwork", nil),
×
118

×
119
                vlansLister: vlanInformer.Lister(),
×
120
                vlansSynced: vlanInformer.Informer().HasSynced,
×
121

×
122
                subnetsLister: subnetInformer.Lister(),
×
123
                subnetsSynced: subnetInformer.Informer().HasSynced,
×
124
                subnetQueue:   newTypedRateLimitingQueue[*subnetEvent]("Subnet", nil),
×
125

×
126
                ovnEipsLister: ovnEipInformer.Lister(),
×
127
                ovnEipsSynced: ovnEipInformer.Informer().HasSynced,
×
128

×
129
                podsLister:     podInformer.Lister(),
×
130
                podsSynced:     podInformer.Informer().HasSynced,
×
131
                updatePodQueue: newTypedRateLimitingQueue[string]("UpdatePod", nil),
×
132
                deletePodQueue: newTypedRateLimitingQueue[*podEvent]("DeletePod", nil),
×
133

×
134
                nodesLister: nodeInformer.Lister(),
×
135
                nodesSynced: nodeInformer.Informer().HasSynced,
×
136

×
137
                servicesLister: servicesInformer.Lister(),
×
138
                servicesSynced: servicesInformer.Informer().HasSynced,
×
139
                serviceQueue:   newTypedRateLimitingQueue[*serviceEvent]("Service", nil),
×
140

×
141
                caSecretLister: caSecretInformer.Lister(),
×
142
                caSecretSynced: caSecretInformer.Informer().HasSynced,
×
143
                ipsecQueue:     newTypedRateLimitingQueue[string]("IPSecCA", nil),
×
144

×
145
                recorder: recorder,
×
146
                k8sExec:  k8sexec.New(),
×
147
        }
×
148

×
149
        node, err := config.KubeClient.CoreV1().Nodes().Get(context.Background(), config.NodeName, metav1.GetOptions{})
×
150
        if err != nil {
×
151
                util.LogFatalAndExit(err, "failed to get node %s info", config.NodeName)
×
152
        }
×
153
        controller.protocol = util.CheckProtocol(node.Annotations[util.IPAddressAnnotation])
×
154

×
155
        if err = controller.initRuntime(); err != nil {
×
156
                return nil, err
×
157
        }
×
158

159
        podInformerFactory.Start(stopCh)
×
160
        nodeInformerFactory.Start(stopCh)
×
161
        kubeovnInformerFactory.Start(stopCh)
×
162
        caSecretInformerFactory.Start(stopCh)
×
163

×
164
        if !cache.WaitForCacheSync(stopCh,
×
165
                controller.providerNetworksSynced, controller.vlansSynced, controller.subnetsSynced,
×
166
                controller.podsSynced, controller.nodesSynced, controller.servicesSynced, controller.caSecretSynced) {
×
167
                util.LogFatalAndExit(nil, "failed to wait for caches to sync")
×
168
        }
×
169

170
        if _, err = providerNetworkInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
171
                AddFunc:    controller.enqueueAddProviderNetwork,
×
172
                UpdateFunc: controller.enqueueUpdateProviderNetwork,
×
173
                DeleteFunc: controller.enqueueDeleteProviderNetwork,
×
174
        }); err != nil {
×
175
                return nil, err
×
176
        }
×
177
        if _, err = vlanInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
178
                UpdateFunc: controller.enqueueUpdateVlan,
×
179
        }); err != nil {
×
180
                return nil, err
×
181
        }
×
182
        if _, err = subnetInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
183
                AddFunc:    controller.enqueueAddSubnet,
×
184
                UpdateFunc: controller.enqueueUpdateSubnet,
×
185
                DeleteFunc: controller.enqueueDeleteSubnet,
×
186
        }); err != nil {
×
187
                return nil, err
×
188
        }
×
189
        if _, err = servicesInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
190
                AddFunc:    controller.enqueueAddService,
×
191
                DeleteFunc: controller.enqueueDeleteService,
×
192
                UpdateFunc: controller.enqueueUpdateService,
×
193
        }); err != nil {
×
194
                util.LogFatalAndExit(err, "failed to add service event handler")
×
195
        }
×
196

197
        if _, err = podInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
198
                UpdateFunc: controller.enqueueUpdatePod,
×
199
                DeleteFunc: controller.enqueueDeletePod,
×
200
        }); err != nil {
×
201
                return nil, err
×
202
        }
×
203
        if _, err = caSecretInformer.Informer().AddEventHandler(cache.ResourceEventHandlerFuncs{
×
204
                AddFunc:    controller.enqueueAddIPSecCA,
×
205
                UpdateFunc: controller.enqueueUpdateIPSecCA,
×
206
        }); err != nil {
×
207
                return nil, err
×
208
        }
×
209

210
        return controller, nil
×
211
}
212

213
func (c *Controller) enqueueAddIPSecCA(obj any) {
×
214
        key := cache.MetaObjectToName(obj.(*v1.Secret)).String()
×
215
        klog.V(3).Infof("enqueue add CA %s", key)
×
216
        c.ipsecQueue.Add(key)
×
217
}
×
218

219
func (c *Controller) enqueueUpdateIPSecCA(oldObj, newObj any) {
×
220
        oldSecret := oldObj.(*v1.Secret)
×
221
        newSecret := newObj.(*v1.Secret)
×
222
        if maps.EqualFunc(oldSecret.Data, newSecret.Data, bytes.Equal) {
×
223
                // No changes in CA data, no need to enqueue
×
224
                return
×
225
        }
×
226

227
        key := cache.MetaObjectToName(newSecret).String()
×
228
        klog.V(3).Infof("enqueue update CA %s", key)
×
229
        c.ipsecQueue.Add(key)
×
230
}
231

232
func (c *Controller) enqueueAddProviderNetwork(obj any) {
×
233
        key := cache.MetaObjectToName(obj.(*kubeovnv1.ProviderNetwork)).String()
×
234
        klog.V(3).Infof("enqueue add provider network %s", key)
×
235
        c.addOrUpdateProviderNetworkQueue.Add(key)
×
236
}
×
237

238
func (c *Controller) enqueueUpdateProviderNetwork(_, newObj any) {
×
239
        key := cache.MetaObjectToName(newObj.(*kubeovnv1.ProviderNetwork)).String()
×
240
        klog.V(3).Infof("enqueue update provider network %s", key)
×
241
        c.addOrUpdateProviderNetworkQueue.Add(key)
×
242
}
×
243

244
func (c *Controller) enqueueDeleteProviderNetwork(obj any) {
×
245
        var pn *kubeovnv1.ProviderNetwork
×
246
        switch t := obj.(type) {
×
247
        case *kubeovnv1.ProviderNetwork:
×
248
                pn = t
×
249
        case cache.DeletedFinalStateUnknown:
×
250
                p, ok := t.Obj.(*kubeovnv1.ProviderNetwork)
×
251
                if !ok {
×
252
                        klog.Warningf("unexpected object type: %T", t.Obj)
×
253
                        return
×
254
                }
×
255
                pn = p
×
256
        default:
×
257
                klog.Warningf("unexpected type: %T", obj)
×
258
                return
×
259
        }
260

261
        key := cache.MetaObjectToName(pn).String()
×
262
        klog.V(3).Infof("enqueue delete provider network %s", key)
×
263
        c.deleteProviderNetworkQueue.Add(pn)
×
264
}
265

266
func (c *Controller) runAddOrUpdateProviderNetworkWorker() {
×
267
        for c.processNextAddOrUpdateProviderNetworkWorkItem() {
×
268
        }
×
269
}
270

271
func (c *Controller) runDeleteProviderNetworkWorker() {
×
272
        for c.processNextDeleteProviderNetworkWorkItem() {
×
273
        }
×
274
}
275

276
func (c *Controller) processNextAddOrUpdateProviderNetworkWorkItem() bool {
×
277
        key, shutdown := c.addOrUpdateProviderNetworkQueue.Get()
×
278
        if shutdown {
×
279
                return false
×
280
        }
×
281

282
        err := func(key string) error {
×
283
                defer c.addOrUpdateProviderNetworkQueue.Done(key)
×
284
                if err := c.handleAddOrUpdateProviderNetwork(key); err != nil {
×
285
                        return fmt.Errorf("error syncing %q: %w, requeuing", key, err)
×
286
                }
×
287
                c.addOrUpdateProviderNetworkQueue.Forget(key)
×
288
                return nil
×
289
        }(key)
290
        if err != nil {
×
291
                utilruntime.HandleError(err)
×
292
                c.addOrUpdateProviderNetworkQueue.AddRateLimited(key)
×
293
                return true
×
294
        }
×
295
        return true
×
296
}
297

298
func (c *Controller) processNextDeleteProviderNetworkWorkItem() bool {
×
299
        obj, shutdown := c.deleteProviderNetworkQueue.Get()
×
300
        if shutdown {
×
301
                return false
×
302
        }
×
303

304
        err := func(obj *kubeovnv1.ProviderNetwork) error {
×
305
                defer c.deleteProviderNetworkQueue.Done(obj)
×
306
                if err := c.handleDeleteProviderNetwork(obj); err != nil {
×
307
                        return fmt.Errorf("error syncing %q: %w, requeuing", obj.Name, err)
×
308
                }
×
309
                c.deleteProviderNetworkQueue.Forget(obj)
×
310
                return nil
×
311
        }(obj)
312
        if err != nil {
×
313
                utilruntime.HandleError(err)
×
314
                c.deleteProviderNetworkQueue.AddRateLimited(obj)
×
315
                return true
×
316
        }
×
317
        return true
×
318
}
319

320
func (c *Controller) handleAddOrUpdateProviderNetwork(key string) error {
×
321
        klog.V(3).Infof("handle update provider network %s", key)
×
322
        node, err := c.nodesLister.Get(c.config.NodeName)
×
323
        if err != nil {
×
324
                klog.Error(err)
×
325
                return err
×
326
        }
×
327
        pn, err := c.providerNetworksLister.Get(key)
×
328
        if err != nil {
×
329
                if k8serrors.IsNotFound(err) {
×
330
                        return nil
×
331
                }
×
332
                klog.Error(err)
×
333
                return err
×
334
        }
335

336
        excluded, err := util.IsNodeExcludedFromProviderNetwork(node, pn)
×
337
        if err != nil {
×
338
                klog.Error(err)
×
339
                return err
×
340
        }
×
341

342
        if excluded {
×
343
                c.recordProviderNetworkErr(pn.Name, "")
×
344
                return c.cleanProviderNetwork(pn.DeepCopy(), node.DeepCopy())
×
345
        }
×
346
        return c.initProviderNetwork(pn.DeepCopy(), node.DeepCopy())
×
347
}
348

349
func (c *Controller) initProviderNetwork(pn *kubeovnv1.ProviderNetwork, node *v1.Node) error {
×
350
        nic := pn.Spec.DefaultInterface
×
351
        for _, item := range pn.Spec.CustomInterfaces {
×
352
                if slices.Contains(item.Nodes, node.Name) {
×
353
                        nic = item.Interface
×
354
                        break
×
355
                }
356
        }
357

358
        patch := util.KVPatch{
×
359
                fmt.Sprintf(util.ProviderNetworkReadyTemplate, pn.Name):     nil,
×
360
                fmt.Sprintf(util.ProviderNetworkInterfaceTemplate, pn.Name): nil,
×
361
                fmt.Sprintf(util.ProviderNetworkMtuTemplate, pn.Name):       nil,
×
362
                fmt.Sprintf(util.ProviderNetworkExcludeTemplate, pn.Name):   nil,
×
363
        }
×
364

×
365
        vlans := strset.NewWithSize(len(pn.Status.Vlans) + 1)
×
366
        for _, vlanName := range pn.Status.Vlans {
×
367
                vlan, err := c.vlansLister.Get(vlanName)
×
368
                if err != nil {
×
369
                        if k8serrors.IsNotFound(err) {
×
370
                                klog.Infof("vlan %s not found", vlanName)
×
371
                                continue
×
372
                        }
373
                        klog.Errorf("failed to get vlan %q: %v", vlanName, err)
×
374
                        return err
×
375
                }
376
                vlans.Add(strconv.Itoa(vlan.Spec.ID))
×
377
        }
378
        // always add trunk 0 so that the ovs bridge can communicate with the external network
379
        vlans.Add("0")
×
380

×
381
        var mtu int
×
382
        var err error
×
383
        klog.V(3).Infof("ovs init provider network %s", pn.Name)
×
384
        if mtu, err = c.ovsInitProviderNetwork(pn.Name, nic, vlans.List(), pn.Spec.ExchangeLinkName, c.config.MacLearningFallback); err != nil {
×
385
                delete(patch, fmt.Sprintf(util.ProviderNetworkExcludeTemplate, pn.Name))
×
386
                if err1 := util.PatchLabels(c.config.KubeClient.CoreV1().Nodes(), node.Name, patch); err1 != nil {
×
387
                        klog.Errorf("failed to patch annotations of node %s: %v", node.Name, err1)
×
388
                }
×
389
                c.recordProviderNetworkErr(pn.Name, err.Error())
×
390
                return err
×
391
        }
392

393
        patch[fmt.Sprintf(util.ProviderNetworkReadyTemplate, pn.Name)] = "true"
×
394
        patch[fmt.Sprintf(util.ProviderNetworkInterfaceTemplate, pn.Name)] = nic
×
395
        patch[fmt.Sprintf(util.ProviderNetworkMtuTemplate, pn.Name)] = strconv.Itoa(mtu)
×
396
        if err = util.PatchLabels(c.config.KubeClient.CoreV1().Nodes(), node.Name, patch); err != nil {
×
397
                klog.Errorf("failed to patch labels of node %s: %v", node.Name, err)
×
398
                return err
×
399
        }
×
400
        c.recordProviderNetworkErr(pn.Name, "")
×
401
        return nil
×
402
}
403

404
func (c *Controller) recordProviderNetworkErr(providerNetwork, errMsg string) {
×
405
        var currentPod *v1.Pod
×
406
        var err error
×
407
        if c.localPodName == "" {
×
408
                pods, err := c.config.KubeClient.CoreV1().Pods(v1.NamespaceAll).List(context.Background(), metav1.ListOptions{
×
409
                        LabelSelector: "app=kube-ovn-cni",
×
410
                        FieldSelector: "spec.nodeName=" + c.config.NodeName,
×
411
                })
×
412
                if err != nil {
×
413
                        klog.Errorf("failed to list pod: %v", err)
×
414
                        return
×
415
                }
×
416
                for _, pod := range pods.Items {
×
417
                        if pod.Spec.NodeName == c.config.NodeName && pod.Status.Phase == v1.PodRunning {
×
418
                                c.localPodName = pod.Name
×
419
                                c.localNamespace = pod.Namespace
×
420
                                currentPod = &pod
×
421
                                break
×
422
                        }
423
                }
424
                if currentPod == nil {
×
425
                        klog.Warning("failed to get self pod")
×
426
                        return
×
427
                }
×
428
        } else {
×
429
                if currentPod, err = c.podsLister.Pods(c.localNamespace).Get(c.localPodName); err != nil {
×
430
                        klog.Errorf("failed to get pod %s, %v", c.localPodName, err)
×
431
                        return
×
432
                }
×
433
        }
434

435
        patch := util.KVPatch{}
×
436
        if currentPod.Annotations[fmt.Sprintf(util.ProviderNetworkErrMessageTemplate, providerNetwork)] != errMsg {
×
437
                if errMsg == "" {
×
438
                        patch[fmt.Sprintf(util.ProviderNetworkErrMessageTemplate, providerNetwork)] = nil
×
439
                } else {
×
440
                        patch[fmt.Sprintf(util.ProviderNetworkErrMessageTemplate, providerNetwork)] = errMsg
×
441
                }
×
442
                if err = util.PatchAnnotations(c.config.KubeClient.CoreV1().Pods(c.localNamespace), c.localPodName, patch); err != nil {
×
443
                        klog.Errorf("failed to patch pod %s: %v", c.localPodName, err)
×
444
                        return
×
445
                }
×
446
        }
447
}
448

449
func (c *Controller) cleanProviderNetwork(pn *kubeovnv1.ProviderNetwork, node *v1.Node) error {
×
450
        patch := util.KVPatch{
×
451
                fmt.Sprintf(util.ProviderNetworkReadyTemplate, pn.Name):     nil,
×
452
                fmt.Sprintf(util.ProviderNetworkInterfaceTemplate, pn.Name): nil,
×
453
                fmt.Sprintf(util.ProviderNetworkMtuTemplate, pn.Name):       nil,
×
454
                fmt.Sprintf(util.ProviderNetworkExcludeTemplate, pn.Name):   "true",
×
455
        }
×
456
        if err := util.PatchLabels(c.config.KubeClient.CoreV1().Nodes(), node.Name, patch); err != nil {
×
457
                klog.Errorf("failed to patch labels of node %s: %v", node.Name, err)
×
458
                return err
×
459
        }
×
460

461
        return c.ovsCleanProviderNetwork(pn.Name)
×
462
}
463

464
func (c *Controller) handleDeleteProviderNetwork(pn *kubeovnv1.ProviderNetwork) error {
×
465
        if err := c.ovsCleanProviderNetwork(pn.Name); err != nil {
×
466
                klog.Error(err)
×
467
                return err
×
468
        }
×
469

470
        node, err := c.nodesLister.Get(c.config.NodeName)
×
471
        if err != nil {
×
472
                klog.Error(err)
×
473
                return err
×
474
        }
×
475
        if len(node.Labels) == 0 {
×
476
                return nil
×
477
        }
×
478

479
        patch := util.KVPatch{
×
480
                fmt.Sprintf(util.ProviderNetworkReadyTemplate, pn.Name):     nil,
×
481
                fmt.Sprintf(util.ProviderNetworkInterfaceTemplate, pn.Name): nil,
×
482
                fmt.Sprintf(util.ProviderNetworkMtuTemplate, pn.Name):       nil,
×
483
                fmt.Sprintf(util.ProviderNetworkExcludeTemplate, pn.Name):   nil,
×
484
        }
×
485
        if err = util.PatchLabels(c.config.KubeClient.CoreV1().Nodes(), node.Name, patch); err != nil {
×
486
                klog.Errorf("failed to patch labels of node %s: %v", node.Name, err)
×
487
                return err
×
488
        }
×
489

490
        return nil
×
491
}
492

493
func (c *Controller) enqueueUpdateVlan(oldObj, newObj any) {
×
494
        oldVlan := oldObj.(*kubeovnv1.Vlan)
×
495
        newVlan := newObj.(*kubeovnv1.Vlan)
×
496
        if oldVlan.Spec.ID != newVlan.Spec.ID {
×
497
                klog.V(3).Infof("enqueue update provider network %q", newVlan.Spec.Provider)
×
498
                c.addOrUpdateProviderNetworkQueue.Add(newVlan.Spec.Provider)
×
499
        }
×
500
}
501

502
// subnetEvent is the item type of the subnet work queue. Add events set only
// newObj, delete events set only oldObj, and update events set both.
type subnetEvent struct {
	oldObj any
	newObj any
}
505

506
// serviceEvent is the item type of the service work queue. Add events set
// only newObj, delete events set only oldObj, and update events set both.
type serviceEvent struct {
	oldObj any
	newObj any
}
509

510
// podEvent is the item type of the pod delete work queue; oldObj holds the
// deleted pod.
type podEvent struct {
	oldObj any
}
513

514
func (c *Controller) enqueueAddSubnet(obj any) {
×
515
        c.subnetQueue.Add(&subnetEvent{newObj: obj})
×
516
}
×
517

518
func (c *Controller) enqueueUpdateSubnet(oldObj, newObj any) {
×
519
        c.subnetQueue.Add(&subnetEvent{oldObj: oldObj, newObj: newObj})
×
520
}
×
521

522
func (c *Controller) enqueueDeleteSubnet(obj any) {
×
523
        c.subnetQueue.Add(&subnetEvent{oldObj: obj})
×
524
}
×
525

526
func (c *Controller) runSubnetWorker() {
×
527
        for c.processNextSubnetWorkItem() {
×
528
        }
×
529
}
530

531
func (c *Controller) enqueueAddService(obj any) {
×
532
        c.serviceQueue.Add(&serviceEvent{newObj: obj})
×
533
}
×
534

535
func (c *Controller) enqueueUpdateService(oldObj, newObj any) {
×
536
        c.serviceQueue.Add(&serviceEvent{oldObj: oldObj, newObj: newObj})
×
537
}
×
538

539
func (c *Controller) enqueueDeleteService(obj any) {
×
540
        c.serviceQueue.Add(&serviceEvent{oldObj: obj})
×
541
}
×
542

543
func (c *Controller) runAddOrUpdateServicekWorker() {
×
544
        for c.processNextServiceWorkItem() {
×
545
        }
×
546
}
547

548
func (c *Controller) processNextSubnetWorkItem() bool {
×
549
        obj, shutdown := c.subnetQueue.Get()
×
550
        if shutdown {
×
551
                return false
×
552
        }
×
553

554
        err := func(obj *subnetEvent) error {
×
555
                defer c.subnetQueue.Done(obj)
×
556
                if err := c.reconcileRouters(obj); err != nil {
×
557
                        c.subnetQueue.AddRateLimited(obj)
×
558
                        return fmt.Errorf("error syncing %v: %w, requeuing", obj, err)
×
559
                }
×
560
                c.subnetQueue.Forget(obj)
×
561
                return nil
×
562
        }(obj)
563
        if err != nil {
×
564
                utilruntime.HandleError(err)
×
565
                return true
×
566
        }
×
567
        return true
×
568
}
569

570
func (c *Controller) processNextServiceWorkItem() bool {
×
571
        obj, shutdown := c.serviceQueue.Get()
×
572
        if shutdown {
×
573
                return false
×
574
        }
×
575

576
        err := func(obj *serviceEvent) error {
×
577
                defer c.serviceQueue.Done(obj)
×
578
                if err := c.reconcileServices(obj); err != nil {
×
579
                        c.serviceQueue.AddRateLimited(obj)
×
580
                        return fmt.Errorf("error syncing %v: %w, requeuing", obj, err)
×
581
                }
×
582
                c.serviceQueue.Forget(obj)
×
583
                return nil
×
584
        }(obj)
585
        if err != nil {
×
586
                utilruntime.HandleError(err)
×
587
                return true
×
588
        }
×
589
        return true
×
590
}
591

592
func (c *Controller) enqueueUpdatePod(oldObj, newObj any) {
×
593
        oldPod := oldObj.(*v1.Pod)
×
594
        newPod := newObj.(*v1.Pod)
×
595
        key := cache.MetaObjectToName(newPod).String()
×
596

×
597
        if oldPod.Annotations[util.IngressRateAnnotation] != newPod.Annotations[util.IngressRateAnnotation] ||
×
598
                oldPod.Annotations[util.EgressRateAnnotation] != newPod.Annotations[util.EgressRateAnnotation] ||
×
599
                oldPod.Annotations[util.NetemQosLatencyAnnotation] != newPod.Annotations[util.NetemQosLatencyAnnotation] ||
×
600
                oldPod.Annotations[util.NetemQosJitterAnnotation] != newPod.Annotations[util.NetemQosJitterAnnotation] ||
×
601
                oldPod.Annotations[util.NetemQosLimitAnnotation] != newPod.Annotations[util.NetemQosLimitAnnotation] ||
×
602
                oldPod.Annotations[util.NetemQosLossAnnotation] != newPod.Annotations[util.NetemQosLossAnnotation] ||
×
603
                oldPod.Annotations[util.MirrorControlAnnotation] != newPod.Annotations[util.MirrorControlAnnotation] ||
×
604
                oldPod.Annotations[util.IPAddressAnnotation] != newPod.Annotations[util.IPAddressAnnotation] {
×
605
                c.updatePodQueue.Add(key)
×
606
                return
×
607
        }
×
608

609
        attachNets, err := nadutils.ParsePodNetworkAnnotation(newPod)
×
610
        if err != nil {
×
611
                return
×
612
        }
×
613
        for _, multiNet := range attachNets {
×
614
                provider := fmt.Sprintf("%s.%s.%s", multiNet.Name, multiNet.Namespace, util.OvnProvider)
×
615
                if newPod.Annotations[fmt.Sprintf(util.AllocatedAnnotationTemplate, provider)] == "true" {
×
616
                        if oldPod.Annotations[fmt.Sprintf(util.IngressRateAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.IngressRateAnnotationTemplate, provider)] ||
×
617
                                oldPod.Annotations[fmt.Sprintf(util.EgressRateAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.EgressRateAnnotationTemplate, provider)] ||
×
618
                                oldPod.Annotations[fmt.Sprintf(util.NetemQosLatencyAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.NetemQosLatencyAnnotationTemplate, provider)] ||
×
619
                                oldPod.Annotations[fmt.Sprintf(util.NetemQosJitterAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.NetemQosJitterAnnotationTemplate, provider)] ||
×
620
                                oldPod.Annotations[fmt.Sprintf(util.NetemQosLimitAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.NetemQosLimitAnnotationTemplate, provider)] ||
×
621
                                oldPod.Annotations[fmt.Sprintf(util.NetemQosLossAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.NetemQosLossAnnotationTemplate, provider)] ||
×
622
                                oldPod.Annotations[fmt.Sprintf(util.MirrorControlAnnotationTemplate, provider)] != newPod.Annotations[fmt.Sprintf(util.MirrorControlAnnotationTemplate, provider)] {
×
623
                                c.updatePodQueue.Add(key)
×
624
                        }
×
625
                }
626
        }
627
}
628

629
func (c *Controller) enqueueDeletePod(obj any) {
×
630
        var pod *v1.Pod
×
631
        switch t := obj.(type) {
×
632
        case *v1.Pod:
×
633
                pod = t
×
634
        case cache.DeletedFinalStateUnknown:
×
635
                p, ok := t.Obj.(*v1.Pod)
×
636
                if !ok {
×
637
                        klog.Warningf("unexpected object type: %T", t.Obj)
×
638
                        return
×
639
                }
×
640
                pod = p
×
641
        default:
×
642
                klog.Warningf("unexpected type: %T", obj)
×
643
                return
×
644
        }
645

646
        klog.V(3).Infof("enqueue delete pod %s", pod.Name)
×
647
        c.deletePodQueue.Add(&podEvent{oldObj: pod})
×
648
}
649

650
func (c *Controller) runUpdatePodWorker() {
×
651
        for c.processNextUpdatePodWorkItem() {
×
652
        }
×
653
}
654

655
func (c *Controller) runDeletePodWorker() {
×
656
        for c.processNextDeletePodWorkItem() {
×
657
        }
×
658
}
659

660
func (c *Controller) processNextUpdatePodWorkItem() bool {
×
661
        key, shutdown := c.updatePodQueue.Get()
×
662
        if shutdown {
×
663
                return false
×
664
        }
×
665

666
        err := func(key string) error {
×
667
                defer c.updatePodQueue.Done(key)
×
668
                if err := c.handleUpdatePod(key); err != nil {
×
669
                        c.updatePodQueue.AddRateLimited(key)
×
670
                        return fmt.Errorf("error syncing %q: %w, requeuing", key, err)
×
671
                }
×
672
                c.updatePodQueue.Forget(key)
×
673
                return nil
×
674
        }(key)
675
        if err != nil {
×
676
                utilruntime.HandleError(err)
×
677
                return true
×
678
        }
×
679
        return true
×
680
}
681

682
func (c *Controller) processNextDeletePodWorkItem() bool {
×
683
        event, shutdown := c.deletePodQueue.Get()
×
684
        if shutdown {
×
685
                return false
×
686
        }
×
687

688
        err := func(event *podEvent) error {
×
689
                defer c.deletePodQueue.Done(event)
×
690
                if err := c.handleDeletePod(event); err != nil {
×
691
                        c.deletePodQueue.AddRateLimited(event)
×
692
                        return fmt.Errorf("error syncing pod event: %w, requeuing", err)
×
693
                }
×
694
                c.deletePodQueue.Forget(event)
×
695
                return nil
×
696
        }(event)
697
        if err != nil {
×
698
                utilruntime.HandleError(err)
×
699
                return true
×
700
        }
×
701
        return true
×
702
}
703

704
func (c *Controller) gcInterfaces() {
×
705
        interfacePodMap, err := ovs.ListInterfacePodMap()
×
706
        if err != nil {
×
707
                klog.Errorf("failed to list interface pod map: %v", err)
×
708
                return
×
709
        }
×
710
        for iface, pod := range interfacePodMap {
×
711
                parts := strings.Split(pod, "/")
×
712
                if len(parts) < 3 {
×
713
                        klog.Errorf("malformed pod string %q for interface %s, expected format 'namespace/name/errText'", pod, iface)
×
714
                        continue
×
715
                }
716

717
                podNamespace, podName, errText := parts[0], parts[1], parts[2]
×
718
                if strings.Contains(errText, "No such device") {
×
719
                        klog.Infof("pod %s/%s not found, delete ovs interface %s", podNamespace, podName, iface)
×
720
                        if err := ovs.CleanInterface(iface); err != nil {
×
721
                                klog.Errorf("failed to clean ovs interface %s: %v", iface, err)
×
722
                        }
×
723
                        continue
×
724
                }
725

NEW
726
                if _, err := c.podsLister.Pods(podNamespace).Get(podName); err != nil && k8serrors.IsNotFound(err) {
×
NEW
727
                        // Pod not found by name. Check if this might be a KubeVirt VM.
×
NEW
728
                        // For KubeVirt VMs, the pod_name in OVS external_ids is set to the VM name (not the launcher pod name).
×
NEW
729
                        // The actual launcher pod has the label 'vm.kubevirt.io/name' with the VM name as value.
×
NEW
730
                        // Try to find launcher pods by this label.
×
NEW
731
                        selector := labels.SelectorFromSet(map[string]string{util.KubeVirtVMNameLabel: podName})
×
NEW
732
                        launcherPods, listErr := c.podsLister.Pods(podNamespace).List(selector)
×
NEW
733
                        if listErr != nil {
×
NEW
734
                                klog.Errorf("failed to list launcher pods for vm %s/%s: %v", podNamespace, podName, listErr)
×
NEW
735
                                continue
×
736
                        }
737

738
                        // If we found launcher pod(s) for this VM, keep the interface
NEW
739
                        if len(launcherPods) > 0 {
×
NEW
740
                                klog.V(5).Infof("found %d launcher pod(s) for vm %s/%s, keeping ovs interface %s",
×
NEW
741
                                        len(launcherPods), podNamespace, podName, iface)
×
NEW
742
                                continue
×
743
                        }
744

745
                        // No pod and no launcher pod found - safe to delete
NEW
746
                        klog.Infof("pod %s/%s not found, delete ovs interface %s", podNamespace, podName, iface)
×
NEW
747
                        if err := ovs.CleanInterface(iface); err != nil {
×
NEW
748
                                klog.Errorf("failed to clean ovs interface %s: %v", iface, err)
×
UNCOV
749
                        }
×
750
                }
751
        }
752
}
753

754
func (c *Controller) runIPSecWorker() {
×
755
        if err := c.StartIPSecService(); err != nil {
×
756
                klog.Errorf("starting ipsec service: %v", err)
×
757
        }
×
758

759
        for c.processNextIPSecWorkItem() {
×
760
        }
×
761
}
762

763
func (c *Controller) processNextIPSecWorkItem() bool {
×
764
        key, shutdown := c.ipsecQueue.Get()
×
765
        if shutdown {
×
766
                return false
×
767
        }
×
768
        defer c.ipsecQueue.Done(key)
×
769

×
770
        err := func(key string) error {
×
771
                if err := c.SyncIPSecKeys(key); err != nil {
×
772
                        c.ipsecQueue.AddRateLimited(key)
×
773
                        return fmt.Errorf("error syncing %q: %w, requeuing", key, err)
×
774
                }
×
775
                c.ipsecQueue.Forget(key)
×
776
                return nil
×
777
        }(key)
778
        if err != nil {
×
779
                utilruntime.HandleError(err)
×
780
                return true
×
781
        }
×
782
        return true
×
783
}
784

785
// Run starts controller
786
func (c *Controller) Run(stopCh <-chan struct{}) {
×
787
        defer utilruntime.HandleCrash()
×
788
        defer c.addOrUpdateProviderNetworkQueue.ShutDown()
×
789
        defer c.deleteProviderNetworkQueue.ShutDown()
×
790
        defer c.subnetQueue.ShutDown()
×
791
        defer c.serviceQueue.ShutDown()
×
792
        defer c.updatePodQueue.ShutDown()
×
793
        defer c.deletePodQueue.ShutDown()
×
794
        defer c.ipsecQueue.ShutDown()
×
795
        go wait.Until(c.gcInterfaces, time.Minute, stopCh)
×
796
        go wait.Until(recompute, 10*time.Minute, stopCh)
×
797
        go wait.Until(rotateLog, 1*time.Hour, stopCh)
×
798

×
799
        if err := c.setIPSet(); err != nil {
×
800
                util.LogFatalAndExit(err, "failed to set ipsets")
×
801
        }
×
802

803
        klog.Info("Started workers")
×
804
        go wait.Until(c.loopOvn0Check, 5*time.Second, stopCh)
×
805
        go wait.Until(c.loopOvnExt0Check, 5*time.Second, stopCh)
×
806
        go wait.Until(c.loopTunnelCheck, 5*time.Second, stopCh)
×
807
        go wait.Until(c.runAddOrUpdateProviderNetworkWorker, time.Second, stopCh)
×
808
        go wait.Until(c.runAddOrUpdateServicekWorker, time.Second, stopCh)
×
809
        go wait.Until(c.runDeleteProviderNetworkWorker, time.Second, stopCh)
×
810
        go wait.Until(c.runSubnetWorker, time.Second, stopCh)
×
811
        go wait.Until(c.runUpdatePodWorker, time.Second, stopCh)
×
812
        go wait.Until(c.runDeletePodWorker, time.Second, stopCh)
×
813
        go wait.Until(c.runIPSecWorker, 3*time.Second, stopCh)
×
814
        go wait.Until(c.runGateway, 3*time.Second, stopCh)
×
815
        go wait.Until(c.loopEncapIPCheck, 3*time.Second, stopCh)
×
816
        go wait.Until(c.ovnMetricsUpdate, 3*time.Second, stopCh)
×
817
        go wait.Until(func() {
×
818
                if err := c.reconcileRouters(nil); err != nil {
×
819
                        klog.Errorf("failed to reconcile ovn0 routes: %v", err)
×
820
                }
×
821
        }, 3*time.Second, stopCh)
822

823
        if c.config.EnableTProxy {
×
824
                go c.StartTProxyForwarding()
×
825
                go wait.Until(c.runTProxyConfigWorker, 3*time.Second, stopCh)
×
826
                // Using the tproxy method, kubelet's TCP probe packets cannot reach the namespace of the pod of the custom VPC,
×
827
                // so tproxy itself probes the pod of the custom VPC, if probe failed remove the iptable rules from
×
828
                // kubelet to tproxy, if probe success recover the iptable rules
×
829
                go wait.Until(c.StartTProxyTCPPortProbe, 1*time.Second, stopCh)
×
830
        } else {
×
831
                c.cleanTProxyConfig()
×
832
        }
×
833

834
        if !c.config.EnableOVNIPSec {
×
835
                if err := c.StopAndClearIPSecResource(); err != nil {
×
836
                        klog.Errorf("stop and clear ipsec resource error: %v", err)
×
837
                }
×
838
        }
839

840
        <-stopCh
×
841
        klog.Info("Shutting down workers")
×
842
}
843

844
func recompute() {
×
845
        output, err := exec.Command("ovn-appctl", "-t", "ovn-controller", "inc-engine/recompute").CombinedOutput()
×
846
        if err != nil {
×
847
                klog.Errorf("failed to recompute ovn-controller %q", output)
×
848
        }
×
849
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc