Drivers: hv: vmbus: Fix duplicate CPU assignments within a device

author Haiyang Zhang <haiyangz@microsoft.com>

Fri, 16 Jul 2021 18:21:13 +0000 (11:21 -0700)

committer Wei Liu <wei.liu@kernel.org>

Mon, 19 Jul 2021 09:26:31 +0000 (09:26 +0000)
author Haiyang Zhang <haiyangz@microsoft.com>
Fri, 16 Jul 2021 18:21:13 +0000 (11:21 -0700)
committer Wei Liu <wei.liu@kernel.org>
Mon, 19 Jul 2021 09:26:31 +0000 (09:26 +0000)
diff --git a/drivers/hv/channel_mgmt.c b/drivers/hv/channel_mgmt.c

index caf6d0c4bc1b1d72efeb1e0d0b2bd2c81321241d..142308526ec6ae49468fb86f984ec0609d1ac186 100644 (file)
--- a/drivers/hv/channel_mgmt.c
+++ b/drivers/hv/channel_mgmt.c
@@ -605,6 +605,17 @@ static void vmbus_process_offer(struct vmbus_channel *newchannel)
          */
         mutex_lock(&vmbus_connection.channel_mutex);
  
+       list_for_each_entry(channel, &vmbus_connection.chn_list, listentry) {
+               if (guid_equal(&channel->offermsg.offer.if_type,
+                              &newchannel->offermsg.offer.if_type) &&
+                   guid_equal(&channel->offermsg.offer.if_instance,
+                              &newchannel->offermsg.offer.if_instance)) {
+                       fnew = false;
+                       newchannel->primary_channel = channel;
+                       break;
+               }
+       }
+
         init_vp_index(newchannel);
  
         /* Remember the channels that should be cleaned up upon suspend. */
@@ -617,16 +628,6 @@ static void vmbus_process_offer(struct vmbus_channel *newchannel)
          */
         atomic_dec(&vmbus_connection.offer_in_progress);
  
-       list_for_each_entry(channel, &vmbus_connection.chn_list, listentry) {
-               if (guid_equal(&channel->offermsg.offer.if_type,
-                              &newchannel->offermsg.offer.if_type) &&
-                   guid_equal(&channel->offermsg.offer.if_instance,
-                              &newchannel->offermsg.offer.if_instance)) {
-                       fnew = false;
-                       break;
-               }
-       }
-
         if (fnew) {
                 list_add_tail(&newchannel->listentry,
                               &vmbus_connection.chn_list);
@@ -647,7 +648,6 @@ static void vmbus_process_offer(struct vmbus_channel *newchannel)
                 /*
                  * Process the sub-channel.
                  */
-               newchannel->primary_channel = channel;
                 list_add_tail(&newchannel->sc_list, &channel->sc_list);
         }
  
@@ -683,6 +683,30 @@ static void vmbus_process_offer(struct vmbus_channel *newchannel)
         queue_work(wq, &newchannel->add_channel_work);
  }
  
+/*
+ * Check if @cpu is already used by another channel of the same device.
+ * Call only from init_vp_index(), with vmbus_connection.channel_mutex held.
+ */
+static bool hv_cpuself_used(u32 cpu, struct vmbus_channel *chn)
+{
+       struct vmbus_channel *primary = chn->primary_channel;
+       struct vmbus_channel *sc;
+
+       lockdep_assert_held(&vmbus_connection.channel_mutex);
+
+       if (!primary)
+               return false;
+
+       if (primary->target_cpu == cpu)
+               return true;
+
+       list_for_each_entry(sc, &primary->sc_list, sc_list)
+               if (sc != chn && sc->target_cpu == cpu)
+                       return true;
+
+       return false;
+}
+
  /*
   * We use this state to statically distribute the channel interrupt load.
   */
@@ -702,6 +726,7 @@ static int next_numa_node_id;
  static void init_vp_index(struct vmbus_channel *channel)
  {
         bool perf_chn = hv_is_perf_channel(channel);
+       u32 i, ncpu = num_online_cpus();
         cpumask_var_t available_mask;
         struct cpumask *alloced_mask;
         u32 target_cpu;
@@ -724,31 +749,38 @@ static void init_vp_index(struct vmbus_channel *channel)
                 return;
         }
  
-       while (true) {
-               numa_node = next_numa_node_id++;
-               if (numa_node == nr_node_ids) {
-                       next_numa_node_id = 0;
-                       continue;
+       for (i = 1; i <= ncpu + 1; i++) {
+               while (true) {
+                       numa_node = next_numa_node_id++;
+                       if (numa_node == nr_node_ids) {
+                               next_numa_node_id = 0;
+                               continue;
+                       }
+                       if (cpumask_empty(cpumask_of_node(numa_node)))
+                               continue;
+                       break;
+               }
+               alloced_mask = &hv_context.hv_numa_map[numa_node];
+
+               if (cpumask_weight(alloced_mask) ==
+                   cpumask_weight(cpumask_of_node(numa_node))) {
+                       /*
+                        * We have cycled through all the CPUs in the node;
+                        * reset the alloced map.
+                        */
+                       cpumask_clear(alloced_mask);
                 }
-               if (cpumask_empty(cpumask_of_node(numa_node)))
-                       continue;
-               break;
-       }
-       alloced_mask = &hv_context.hv_numa_map[numa_node];
  
-       if (cpumask_weight(alloced_mask) ==
-           cpumask_weight(cpumask_of_node(numa_node))) {
-               /*
-                * We have cycled through all the CPUs in the node;
-                * reset the alloced map.
-                */
-               cpumask_clear(alloced_mask);
-       }
+               cpumask_xor(available_mask, alloced_mask,
+                           cpumask_of_node(numa_node));
  
-       cpumask_xor(available_mask, alloced_mask, cpumask_of_node(numa_node));
+               target_cpu = cpumask_first(available_mask);
+               cpumask_set_cpu(target_cpu, alloced_mask);
  
-       target_cpu = cpumask_first(available_mask);
-       cpumask_set_cpu(target_cpu, alloced_mask);
+               if (channel->offermsg.offer.sub_channel_index >= ncpu ||
+                   i > ncpu || !hv_cpuself_used(target_cpu, channel))
+                       break;
+       }
  
         channel->target_cpu = target_cpu;
author	Haiyang Zhang <haiyangz@microsoft.com>
	Fri, 16 Jul 2021 18:21:13 +0000 (11:21 -0700)
committer	Wei Liu <wei.liu@kernel.org>
	Mon, 19 Jul 2021 09:26:31 +0000 (09:26 +0000)