Lines Matching +full:in +full:- +full:masks

1 // SPDX-License-Identifier: GPL-2.0
38 struct sched_group *group = sd->groups; in sched_domain_debug_one()
39 unsigned long flags = sd->flags; in sched_domain_debug_one()
44 printk(KERN_DEBUG "%*s domain-%d: ", level, "", level); in sched_domain_debug_one()
46 cpumask_pr_args(sched_domain_span(sd)), sd->name); in sched_domain_debug_one()
49 printk(KERN_ERR "ERROR: domain->span does not contain CPU%d\n", cpu); in sched_domain_debug_one()
52 printk(KERN_ERR "ERROR: domain->groups does not contain CPU%d\n", cpu); in sched_domain_debug_one()
59 if ((meta_flags & SDF_SHARED_CHILD) && sd->child && in sched_domain_debug_one()
60 !(sd->child->flags & flag)) in sched_domain_debug_one()
61 printk(KERN_ERR "ERROR: flag %s set here but not in child\n", in sched_domain_debug_one()
64 if ((meta_flags & SDF_SHARED_PARENT) && sd->parent && in sched_domain_debug_one()
65 !(sd->parent->flags & flag)) in sched_domain_debug_one()
66 printk(KERN_ERR "ERROR: flag %s set here but not in parent\n", in sched_domain_debug_one()
84 if (!(sd->flags & SD_OVERLAP) && in sched_domain_debug_one()
94 group->sgc->id, in sched_domain_debug_one()
97 if ((sd->flags & SD_OVERLAP) && in sched_domain_debug_one()
103 if (group->sgc->capacity != SCHED_CAPACITY_SCALE) in sched_domain_debug_one()
104 printk(KERN_CONT " cap=%lu", group->sgc->capacity); in sched_domain_debug_one()
106 if (group == sd->groups && sd->child && in sched_domain_debug_one()
107 !cpumask_equal(sched_domain_span(sd->child), in sched_domain_debug_one()
109 printk(KERN_ERR "ERROR: domain->groups does not match domain->child\n"); in sched_domain_debug_one()
114 group = group->next; in sched_domain_debug_one()
116 if (group != sd->groups) in sched_domain_debug_one()
119 } while (group != sd->groups); in sched_domain_debug_one()
123 printk(KERN_ERR "ERROR: groups don't span domain->span\n"); in sched_domain_debug_one()
125 if (sd->parent && in sched_domain_debug_one()
126 !cpumask_subset(groupmask, sched_domain_span(sd->parent))) in sched_domain_debug_one()
127 printk(KERN_ERR "ERROR: parent span is not a superset of domain->span\n"); in sched_domain_debug_one()
139 printk(KERN_DEBUG "CPU%d attaching NULL sched-domain.\n", cpu); in sched_domain_debug()
143 printk(KERN_DEBUG "CPU%d attaching sched-domain(s):\n", cpu); in sched_domain_debug()
149 sd = sd->parent; in sched_domain_debug()
177 if ((sd->flags & SD_DEGENERATE_GROUPS_MASK) && in sd_degenerate()
178 (sd->groups != sd->groups->next)) in sd_degenerate()
182 if (sd->flags & (SD_WAKE_AFFINE)) in sd_degenerate()
191 unsigned long cflags = sd->flags, pflags = parent->flags; in sd_parent_degenerate()
199 /* Flags needing groups don't count if only 1 group in parent */ in sd_parent_degenerate()
200 if (parent->groups == parent->groups->next) in sd_parent_degenerate()
248 pr_info("rd %*pbl: Checking EAS: frequency-invariant load tracking not yet supported", in sched_is_eas_possible()
264 gov = policy->governor; in sched_is_eas_possible()
294 return -EPERM; in sched_energy_aware_handler()
298 return -EOPNOTSUPP; in sched_energy_aware_handler()
341 tmp = pd->next; in free_pd()
352 pd = pd->next; in find_pd()
372 pd->em_pd = obj; in pd_init()
389 em_pd_nr_perf_states(pd->em_pd)); in perf_domain_debug()
390 pd = pd->next; in perf_domain_debug()
420 * 2. the SD_ASYM_CPUCAPACITY flag is set in the sched_domain hierarchy.
430 struct root_domain *rd = cpu_rq(cpu)->rd; in build_perf_domains()
447 tmp->next = pd; in build_perf_domains()
454 tmp = rd->pd; in build_perf_domains()
455 rcu_assign_pointer(rd->pd, pd); in build_perf_domains()
457 call_rcu(&tmp->rcu, destroy_perf_domain_rcu); in build_perf_domains()
463 tmp = rd->pd; in build_perf_domains()
464 rcu_assign_pointer(rd->pd, NULL); in build_perf_domains()
466 call_rcu(&tmp->rcu, destroy_perf_domain_rcu); in build_perf_domains()
478 cpupri_cleanup(&rd->cpupri); in free_rootdomain()
479 cpudl_cleanup(&rd->cpudl); in free_rootdomain()
480 free_cpumask_var(rd->dlo_mask); in free_rootdomain()
481 free_cpumask_var(rd->rto_mask); in free_rootdomain()
482 free_cpumask_var(rd->online); in free_rootdomain()
483 free_cpumask_var(rd->span); in free_rootdomain()
484 free_pd(rd->pd); in free_rootdomain()
495 if (rq->rd) { in rq_attach_root()
496 old_rd = rq->rd; in rq_attach_root()
498 if (cpumask_test_cpu(rq->cpu, old_rd->online)) in rq_attach_root()
501 cpumask_clear_cpu(rq->cpu, old_rd->span); in rq_attach_root()
506 * in this function: in rq_attach_root()
508 if (!atomic_dec_and_test(&old_rd->refcount)) in rq_attach_root()
512 atomic_inc(&rd->refcount); in rq_attach_root()
513 rq->rd = rd; in rq_attach_root()
515 cpumask_set_cpu(rq->cpu, rd->span); in rq_attach_root()
516 if (cpumask_test_cpu(rq->cpu, cpu_active_mask)) in rq_attach_root()
524 if (rq->fair_server.dl_server) in rq_attach_root()
525 __dl_server_attach_root(&rq->fair_server, rq); in rq_attach_root()
530 call_rcu(&old_rd->rcu, free_rootdomain); in rq_attach_root()
535 atomic_inc(&rd->refcount); in sched_get_rd()
540 if (!atomic_dec_and_test(&rd->refcount)) in sched_put_rd()
543 call_rcu(&rd->rcu, free_rootdomain); in sched_put_rd()
548 if (!zalloc_cpumask_var(&rd->span, GFP_KERNEL)) in init_rootdomain()
550 if (!zalloc_cpumask_var(&rd->online, GFP_KERNEL)) in init_rootdomain()
552 if (!zalloc_cpumask_var(&rd->dlo_mask, GFP_KERNEL)) in init_rootdomain()
554 if (!zalloc_cpumask_var(&rd->rto_mask, GFP_KERNEL)) in init_rootdomain()
558 rd->rto_cpu = -1; in init_rootdomain()
559 raw_spin_lock_init(&rd->rto_lock); in init_rootdomain()
560 rd->rto_push_work = IRQ_WORK_INIT_HARD(rto_push_irq_work_func); in init_rootdomain()
563 rd->visit_gen = 0; in init_rootdomain()
564 init_dl_bw(&rd->dl_bw); in init_rootdomain()
565 if (cpudl_init(&rd->cpudl) != 0) in init_rootdomain()
568 if (cpupri_init(&rd->cpupri) != 0) in init_rootdomain()
573 cpudl_cleanup(&rd->cpudl); in init_rootdomain()
575 free_cpumask_var(rd->rto_mask); in init_rootdomain()
577 free_cpumask_var(rd->dlo_mask); in init_rootdomain()
579 free_cpumask_var(rd->online); in init_rootdomain()
581 free_cpumask_var(rd->span); in init_rootdomain()
583 return -ENOMEM; in init_rootdomain()
587 * By default the system creates a single root-domain with all CPUs as
624 tmp = sg->next; in free_sched_groups()
626 if (free_sgc && atomic_dec_and_test(&sg->sgc->ref)) in free_sched_groups()
627 kfree(sg->sgc); in free_sched_groups()
629 if (atomic_dec_and_test(&sg->ref)) in free_sched_groups()
642 free_sched_groups(sd->groups, 1); in destroy_sched_domain()
644 if (sd->shared && atomic_dec_and_test(&sd->shared->ref)) in destroy_sched_domain()
645 kfree(sd->shared); in destroy_sched_domain()
654 struct sched_domain *parent = sd->parent; in destroy_sched_domains_rcu()
663 call_rcu(&sd->rcu, destroy_sched_domains_rcu); in destroy_sched_domains()
671 * Also keep a unique ID per domain (we use the first CPU number in the cpumask
672 * of the domain), this allows us to quickly tell if two CPUs are in the same
698 sds = sd->shared; in update_top_cache_domain()
713 * but equals to LLC id on non-Cluster machines. in update_top_cache_domain()
739 struct sched_domain *parent = tmp->parent; in cpu_attach_domain()
744 tmp->parent = parent->parent; in cpu_attach_domain()
746 if (parent->parent) { in cpu_attach_domain()
747 parent->parent->child = tmp; in cpu_attach_domain()
748 parent->parent->groups->flags = tmp->flags; in cpu_attach_domain()
752 * Transfer SD_PREFER_SIBLING down in case of a in cpu_attach_domain()
756 if (parent->flags & SD_PREFER_SIBLING) in cpu_attach_domain()
757 tmp->flags |= SD_PREFER_SIBLING; in cpu_attach_domain()
760 tmp = tmp->parent; in cpu_attach_domain()
765 sd = sd->parent; in cpu_attach_domain()
768 struct sched_group *sg = sd->groups; in cpu_attach_domain()
776 sg->flags = 0; in cpu_attach_domain()
777 } while (sg != sd->groups); in cpu_attach_domain()
779 sd->child = NULL; in cpu_attach_domain()
786 tmp = rq->sd; in cpu_attach_domain()
787 rcu_assign_pointer(rq->sd, sd); in cpu_attach_domain()
808 * of this group that's also in the balance mask.
824 * Given a node-distance table, for example:
834 * 0 ----- 1
838 * 3 ----- 2
842 * construct the mask of all nodes reachable in @level hops.
846 * NUMA-2 0-3 0-3 0-3 0-3
847 * groups: {0-1,3},{1-3} {0-2},{0,2-3} {1-3},{0-1,3} {0,2-3},{0-2}
849 * NUMA-1 0-1,3 0-2 1-3 0,2-3
852 * NUMA-0 0 1 2 3
856 * When we iterate a domain in child domain chunks some nodes can be
857 * represented multiple times -- hence the "overlap" naming for this part of
860 * In order to minimize this overlap, we only build enough groups to cover the
861 * domain. For instance Node-0 NUMA-2 would only get groups: 0-1,3 and 1-3.
865 * - the first group of each domain is its child domain; this
866 * gets us the first 0-1,3
867 * - the only uncovered node is 2, who's child domain is 1-3.
870 * more complicated. Consider for instance the groups of NODE-1 NUMA-2, both
871 * groups include the CPUs of Node-0, while those CPUs would not in fact ever
872 * end up at those groups (they would end up in group: 0-1,3).
875 * will contain those CPUs in the group that can reach this group given the
895 * 0 ----- 1
899 * 2 ----- 3
907 * NUMA-2 0-3 0-3
908 * groups: {0-2},{1-3} {1-3},{0-2}
910 * NUMA-1 0-2 0-3 0-3 1-3
912 * NUMA-0 0 1 2 3
930 struct sd_data *sdd = sd->private; in build_balance_mask()
937 sibling = *per_cpu_ptr(sdd->sd, i); in build_balance_mask()
940 * Can happen in the asymmetric case, where these siblings are in build_balance_mask()
944 if (!sibling->child) in build_balance_mask()
948 if (!cpumask_equal(sg_span, sched_domain_span(sibling->child))) in build_balance_mask()
954 /* We must not have empty masks here */ in build_balance_mask()
959 * XXX: This creates per-node group entries; since the load-balancer will
960 * immediately access remote memory to construct this group's load-balance
976 if (sd->child) { in build_group_from_child_sched_domain()
977 cpumask_copy(sg_span, sched_domain_span(sd->child)); in build_group_from_child_sched_domain()
978 sg->flags = sd->child->flags; in build_group_from_child_sched_domain()
983 atomic_inc(&sg->ref); in build_group_from_child_sched_domain()
991 struct sd_data *sdd = sd->private; in init_overlap_sched_group()
998 sg->sgc = *per_cpu_ptr(sdd->sgc, cpu); in init_overlap_sched_group()
999 if (atomic_inc_return(&sg->sgc->ref) == 1) in init_overlap_sched_group()
1005 * Initialize sgc->capacity such that even if we mess up the in init_overlap_sched_group()
1010 sg->sgc->capacity = SCHED_CAPACITY_SCALE * cpumask_weight(sg_span); in init_overlap_sched_group()
1011 sg->sgc->min_capacity = SCHED_CAPACITY_SCALE; in init_overlap_sched_group()
1012 sg->sgc->max_capacity = SCHED_CAPACITY_SCALE; in init_overlap_sched_group()
1022 while (sibling->child && in find_descended_sibling()
1023 !cpumask_subset(sched_domain_span(sibling->child), in find_descended_sibling()
1025 sibling = sibling->child; in find_descended_sibling()
1030 * scheduling because they will be degenerated in cpu_attach_domain in find_descended_sibling()
1032 while (sibling->child && in find_descended_sibling()
1033 cpumask_equal(sched_domain_span(sibling->child), in find_descended_sibling()
1035 sibling = sibling->child; in find_descended_sibling()
1046 struct sd_data *sdd = sd->private; in build_overlap_sched_groups()
1058 sibling = *per_cpu_ptr(sdd->sd, i); in build_overlap_sched_groups()
1061 * Asymmetric node setups can result in situations where the in build_overlap_sched_groups()
1065 * In that case build_sched_domains() will have terminated the in build_overlap_sched_groups()
1088 * 0 --- 1 --- 2 --- 3 in build_overlap_sched_groups()
1090 * NUMA-3 0-3 N/A N/A 0-3 in build_overlap_sched_groups()
1091 * groups: {0-2},{1-3} {1-3},{0-2} in build_overlap_sched_groups()
1093 * NUMA-2 0-2 0-3 0-3 1-3 in build_overlap_sched_groups()
1094 * groups: {0-1},{1-3} {0-2},{2-3} {1-3},{0-1} {2-3},{0-2} in build_overlap_sched_groups()
1096 * NUMA-1 0-1 0-2 1-3 2-3 in build_overlap_sched_groups()
1099 * NUMA-0 0 1 2 3 in build_overlap_sched_groups()
1101 * The NUMA-2 groups for nodes 0 and 3 are obviously buggered, as the in build_overlap_sched_groups()
1104 if (sibling->child && in build_overlap_sched_groups()
1105 !cpumask_subset(sched_domain_span(sibling->child), span)) in build_overlap_sched_groups()
1120 last->next = sg; in build_overlap_sched_groups()
1122 last->next = first; in build_overlap_sched_groups()
1124 sd->groups = first; in build_overlap_sched_groups()
1131 return -ENOMEM; in build_overlap_sched_groups()
1136 * Package topology (also see the load-balance blurb in fair.c)
1141 * - Simultaneous multithreading (SMT)
1142 * - Multi-Core Cache (MC)
1143 * - Package (PKG)
1149 * sched_domain -> sched_group -> sched_group_capacity
1151 * `-' `-'
1153 * The sched_domains are per-CPU and have a two way link (parent & child) and
1157 * denoting the domains of the level below (or individual CPUs in case of the
1169 * - or -
1171 * PKG 0-7 0-7 0-7 0-7 0-7 0-7 0-7 0-7
1172 * MC 0-3 0-3 0-3 0-3 4-7 4-7 4-7 4-7
1173 * SMT 0-1 0-1 2-3 2-3 4-5 4-5 6-7 6-7
1186 * - The first is the balance_cpu (see should_we_balance() and the
1187 * load-balance blurb in fair.c); for each group we only want 1 CPU to
1190 * - The second is the sched_group_capacity; we want all identical groups
1196 * for each CPU in the hierarchy.
1199 * mask is redundant and set all 1s; all CPUs in a group will end up at _that_
1200 * group), we can simply pick the first CPU in each group.
1203 * [*] in other words, the first group of each domain is its child domain.
1208 struct sched_domain *sd = *per_cpu_ptr(sdd->sd, cpu); in get_group()
1209 struct sched_domain *child = sd->child; in get_group()
1216 sg = *per_cpu_ptr(sdd->sg, cpu); in get_group()
1217 sg->sgc = *per_cpu_ptr(sdd->sgc, cpu); in get_group()
1220 already_visited = atomic_inc_return(&sg->ref) > 1; in get_group()
1222 WARN_ON(already_visited != (atomic_inc_return(&sg->sgc->ref) > 1)); in get_group()
1231 sg->flags = child->flags; in get_group()
1237 sg->sgc->capacity = SCHED_CAPACITY_SCALE * cpumask_weight(sched_group_span(sg)); in get_group()
1238 sg->sgc->min_capacity = SCHED_CAPACITY_SCALE; in get_group()
1239 sg->sgc->max_capacity = SCHED_CAPACITY_SCALE; in get_group()
1246 * covered by the given span, will set each group's ->cpumask correctly,
1247 * and will initialize their ->sgc.
1255 struct sd_data *sdd = sd->private; in build_sched_groups()
1278 last->next = sg; in build_sched_groups()
1281 last->next = first; in build_sched_groups()
1282 sd->groups = first; in build_sched_groups()
1291 * distributing the load between different sched groups in a sched domain.
1292 * Typically cpu_capacity for all the groups in a sched domain will be same
1293 * unless there are asymmetries in the topology. If there are asymmetries,
1299 struct sched_group *sg = sd->groups; in init_sched_groups_capacity()
1305 int cpu, cores = 0, max_cpu = -1; in init_sched_groups_capacity()
1307 sg->group_weight = cpumask_weight(sched_group_span(sg)); in init_sched_groups_capacity()
1316 sg->cores = cores; in init_sched_groups_capacity()
1318 if (!(sd->flags & SD_ASYM_PACKING)) in init_sched_groups_capacity()
1327 sg->asym_prefer_cpu = max_cpu; in init_sched_groups_capacity()
1330 sg = sg->next; in init_sched_groups_capacity()
1331 } while (sg != sd->groups); in init_sched_groups_capacity()
1348 * Verify whether there is any CPU capacity asymmetry in a given sched domain.
1402 if (capacity == entry->capacity) in asym_cpu_capacity_update_data()
1404 else if (!insert_entry && capacity > entry->capacity) in asym_cpu_capacity_update_data()
1411 entry->capacity = capacity; in asym_cpu_capacity_update_data()
1415 list_add_tail_rcu(&entry->link, &asym_cap_list); in asym_cpu_capacity_update_data()
1417 list_add_rcu(&entry->link, &insert_entry->link); in asym_cpu_capacity_update_data()
1423 * Build-up/update list of CPUs grouped by their capacities
1440 list_del_rcu(&entry->link); in asym_cpu_capacity_scan()
1441 call_rcu(&entry->rcu, free_asym_cap_entry); in asym_cpu_capacity_scan()
1451 list_del_rcu(&entry->link); in asym_cpu_capacity_scan()
1452 call_rcu(&entry->rcu, free_asym_cap_entry); in asym_cpu_capacity_scan()
1458 * Non-inlined to reduce accumulated stack pressure in build_sched_domains()
1461 static int default_relax_domain_level = -1;
1478 if (!attr || attr->relax_domain_level < 0) { in set_domain_attribute()
1483 request = attr->relax_domain_level; in set_domain_attribute()
1485 if (sd->level >= request) { in set_domain_attribute()
1487 sd->flags &= ~(SD_BALANCE_WAKE|SD_BALANCE_NEWIDLE); in set_domain_attribute()
1499 if (!atomic_read(&d->rd->refcount)) in __free_domain_allocs()
1500 free_rootdomain(&d->rd->rcu); in __free_domain_allocs()
1503 free_percpu(d->sd); in __free_domain_allocs()
1520 d->sd = alloc_percpu(struct sched_domain *); in __visit_domain_allocation_hell()
1521 if (!d->sd) in __visit_domain_allocation_hell()
1523 d->rd = alloc_rootdomain(); in __visit_domain_allocation_hell()
1524 if (!d->rd) in __visit_domain_allocation_hell()
1537 struct sd_data *sdd = sd->private; in claim_allocations()
1539 WARN_ON_ONCE(*per_cpu_ptr(sdd->sd, cpu) != sd); in claim_allocations()
1540 *per_cpu_ptr(sdd->sd, cpu) = NULL; in claim_allocations()
1542 if (atomic_read(&(*per_cpu_ptr(sdd->sds, cpu))->ref)) in claim_allocations()
1543 *per_cpu_ptr(sdd->sds, cpu) = NULL; in claim_allocations()
1545 if (atomic_read(&(*per_cpu_ptr(sdd->sg, cpu))->ref)) in claim_allocations()
1546 *per_cpu_ptr(sdd->sg, cpu) = NULL; in claim_allocations()
1548 if (atomic_read(&(*per_cpu_ptr(sdd->sgc, cpu))->ref)) in claim_allocations()
1549 *per_cpu_ptr(sdd->sgc, cpu) = NULL; in claim_allocations()
1564 * SD_flags allowed in topology descriptions.
1567 * behaviour. Behaviour is artificial and mapped in the below sd_init()
1578 * SD_ASYM_PACKING - describes SMT quirks
1592 struct sd_data *sdd = &tl->data; in sd_init()
1593 struct sched_domain *sd = *per_cpu_ptr(sdd->sd, cpu); in sd_init()
1601 sched_domains_curr_level = tl->numa_level; in sd_init()
1604 sd_weight = cpumask_weight(tl->mask(cpu)); in sd_init()
1606 if (tl->sd_flags) in sd_init()
1607 sd_flags = (*tl->sd_flags)(); in sd_init()
1609 "wrong sd_flags in topology description\n")) in sd_init()
1639 .name = tl->name, in sd_init()
1644 cpumask_and(sd_span, cpu_map, tl->mask(cpu)); in sd_init()
1647 sd->flags |= asym_cpu_capacity_classify(sd_span, cpu_map); in sd_init()
1649 WARN_ONCE((sd->flags & (SD_SHARE_CPUCAPACITY | SD_ASYM_CPUCAPACITY)) == in sd_init()
1657 if ((sd->flags & SD_ASYM_CPUCAPACITY) && sd->child) in sd_init()
1658 sd->child->flags &= ~SD_PREFER_SIBLING; in sd_init()
1660 if (sd->flags & SD_SHARE_CPUCAPACITY) { in sd_init()
1661 sd->imbalance_pct = 110; in sd_init()
1663 } else if (sd->flags & SD_SHARE_LLC) { in sd_init()
1664 sd->imbalance_pct = 117; in sd_init()
1665 sd->cache_nice_tries = 1; in sd_init()
1668 } else if (sd->flags & SD_NUMA) { in sd_init()
1669 sd->cache_nice_tries = 2; in sd_init()
1671 sd->flags &= ~SD_PREFER_SIBLING; in sd_init()
1672 sd->flags |= SD_SERIALIZE; in sd_init()
1673 if (sched_domains_numa_distance[tl->numa_level] > node_reclaim_distance) { in sd_init()
1674 sd->flags &= ~(SD_BALANCE_EXEC | in sd_init()
1681 sd->cache_nice_tries = 1; in sd_init()
1688 if (sd->flags & SD_SHARE_LLC) { in sd_init()
1689 sd->shared = *per_cpu_ptr(sdd->sds, sd_id); in sd_init()
1690 atomic_inc(&sd->shared->ref); in sd_init()
1691 atomic_set(&sd->shared->nr_busy_cpus, sd_weight); in sd_init()
1694 sd->private = sdd; in sd_init()
1700 * Topology list, bottom-up.
1723 for (tl = sched_domain_topology; tl->mask; tl++)
1803 * topology lies in whether communication between not directly
1809 * - If the maximum distance between any nodes is 1 hop, the system
1811 * - If for two nodes A and B, located N > 1 hops away from each other,
1861 struct cpumask ***masks; in sched_init_numa() local
1864 * O(nr_nodes^2) de-duplicating selection sort -- in order to find the in sched_init_numa()
1865 * unique distances in the node_distance() table. in sched_init_numa()
1917 * in other functions. in sched_init_numa()
1923 masks = kzalloc(sizeof(void *) * nr_levels, GFP_KERNEL); in sched_init_numa()
1924 if (!masks) in sched_init_numa()
1932 masks[i] = kzalloc(nr_node_ids * sizeof(void *), GFP_KERNEL); in sched_init_numa()
1933 if (!masks[i]) in sched_init_numa()
1943 masks[i][j] = mask; in sched_init_numa()
1947 sched_numa_warn("Node-distance not symmetric"); in sched_init_numa()
1956 rcu_assign_pointer(sched_domains_numa_masks, masks); in sched_init_numa()
1998 WRITE_ONCE(sched_max_numa_distance, sched_domains_numa_distance[nr_levels - 1]); in sched_init_numa()
2007 struct cpumask ***masks; in sched_reset_numa() local
2015 masks = sched_domains_numa_masks; in sched_reset_numa()
2017 if (distances || masks) { in sched_reset_numa()
2022 for (i = 0; i < nr_levels && masks; i++) { in sched_reset_numa()
2023 if (!masks[i]) in sched_reset_numa()
2026 kfree(masks[i][j]); in sched_reset_numa()
2027 kfree(masks[i]); in sched_reset_numa()
2029 kfree(masks); in sched_reset_numa()
2067 /* Set ourselves in the remote node's masks */ in sched_domains_numa_masks_set()
2087 * sched_numa_find_closest() - given the NUMA topology, find the cpu
2097 struct cpumask ***masks; in sched_numa_find_closest() local
2100 masks = rcu_dereference(sched_domains_numa_masks); in sched_numa_find_closest()
2101 if (!masks) in sched_numa_find_closest()
2104 if (!masks[i][j]) in sched_numa_find_closest()
2106 cpu = cpumask_any_and(cpus, masks[i][j]); in sched_numa_find_closest()
2120 struct cpumask ***masks; member
2131 if (cpumask_weight_and(k->cpus, cur_hop[k->node]) <= k->cpu) in hop_cmp()
2134 if (b == k->masks) { in hop_cmp()
2135 k->w = 0; in hop_cmp()
2139 prev_hop = *((struct cpumask ***)b - 1); in hop_cmp()
2140 k->w = cpumask_weight_and(k->cpus, prev_hop[k->node]); in hop_cmp()
2141 if (k->w <= k->cpu) in hop_cmp()
2144 return -1; in hop_cmp()
2148 * sched_numa_find_nth_cpu() - given the NUMA topology, find the Nth closest CPU
2168 /* CPU-less node entries are uninitialized in sched_domains_numa_masks */ in sched_numa_find_nth_cpu()
2172 k.masks = rcu_dereference(sched_domains_numa_masks); in sched_numa_find_nth_cpu()
2173 if (!k.masks) in sched_numa_find_nth_cpu()
2176 hop_masks = bsearch(&k, k.masks, sched_domains_numa_levels, sizeof(k.masks[0]), hop_cmp); in sched_numa_find_nth_cpu()
2177 hop = hop_masks - k.masks; in sched_numa_find_nth_cpu()
2180 cpumask_nth_and_andnot(cpu - k.w, cpus, k.masks[hop][node], k.masks[hop-1][node]) : in sched_numa_find_nth_cpu()
2181 cpumask_nth_and(cpu, cpus, k.masks[0][node]); in sched_numa_find_nth_cpu()
2189 * sched_numa_hop_mask() - Get the cpumask of CPUs at most @hops hops away from
2198 * read-side section, copy it if required beyond that.
2200 * Note that not all hops are equal in distance; see sched_init_numa() for how
2201 * distances and masks are handled.
2203 * during the lifetime of the system (offline nodes are taken out of the masks).
2207 struct cpumask ***masks; in sched_numa_hop_mask() local
2210 return ERR_PTR(-EINVAL); in sched_numa_hop_mask()
2212 masks = rcu_dereference(sched_domains_numa_masks); in sched_numa_hop_mask()
2213 if (!masks) in sched_numa_hop_mask()
2214 return ERR_PTR(-EBUSY); in sched_numa_hop_mask()
2216 return masks[hops][node]; in sched_numa_hop_mask()
2228 struct sd_data *sdd = &tl->data; in __sdt_alloc()
2230 sdd->sd = alloc_percpu(struct sched_domain *); in __sdt_alloc()
2231 if (!sdd->sd) in __sdt_alloc()
2232 return -ENOMEM; in __sdt_alloc()
2234 sdd->sds = alloc_percpu(struct sched_domain_shared *); in __sdt_alloc()
2235 if (!sdd->sds) in __sdt_alloc()
2236 return -ENOMEM; in __sdt_alloc()
2238 sdd->sg = alloc_percpu(struct sched_group *); in __sdt_alloc()
2239 if (!sdd->sg) in __sdt_alloc()
2240 return -ENOMEM; in __sdt_alloc()
2242 sdd->sgc = alloc_percpu(struct sched_group_capacity *); in __sdt_alloc()
2243 if (!sdd->sgc) in __sdt_alloc()
2244 return -ENOMEM; in __sdt_alloc()
2255 return -ENOMEM; in __sdt_alloc()
2257 *per_cpu_ptr(sdd->sd, j) = sd; in __sdt_alloc()
2262 return -ENOMEM; in __sdt_alloc()
2264 *per_cpu_ptr(sdd->sds, j) = sds; in __sdt_alloc()
2269 return -ENOMEM; in __sdt_alloc()
2271 sg->next = sg; in __sdt_alloc()
2273 *per_cpu_ptr(sdd->sg, j) = sg; in __sdt_alloc()
2278 return -ENOMEM; in __sdt_alloc()
2281 sgc->id = j; in __sdt_alloc()
2284 *per_cpu_ptr(sdd->sgc, j) = sgc; in __sdt_alloc()
2297 struct sd_data *sdd = &tl->data; in __sdt_free()
2302 if (sdd->sd) { in __sdt_free()
2303 sd = *per_cpu_ptr(sdd->sd, j); in __sdt_free()
2304 if (sd && (sd->flags & SD_OVERLAP)) in __sdt_free()
2305 free_sched_groups(sd->groups, 0); in __sdt_free()
2306 kfree(*per_cpu_ptr(sdd->sd, j)); in __sdt_free()
2309 if (sdd->sds) in __sdt_free()
2310 kfree(*per_cpu_ptr(sdd->sds, j)); in __sdt_free()
2311 if (sdd->sg) in __sdt_free()
2312 kfree(*per_cpu_ptr(sdd->sg, j)); in __sdt_free()
2313 if (sdd->sgc) in __sdt_free()
2314 kfree(*per_cpu_ptr(sdd->sgc, j)); in __sdt_free()
2316 free_percpu(sdd->sd); in __sdt_free()
2317 sdd->sd = NULL; in __sdt_free()
2318 free_percpu(sdd->sds); in __sdt_free()
2319 sdd->sds = NULL; in __sdt_free()
2320 free_percpu(sdd->sg); in __sdt_free()
2321 sdd->sg = NULL; in __sdt_free()
2322 free_percpu(sdd->sgc); in __sdt_free()
2323 sdd->sgc = NULL; in __sdt_free()
2334 sd->level = child->level + 1; in build_sched_domain()
2335 sched_domain_level_max = max(sched_domain_level_max, sd->level); in build_sched_domain()
2336 child->parent = sd; in build_sched_domain()
2343 child->name, sd->name); in build_sched_domain()
2358 * Ensure topology masks are sane, i.e. there are no conflicts (overlaps) for
2359 * any two given CPUs at this (non-NUMA) topology level.
2367 if (tl->flags & SDTL_OVERLAP) in topology_span_sane()
2371 * Non-NUMA levels cannot partially overlap - they must be either in topology_span_sane()
2373 * breaking the sched_group lists - i.e. a later get_group() pass in topology_span_sane()
2378 * We should 'and' all those masks with 'cpu_map' to exactly in topology_span_sane()
2383 if (!cpumask_equal(tl->mask(cpu), tl->mask(i)) && in topology_span_sane()
2384 cpumask_intersects(tl->mask(cpu), tl->mask(i))) in topology_span_sane()
2402 int i, ret = -ENOMEM; in build_sched_domains()
2425 has_asym |= sd->flags & SD_ASYM_CPUCAPACITY; in build_sched_domains()
2429 if (tl->flags & SDTL_OVERLAP) in build_sched_domains()
2430 sd->flags |= SD_OVERLAP; in build_sched_domains()
2438 for (sd = *per_cpu_ptr(d.sd, i); sd; sd = sd->parent) { in build_sched_domains()
2439 sd->span_weight = cpumask_weight(sched_domain_span(sd)); in build_sched_domains()
2440 if (sd->flags & SD_OVERLAP) { in build_sched_domains()
2458 for (sd = *per_cpu_ptr(d.sd, i); sd; sd = sd->parent) { in build_sched_domains()
2459 struct sched_domain *child = sd->child; in build_sched_domains()
2461 if (!(sd->flags & SD_SHARE_LLC) && child && in build_sched_domains()
2462 (child->flags & SD_SHARE_LLC)) { in build_sched_domains()
2469 * arbitrary cutoff based two factors -- SMT and in build_sched_domains()
2470 * memory channels. For SMT-2, the intent is to in build_sched_domains()
2472 * SMT-4 or SMT-8 *may* benefit from a different in build_sched_domains()
2486 nr_llcs = sd->span_weight / child->span_weight; in build_sched_domains()
2488 imb = sd->span_weight >> 3; in build_sched_domains()
2492 sd->imb_numa_nr = imb; in build_sched_domains()
2495 top_p = sd->parent; in build_sched_domains()
2496 while (top_p && !(top_p->flags & SD_NUMA)) { in build_sched_domains()
2497 top_p = top_p->parent; in build_sched_domains()
2499 imb_span = top_p ? top_p->span_weight : sd->span_weight; in build_sched_domains()
2501 int factor = max(1U, (sd->span_weight / imb_span)); in build_sched_domains()
2503 sd->imb_numa_nr = imb * factor; in build_sched_domains()
2509 for (i = nr_cpumask_bits-1; i >= 0; i--) { in build_sched_domains()
2513 for (sd = *per_cpu_ptr(d.sd, i); sd; sd = sd->parent) { in build_sched_domains()
2551 /* Number of sched domains in 'doms_cur': */
2554 /* Attributes of custom domains in 'doms_cur' */
2601 * CPUs, but could be used to exclude other special cases in the future.
2624 * Detach sched domains from a group of CPUs specified in cpu_map
2663 * cpumasks in the array doms_new[] of cpumasks. This compares
2668 * The masks don't intersect (don't overlap.) We should setup one
2669 * sched domain for each mask. CPUs not in any of the cpumasks will
2670 * not be load balanced. If the same cpumask appears both in the
2671 * current 'doms_cur' domains and in the new 'doms_new', we can leave
2674 * The passed in 'doms_new' should be allocated using
2677 * alloc call, then it can pass in doms_new == NULL && ndoms_new == 1,
2724 * its dl_bw->total_bw needs to be cleared. It in partition_sched_domains_locked()
2725 * will be recomputed in function in partition_sched_domains_locked()
2728 rd = cpu_rq(cpumask_any(doms_cur[i]))->rd; in partition_sched_domains_locked()
2733 /* No match - a current sched domain not in new doms_new[] */ in partition_sched_domains_locked()
2754 /* No match - add a new doms_new */ in partition_sched_domains_locked()
2765 cpu_rq(cpumask_first(doms_cur[j]))->rd->pd) { in partition_sched_domains_locked()
2770 /* No match - add perf domains for a new rd */ in partition_sched_domains_locked()