1 /*
2  *    Copyright IBM Corp. 2007,2011
3  *    Author(s): Heiko Carstens <heiko.carstens@de.ibm.com>
4  */
5 
6 #define KMSG_COMPONENT "cpu"
7 #define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
8 
9 #include <linux/workqueue.h>
10 #include <linux/bootmem.h>
11 #include <linux/cpuset.h>
12 #include <linux/device.h>
13 #include <linux/kernel.h>
14 #include <linux/sched.h>
15 #include <linux/init.h>
16 #include <linux/delay.h>
17 #include <linux/cpu.h>
18 #include <linux/smp.h>
19 #include <linux/mm.h>
20 
21 #define PTF_HORIZONTAL	(0UL)
22 #define PTF_VERTICAL	(1UL)
23 #define PTF_CHECK	(2UL)
24 
25 struct mask_info {
26 	struct mask_info *next;
27 	unsigned char id;
28 	cpumask_t mask;
29 };
30 
31 static int topology_enabled = 1;
32 static void topology_work_fn(struct work_struct *work);
33 static struct sysinfo_15_1_x *tl_info;
34 static void set_topology_timer(void);
35 static DECLARE_WORK(topology_work, topology_work_fn);
36 /* topology_lock protects the core linked list */
37 static DEFINE_SPINLOCK(topology_lock);
38 
39 static struct mask_info core_info;
40 cpumask_t cpu_core_map[NR_CPUS];
41 unsigned char cpu_core_id[NR_CPUS];
42 
43 static struct mask_info book_info;
44 cpumask_t cpu_book_map[NR_CPUS];
45 unsigned char cpu_book_id[NR_CPUS];
46 
47 /* smp_cpu_state_mutex must be held when accessing this array */
48 int cpu_polarization[NR_CPUS];
49 
cpu_group_map(struct mask_info * info,unsigned int cpu)50 static cpumask_t cpu_group_map(struct mask_info *info, unsigned int cpu)
51 {
52 	cpumask_t mask;
53 
54 	cpumask_clear(&mask);
55 	if (!topology_enabled || !MACHINE_HAS_TOPOLOGY) {
56 		cpumask_copy(&mask, cpumask_of(cpu));
57 		return mask;
58 	}
59 	while (info) {
60 		if (cpumask_test_cpu(cpu, &info->mask)) {
61 			mask = info->mask;
62 			break;
63 		}
64 		info = info->next;
65 	}
66 	if (cpumask_empty(&mask))
67 		cpumask_copy(&mask, cpumask_of(cpu));
68 	return mask;
69 }
70 
add_cpus_to_mask(struct topology_cpu * tl_cpu,struct mask_info * book,struct mask_info * core,int one_core_per_cpu)71 static struct mask_info *add_cpus_to_mask(struct topology_cpu *tl_cpu,
72 					  struct mask_info *book,
73 					  struct mask_info *core,
74 					  int one_core_per_cpu)
75 {
76 	unsigned int cpu;
77 
78 	for (cpu = find_first_bit(&tl_cpu->mask[0], TOPOLOGY_CPU_BITS);
79 	     cpu < TOPOLOGY_CPU_BITS;
80 	     cpu = find_next_bit(&tl_cpu->mask[0], TOPOLOGY_CPU_BITS, cpu + 1))
81 	{
82 		unsigned int rcpu;
83 		int lcpu;
84 
85 		rcpu = TOPOLOGY_CPU_BITS - 1 - cpu + tl_cpu->origin;
86 		lcpu = smp_find_processor_id(rcpu);
87 		if (lcpu >= 0) {
88 			cpumask_set_cpu(lcpu, &book->mask);
89 			cpu_book_id[lcpu] = book->id;
90 			cpumask_set_cpu(lcpu, &core->mask);
91 			if (one_core_per_cpu) {
92 				cpu_core_id[lcpu] = rcpu;
93 				core = core->next;
94 			} else {
95 				cpu_core_id[lcpu] = core->id;
96 			}
97 			cpu_set_polarization(lcpu, tl_cpu->pp);
98 		}
99 	}
100 	return core;
101 }
102 
clear_masks(void)103 static void clear_masks(void)
104 {
105 	struct mask_info *info;
106 
107 	info = &core_info;
108 	while (info) {
109 		cpumask_clear(&info->mask);
110 		info = info->next;
111 	}
112 	info = &book_info;
113 	while (info) {
114 		cpumask_clear(&info->mask);
115 		info = info->next;
116 	}
117 }
118 
next_tle(union topology_entry * tle)119 static union topology_entry *next_tle(union topology_entry *tle)
120 {
121 	if (!tle->nl)
122 		return (union topology_entry *)((struct topology_cpu *)tle + 1);
123 	return (union topology_entry *)((struct topology_container *)tle + 1);
124 }
125 
__tl_to_cores_generic(struct sysinfo_15_1_x * info)126 static void __tl_to_cores_generic(struct sysinfo_15_1_x *info)
127 {
128 	struct mask_info *core = &core_info;
129 	struct mask_info *book = &book_info;
130 	union topology_entry *tle, *end;
131 
132 	tle = info->tle;
133 	end = (union topology_entry *)((unsigned long)info + info->length);
134 	while (tle < end) {
135 		switch (tle->nl) {
136 		case 2:
137 			book = book->next;
138 			book->id = tle->container.id;
139 			break;
140 		case 1:
141 			core = core->next;
142 			core->id = tle->container.id;
143 			break;
144 		case 0:
145 			add_cpus_to_mask(&tle->cpu, book, core, 0);
146 			break;
147 		default:
148 			clear_masks();
149 			return;
150 		}
151 		tle = next_tle(tle);
152 	}
153 }
154 
__tl_to_cores_z10(struct sysinfo_15_1_x * info)155 static void __tl_to_cores_z10(struct sysinfo_15_1_x *info)
156 {
157 	struct mask_info *core = &core_info;
158 	struct mask_info *book = &book_info;
159 	union topology_entry *tle, *end;
160 
161 	tle = info->tle;
162 	end = (union topology_entry *)((unsigned long)info + info->length);
163 	while (tle < end) {
164 		switch (tle->nl) {
165 		case 1:
166 			book = book->next;
167 			book->id = tle->container.id;
168 			break;
169 		case 0:
170 			core = add_cpus_to_mask(&tle->cpu, book, core, 1);
171 			break;
172 		default:
173 			clear_masks();
174 			return;
175 		}
176 		tle = next_tle(tle);
177 	}
178 }
179 
tl_to_cores(struct sysinfo_15_1_x * info)180 static void tl_to_cores(struct sysinfo_15_1_x *info)
181 {
182 	struct cpuid cpu_id;
183 
184 	get_cpu_id(&cpu_id);
185 	spin_lock_irq(&topology_lock);
186 	clear_masks();
187 	switch (cpu_id.machine) {
188 	case 0x2097:
189 	case 0x2098:
190 		__tl_to_cores_z10(info);
191 		break;
192 	default:
193 		__tl_to_cores_generic(info);
194 	}
195 	spin_unlock_irq(&topology_lock);
196 }
197 
topology_update_polarization_simple(void)198 static void topology_update_polarization_simple(void)
199 {
200 	int cpu;
201 
202 	mutex_lock(&smp_cpu_state_mutex);
203 	for_each_possible_cpu(cpu)
204 		cpu_set_polarization(cpu, POLARIZATION_HRZ);
205 	mutex_unlock(&smp_cpu_state_mutex);
206 }
207 
ptf(unsigned long fc)208 static int ptf(unsigned long fc)
209 {
210 	int rc;
211 
212 	asm volatile(
213 		"	.insn	rre,0xb9a20000,%1,%1\n"
214 		"	ipm	%0\n"
215 		"	srl	%0,28\n"
216 		: "=d" (rc)
217 		: "d" (fc)  : "cc");
218 	return rc;
219 }
220 
topology_set_cpu_management(int fc)221 int topology_set_cpu_management(int fc)
222 {
223 	int cpu, rc;
224 
225 	if (!MACHINE_HAS_TOPOLOGY)
226 		return -EOPNOTSUPP;
227 	if (fc)
228 		rc = ptf(PTF_VERTICAL);
229 	else
230 		rc = ptf(PTF_HORIZONTAL);
231 	if (rc)
232 		return -EBUSY;
233 	for_each_possible_cpu(cpu)
234 		cpu_set_polarization(cpu, POLARIZATION_UNKNOWN);
235 	return rc;
236 }
237 
update_cpu_core_map(void)238 static void update_cpu_core_map(void)
239 {
240 	unsigned long flags;
241 	int cpu;
242 
243 	spin_lock_irqsave(&topology_lock, flags);
244 	for_each_possible_cpu(cpu) {
245 		cpu_core_map[cpu] = cpu_group_map(&core_info, cpu);
246 		cpu_book_map[cpu] = cpu_group_map(&book_info, cpu);
247 	}
248 	spin_unlock_irqrestore(&topology_lock, flags);
249 }
250 
store_topology(struct sysinfo_15_1_x * info)251 void store_topology(struct sysinfo_15_1_x *info)
252 {
253 	int rc;
254 
255 	rc = stsi(info, 15, 1, 3);
256 	if (rc != -ENOSYS)
257 		return;
258 	stsi(info, 15, 1, 2);
259 }
260 
arch_update_cpu_topology(void)261 int arch_update_cpu_topology(void)
262 {
263 	struct sysinfo_15_1_x *info = tl_info;
264 	struct device *dev;
265 	int cpu;
266 
267 	if (!MACHINE_HAS_TOPOLOGY) {
268 		update_cpu_core_map();
269 		topology_update_polarization_simple();
270 		return 0;
271 	}
272 	store_topology(info);
273 	tl_to_cores(info);
274 	update_cpu_core_map();
275 	for_each_online_cpu(cpu) {
276 		dev = get_cpu_device(cpu);
277 		kobject_uevent(&dev->kobj, KOBJ_CHANGE);
278 	}
279 	return 1;
280 }
281 
topology_work_fn(struct work_struct * work)282 static void topology_work_fn(struct work_struct *work)
283 {
284 	rebuild_sched_domains();
285 }
286 
topology_schedule_update(void)287 void topology_schedule_update(void)
288 {
289 	schedule_work(&topology_work);
290 }
291 
topology_timer_fn(unsigned long ignored)292 static void topology_timer_fn(unsigned long ignored)
293 {
294 	if (ptf(PTF_CHECK))
295 		topology_schedule_update();
296 	set_topology_timer();
297 }
298 
299 static struct timer_list topology_timer =
300 	TIMER_DEFERRED_INITIALIZER(topology_timer_fn, 0, 0);
301 
302 static atomic_t topology_poll = ATOMIC_INIT(0);
303 
set_topology_timer(void)304 static void set_topology_timer(void)
305 {
306 	if (atomic_add_unless(&topology_poll, -1, 0))
307 		mod_timer(&topology_timer, jiffies + HZ / 10);
308 	else
309 		mod_timer(&topology_timer, jiffies + HZ * 60);
310 }
311 
topology_expect_change(void)312 void topology_expect_change(void)
313 {
314 	if (!MACHINE_HAS_TOPOLOGY)
315 		return;
316 	/* This is racy, but it doesn't matter since it is just a heuristic.
317 	 * Worst case is that we poll in a higher frequency for a bit longer.
318 	 */
319 	if (atomic_read(&topology_poll) > 60)
320 		return;
321 	atomic_add(60, &topology_poll);
322 	set_topology_timer();
323 }
324 
early_parse_topology(char * p)325 static int __init early_parse_topology(char *p)
326 {
327 	if (strncmp(p, "off", 3))
328 		return 0;
329 	topology_enabled = 0;
330 	return 0;
331 }
332 early_param("topology", early_parse_topology);
333 
alloc_masks(struct sysinfo_15_1_x * info,struct mask_info * mask,int offset)334 static void __init alloc_masks(struct sysinfo_15_1_x *info,
335 			       struct mask_info *mask, int offset)
336 {
337 	int i, nr_masks;
338 
339 	nr_masks = info->mag[TOPOLOGY_NR_MAG - offset];
340 	for (i = 0; i < info->mnest - offset; i++)
341 		nr_masks *= info->mag[TOPOLOGY_NR_MAG - offset - 1 - i];
342 	nr_masks = max(nr_masks, 1);
343 	for (i = 0; i < nr_masks; i++) {
344 		mask->next = alloc_bootmem(sizeof(struct mask_info));
345 		mask = mask->next;
346 	}
347 }
348 
s390_init_cpu_topology(void)349 void __init s390_init_cpu_topology(void)
350 {
351 	struct sysinfo_15_1_x *info;
352 	int i;
353 
354 	if (!MACHINE_HAS_TOPOLOGY)
355 		return;
356 	tl_info = alloc_bootmem_pages(PAGE_SIZE);
357 	info = tl_info;
358 	store_topology(info);
359 	pr_info("The CPU configuration topology of the machine is:");
360 	for (i = 0; i < TOPOLOGY_NR_MAG; i++)
361 		printk(KERN_CONT " %d", info->mag[i]);
362 	printk(KERN_CONT " / %d\n", info->mnest);
363 	alloc_masks(info, &core_info, 1);
364 	alloc_masks(info, &book_info, 2);
365 }
366 
367 static int cpu_management;
368 
dispatching_show(struct device * dev,struct device_attribute * attr,char * buf)369 static ssize_t dispatching_show(struct device *dev,
370 				struct device_attribute *attr,
371 				char *buf)
372 {
373 	ssize_t count;
374 
375 	mutex_lock(&smp_cpu_state_mutex);
376 	count = sprintf(buf, "%d\n", cpu_management);
377 	mutex_unlock(&smp_cpu_state_mutex);
378 	return count;
379 }
380 
dispatching_store(struct device * dev,struct device_attribute * attr,const char * buf,size_t count)381 static ssize_t dispatching_store(struct device *dev,
382 				 struct device_attribute *attr,
383 				 const char *buf,
384 				 size_t count)
385 {
386 	int val, rc;
387 	char delim;
388 
389 	if (sscanf(buf, "%d %c", &val, &delim) != 1)
390 		return -EINVAL;
391 	if (val != 0 && val != 1)
392 		return -EINVAL;
393 	rc = 0;
394 	get_online_cpus();
395 	mutex_lock(&smp_cpu_state_mutex);
396 	if (cpu_management == val)
397 		goto out;
398 	rc = topology_set_cpu_management(val);
399 	if (rc)
400 		goto out;
401 	cpu_management = val;
402 	topology_expect_change();
403 out:
404 	mutex_unlock(&smp_cpu_state_mutex);
405 	put_online_cpus();
406 	return rc ? rc : count;
407 }
408 static DEVICE_ATTR(dispatching, 0644, dispatching_show,
409 			 dispatching_store);
410 
cpu_polarization_show(struct device * dev,struct device_attribute * attr,char * buf)411 static ssize_t cpu_polarization_show(struct device *dev,
412 				     struct device_attribute *attr, char *buf)
413 {
414 	int cpu = dev->id;
415 	ssize_t count;
416 
417 	mutex_lock(&smp_cpu_state_mutex);
418 	switch (cpu_read_polarization(cpu)) {
419 	case POLARIZATION_HRZ:
420 		count = sprintf(buf, "horizontal\n");
421 		break;
422 	case POLARIZATION_VL:
423 		count = sprintf(buf, "vertical:low\n");
424 		break;
425 	case POLARIZATION_VM:
426 		count = sprintf(buf, "vertical:medium\n");
427 		break;
428 	case POLARIZATION_VH:
429 		count = sprintf(buf, "vertical:high\n");
430 		break;
431 	default:
432 		count = sprintf(buf, "unknown\n");
433 		break;
434 	}
435 	mutex_unlock(&smp_cpu_state_mutex);
436 	return count;
437 }
438 static DEVICE_ATTR(polarization, 0444, cpu_polarization_show, NULL);
439 
440 static struct attribute *topology_cpu_attrs[] = {
441 	&dev_attr_polarization.attr,
442 	NULL,
443 };
444 
445 static struct attribute_group topology_cpu_attr_group = {
446 	.attrs = topology_cpu_attrs,
447 };
448 
topology_cpu_init(struct cpu * cpu)449 int topology_cpu_init(struct cpu *cpu)
450 {
451 	return sysfs_create_group(&cpu->dev.kobj, &topology_cpu_attr_group);
452 }
453 
topology_init(void)454 static int __init topology_init(void)
455 {
456 	if (!MACHINE_HAS_TOPOLOGY) {
457 		topology_update_polarization_simple();
458 		goto out;
459 	}
460 	set_topology_timer();
461 out:
462 	update_cpu_core_map();
463 	return device_create_file(cpu_subsys.dev_root, &dev_attr_dispatching);
464 }
465 device_initcall(topology_init);
466