Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/dtor/input
[linux-2.6] / arch / i386 / kernel / cpu / cpufreq / speedstep-centrino.c
1 /*
2  * cpufreq driver for Enhanced SpeedStep, as found in Intel's Pentium
3  * M (part of the Centrino chipset).
4  *
5  * Since the original Pentium M, most new Intel CPUs support Enhanced
6  * SpeedStep.
7  *
8  * Despite the "SpeedStep" in the name, this is almost entirely unlike
9  * traditional SpeedStep.
10  *
11  * Modelled on speedstep.c
12  *
13  * Copyright (C) 2003 Jeremy Fitzhardinge <jeremy@goop.org>
14  */
15
16 #include <linux/kernel.h>
17 #include <linux/module.h>
18 #include <linux/init.h>
19 #include <linux/cpufreq.h>
20 #include <linux/sched.h>        /* current */
21 #include <linux/delay.h>
22 #include <linux/compiler.h>
23
24 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
25 #include <linux/acpi.h>
26 #include <linux/dmi.h>
27 #include <acpi/processor.h>
28 #endif
29
30 #include <asm/msr.h>
31 #include <asm/processor.h>
32 #include <asm/cpufeature.h>
33
34 #define PFX             "speedstep-centrino: "
35 #define MAINTAINER      "cpufreq@lists.linux.org.uk"
36
37 #define dprintk(msg...) cpufreq_debug_printk(CPUFREQ_DEBUG_DRIVER, "speedstep-centrino", msg)
38
39
40 struct cpu_id
41 {
42         __u8    x86;            /* CPU family */
43         __u8    x86_model;      /* model */
44         __u8    x86_mask;       /* stepping */
45 };
46
47 enum {
48         CPU_BANIAS,
49         CPU_DOTHAN_A1,
50         CPU_DOTHAN_A2,
51         CPU_DOTHAN_B0,
52         CPU_MP4HT_D0,
53         CPU_MP4HT_E0,
54 };
55
56 static const struct cpu_id cpu_ids[] = {
57         [CPU_BANIAS]    = { 6,  9, 5 },
58         [CPU_DOTHAN_A1] = { 6, 13, 1 },
59         [CPU_DOTHAN_A2] = { 6, 13, 2 },
60         [CPU_DOTHAN_B0] = { 6, 13, 6 },
61         [CPU_MP4HT_D0]  = {15,  3, 4 },
62         [CPU_MP4HT_E0]  = {15,  4, 1 },
63 };
64 #define N_IDS   ARRAY_SIZE(cpu_ids)
65
66 struct cpu_model
67 {
68         const struct cpu_id *cpu_id;
69         const char      *model_name;
70         unsigned        max_freq; /* max clock in kHz */
71
72         struct cpufreq_frequency_table *op_points; /* clock/voltage pairs */
73 };
74 static int centrino_verify_cpu_id(const struct cpuinfo_x86 *c, const struct cpu_id *x);
75
76 /* Operating points for current CPU */
77 static struct cpu_model *centrino_model[NR_CPUS];
78 static const struct cpu_id *centrino_cpu[NR_CPUS];
79
80 static struct cpufreq_driver centrino_driver;
81
82 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_TABLE
83
84 /* Computes the correct form for IA32_PERF_CTL MSR for a particular
85    frequency/voltage operating point; frequency in MHz, volts in mV.
86    This is stored as "index" in the structure. */
87 #define OP(mhz, mv)                                                     \
88         {                                                               \
89                 .frequency = (mhz) * 1000,                              \
90                 .index = (((mhz)/100) << 8) | ((mv - 700) / 16)         \
91         }
92
93 /*
94  * These voltage tables were derived from the Intel Pentium M
95  * datasheet, document 25261202.pdf, Table 5.  I have verified they
96  * are consistent with my IBM ThinkPad X31, which has a 1.3GHz Pentium
97  * M.
98  */
99
100 /* Ultra Low Voltage Intel Pentium M processor 900MHz (Banias) */
101 static struct cpufreq_frequency_table banias_900[] =
102 {
103         OP(600,  844),
104         OP(800,  988),
105         OP(900, 1004),
106         { .frequency = CPUFREQ_TABLE_END }
107 };
108
109 /* Ultra Low Voltage Intel Pentium M processor 1000MHz (Banias) */
110 static struct cpufreq_frequency_table banias_1000[] =
111 {
112         OP(600,   844),
113         OP(800,   972),
114         OP(900,   988),
115         OP(1000, 1004),
116         { .frequency = CPUFREQ_TABLE_END }
117 };
118
119 /* Low Voltage Intel Pentium M processor 1.10GHz (Banias) */
120 static struct cpufreq_frequency_table banias_1100[] =
121 {
122         OP( 600,  956),
123         OP( 800, 1020),
124         OP( 900, 1100),
125         OP(1000, 1164),
126         OP(1100, 1180),
127         { .frequency = CPUFREQ_TABLE_END }
128 };
129
130
131 /* Low Voltage Intel Pentium M processor 1.20GHz (Banias) */
132 static struct cpufreq_frequency_table banias_1200[] =
133 {
134         OP( 600,  956),
135         OP( 800, 1004),
136         OP( 900, 1020),
137         OP(1000, 1100),
138         OP(1100, 1164),
139         OP(1200, 1180),
140         { .frequency = CPUFREQ_TABLE_END }
141 };
142
143 /* Intel Pentium M processor 1.30GHz (Banias) */
144 static struct cpufreq_frequency_table banias_1300[] =
145 {
146         OP( 600,  956),
147         OP( 800, 1260),
148         OP(1000, 1292),
149         OP(1200, 1356),
150         OP(1300, 1388),
151         { .frequency = CPUFREQ_TABLE_END }
152 };
153
154 /* Intel Pentium M processor 1.40GHz (Banias) */
155 static struct cpufreq_frequency_table banias_1400[] =
156 {
157         OP( 600,  956),
158         OP( 800, 1180),
159         OP(1000, 1308),
160         OP(1200, 1436),
161         OP(1400, 1484),
162         { .frequency = CPUFREQ_TABLE_END }
163 };
164
165 /* Intel Pentium M processor 1.50GHz (Banias) */
166 static struct cpufreq_frequency_table banias_1500[] =
167 {
168         OP( 600,  956),
169         OP( 800, 1116),
170         OP(1000, 1228),
171         OP(1200, 1356),
172         OP(1400, 1452),
173         OP(1500, 1484),
174         { .frequency = CPUFREQ_TABLE_END }
175 };
176
177 /* Intel Pentium M processor 1.60GHz (Banias) */
178 static struct cpufreq_frequency_table banias_1600[] =
179 {
180         OP( 600,  956),
181         OP( 800, 1036),
182         OP(1000, 1164),
183         OP(1200, 1276),
184         OP(1400, 1420),
185         OP(1600, 1484),
186         { .frequency = CPUFREQ_TABLE_END }
187 };
188
189 /* Intel Pentium M processor 1.70GHz (Banias) */
190 static struct cpufreq_frequency_table banias_1700[] =
191 {
192         OP( 600,  956),
193         OP( 800, 1004),
194         OP(1000, 1116),
195         OP(1200, 1228),
196         OP(1400, 1308),
197         OP(1700, 1484),
198         { .frequency = CPUFREQ_TABLE_END }
199 };
200 #undef OP
201
202 #define _BANIAS(cpuid, max, name)       \
203 {       .cpu_id         = cpuid,        \
204         .model_name     = "Intel(R) Pentium(R) M processor " name "MHz", \
205         .max_freq       = (max)*1000,   \
206         .op_points      = banias_##max, \
207 }
208 #define BANIAS(max)     _BANIAS(&cpu_ids[CPU_BANIAS], max, #max)
209
210 /* CPU models, their operating frequency range, and freq/voltage
211    operating points */
212 static struct cpu_model models[] =
213 {
214         _BANIAS(&cpu_ids[CPU_BANIAS], 900, " 900"),
215         BANIAS(1000),
216         BANIAS(1100),
217         BANIAS(1200),
218         BANIAS(1300),
219         BANIAS(1400),
220         BANIAS(1500),
221         BANIAS(1600),
222         BANIAS(1700),
223
224         /* NULL model_name is a wildcard */
225         { &cpu_ids[CPU_DOTHAN_A1], NULL, 0, NULL },
226         { &cpu_ids[CPU_DOTHAN_A2], NULL, 0, NULL },
227         { &cpu_ids[CPU_DOTHAN_B0], NULL, 0, NULL },
228         { &cpu_ids[CPU_MP4HT_D0], NULL, 0, NULL },
229         { &cpu_ids[CPU_MP4HT_E0], NULL, 0, NULL },
230
231         { NULL, }
232 };
233 #undef _BANIAS
234 #undef BANIAS
235
236 static int centrino_cpu_init_table(struct cpufreq_policy *policy)
237 {
238         struct cpuinfo_x86 *cpu = &cpu_data[policy->cpu];
239         struct cpu_model *model;
240
241         for(model = models; model->cpu_id != NULL; model++)
242                 if (centrino_verify_cpu_id(cpu, model->cpu_id) &&
243                     (model->model_name == NULL ||
244                      strcmp(cpu->x86_model_id, model->model_name) == 0))
245                         break;
246
247         if (model->cpu_id == NULL) {
248                 /* No match at all */
249                 dprintk("no support for CPU model \"%s\": "
250                        "send /proc/cpuinfo to " MAINTAINER "\n",
251                        cpu->x86_model_id);
252                 return -ENOENT;
253         }
254
255         if (model->op_points == NULL) {
256                 /* Matched a non-match */
257                 dprintk("no table support for CPU model \"%s\"\n",
258                        cpu->x86_model_id);
259 #ifndef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
260                 dprintk("try compiling with CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI enabled\n");
261 #endif
262                 return -ENOENT;
263         }
264
265         centrino_model[policy->cpu] = model;
266
267         dprintk("found \"%s\": max frequency: %dkHz\n",
268                model->model_name, model->max_freq);
269
270         return 0;
271 }
272
273 #else
274 static inline int centrino_cpu_init_table(struct cpufreq_policy *policy) { return -ENODEV; }
275 #endif /* CONFIG_X86_SPEEDSTEP_CENTRINO_TABLE */
276
277 static int centrino_verify_cpu_id(const struct cpuinfo_x86 *c, const struct cpu_id *x)
278 {
279         if ((c->x86 == x->x86) &&
280             (c->x86_model == x->x86_model) &&
281             (c->x86_mask == x->x86_mask))
282                 return 1;
283         return 0;
284 }
285
286 /* To be called only after centrino_model is initialized */
287 static unsigned extract_clock(unsigned msr, unsigned int cpu, int failsafe)
288 {
289         int i;
290
291         /*
292          * Extract clock in kHz from PERF_CTL value
293          * for centrino, as some DSDTs are buggy.
294          * Ideally, this can be done using the acpi_data structure.
295          */
296         if ((centrino_cpu[cpu] == &cpu_ids[CPU_BANIAS]) ||
297             (centrino_cpu[cpu] == &cpu_ids[CPU_DOTHAN_A1]) ||
298             (centrino_cpu[cpu] == &cpu_ids[CPU_DOTHAN_B0])) {
299                 msr = (msr >> 8) & 0xff;
300                 return msr * 100000;
301         }
302
303         if ((!centrino_model[cpu]) || (!centrino_model[cpu]->op_points))
304                 return 0;
305
306         msr &= 0xffff;
307         for (i=0;centrino_model[cpu]->op_points[i].frequency != CPUFREQ_TABLE_END; i++) {
308                 if (msr == centrino_model[cpu]->op_points[i].index)
309                         return centrino_model[cpu]->op_points[i].frequency;
310         }
311         if (failsafe)
312                 return centrino_model[cpu]->op_points[i-1].frequency;
313         else
314                 return 0;
315 }
316
317 /* Return the current CPU frequency in kHz */
318 static unsigned int get_cur_freq(unsigned int cpu)
319 {
320         unsigned l, h;
321         unsigned clock_freq;
322         cpumask_t saved_mask;
323
324         saved_mask = current->cpus_allowed;
325         set_cpus_allowed(current, cpumask_of_cpu(cpu));
326         if (smp_processor_id() != cpu)
327                 return 0;
328
329         rdmsr(MSR_IA32_PERF_STATUS, l, h);
330         clock_freq = extract_clock(l, cpu, 0);
331
332         if (unlikely(clock_freq == 0)) {
333                 /*
334                  * On some CPUs, we can see transient MSR values (which are
335                  * not present in _PSS), while CPU is doing some automatic
336                  * P-state transition (like TM2). Get the last freq set 
337                  * in PERF_CTL.
338                  */
339                 rdmsr(MSR_IA32_PERF_CTL, l, h);
340                 clock_freq = extract_clock(l, cpu, 1);
341         }
342
343         set_cpus_allowed(current, saved_mask);
344         return clock_freq;
345 }
346
347
348 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
349
350 static struct acpi_processor_performance *acpi_perf_data[NR_CPUS];
351
352 /*
353  * centrino_cpu_early_init_acpi - Do the preregistering with ACPI P-States
354  * library
355  *
356  * Before doing the actual init, we need to do _PSD related setup whenever
357  * supported by the BIOS. These are handled by this early_init routine.
358  */
359 static int centrino_cpu_early_init_acpi(void)
360 {
361         unsigned int    i, j;
362         struct acpi_processor_performance       *data;
363
364         for_each_possible_cpu(i) {
365                 data = kzalloc(sizeof(struct acpi_processor_performance), 
366                                 GFP_KERNEL);
367                 if (!data) {
368                         for_each_possible_cpu(j) {
369                                 kfree(acpi_perf_data[j]);
370                                 acpi_perf_data[j] = NULL;
371                         }
372                         return (-ENOMEM);
373                 }
374                 acpi_perf_data[i] = data;
375         }
376
377         acpi_processor_preregister_performance(acpi_perf_data);
378         return 0;
379 }
380
381
382 /*
383  * Some BIOSes do SW_ANY coordination internally, either set it up in hw
384  * or do it in BIOS firmware and won't inform about it to OS. If not
385  * detected, this has a side effect of making CPU run at a different speed
386  * than OS intended it to run at. Detect it and handle it cleanly.
387  */
388 static int bios_with_sw_any_bug;
389 static int sw_any_bug_found(struct dmi_system_id *d)
390 {
391         bios_with_sw_any_bug = 1;
392         return 0;
393 }
394
395
396 static struct dmi_system_id sw_any_bug_dmi_table[] = {
397         {
398                 .callback = sw_any_bug_found,
399                 .ident = "Supermicro Server X6DLP",
400                 .matches = {
401                         DMI_MATCH(DMI_SYS_VENDOR, "Supermicro"),
402                         DMI_MATCH(DMI_BIOS_VERSION, "080010"),
403                         DMI_MATCH(DMI_PRODUCT_NAME, "X6DLP"),
404                 },
405         },
406         { }
407 };
408
409
410 /*
411  * centrino_cpu_init_acpi - register with ACPI P-States library
412  *
413  * Register with the ACPI P-States library (part of drivers/acpi/processor.c)
414  * in order to determine correct frequency and voltage pairings by reading
415  * the _PSS of the ACPI DSDT or SSDT tables.
416  */
417 static int centrino_cpu_init_acpi(struct cpufreq_policy *policy)
418 {
419         unsigned long                   cur_freq;
420         int                             result = 0, i;
421         unsigned int                    cpu = policy->cpu;
422         struct acpi_processor_performance       *p;
423
424         p = acpi_perf_data[cpu];
425
426         /* register with ACPI core */
427         if (acpi_processor_register_performance(p, cpu)) {
428                 dprintk(PFX "obtaining ACPI data failed\n");
429                 return -EIO;
430         }
431
432         policy->shared_type = p->shared_type;
433         /*
434          * Will let policy->cpus know about dependency only when software 
435          * coordination is required.
436          */
437         if (policy->shared_type == CPUFREQ_SHARED_TYPE_ALL ||
438             policy->shared_type == CPUFREQ_SHARED_TYPE_ANY) {
439                 policy->cpus = p->shared_cpu_map;
440         }
441
442 #ifdef CONFIG_SMP
443         dmi_check_system(sw_any_bug_dmi_table);
444         if (bios_with_sw_any_bug && cpus_weight(policy->cpus) == 1) {
445                 policy->shared_type = CPUFREQ_SHARED_TYPE_ALL;
446                 policy->cpus = cpu_core_map[cpu];
447         }
448 #endif
449
450         /* verify the acpi_data */
451         if (p->state_count <= 1) {
452                 dprintk("No P-States\n");
453                 result = -ENODEV;
454                 goto err_unreg;
455         }
456
457         if ((p->control_register.space_id != ACPI_ADR_SPACE_FIXED_HARDWARE) ||
458             (p->status_register.space_id != ACPI_ADR_SPACE_FIXED_HARDWARE)) {
459                 dprintk("Invalid control/status registers (%x - %x)\n",
460                         p->control_register.space_id, p->status_register.space_id);
461                 result = -EIO;
462                 goto err_unreg;
463         }
464
465         for (i=0; i<p->state_count; i++) {
466                 if (p->states[i].control != p->states[i].status) {
467                         dprintk("Different control (%llu) and status values (%llu)\n",
468                                 p->states[i].control, p->states[i].status);
469                         result = -EINVAL;
470                         goto err_unreg;
471                 }
472
473                 if (!p->states[i].core_frequency) {
474                         dprintk("Zero core frequency for state %u\n", i);
475                         result = -EINVAL;
476                         goto err_unreg;
477                 }
478
479                 if (p->states[i].core_frequency > p->states[0].core_frequency) {
480                         dprintk("P%u has larger frequency (%llu) than P0 (%llu), skipping\n", i,
481                                 p->states[i].core_frequency, p->states[0].core_frequency);
482                         p->states[i].core_frequency = 0;
483                         continue;
484                 }
485         }
486
487         centrino_model[cpu] = kzalloc(sizeof(struct cpu_model), GFP_KERNEL);
488         if (!centrino_model[cpu]) {
489                 result = -ENOMEM;
490                 goto err_unreg;
491         }
492
493         centrino_model[cpu]->model_name=NULL;
494         centrino_model[cpu]->max_freq = p->states[0].core_frequency * 1000;
495         centrino_model[cpu]->op_points =  kmalloc(sizeof(struct cpufreq_frequency_table) *
496                                              (p->state_count + 1), GFP_KERNEL);
497         if (!centrino_model[cpu]->op_points) {
498                 result = -ENOMEM;
499                 goto err_kfree;
500         }
501
502         for (i=0; i<p->state_count; i++) {
503                 centrino_model[cpu]->op_points[i].index = p->states[i].control;
504                 centrino_model[cpu]->op_points[i].frequency = p->states[i].core_frequency * 1000;
505                 dprintk("adding state %i with frequency %u and control value %04x\n", 
506                         i, centrino_model[cpu]->op_points[i].frequency, centrino_model[cpu]->op_points[i].index);
507         }
508         centrino_model[cpu]->op_points[p->state_count].frequency = CPUFREQ_TABLE_END;
509
510         cur_freq = get_cur_freq(cpu);
511
512         for (i=0; i<p->state_count; i++) {
513                 if (!p->states[i].core_frequency) {
514                         dprintk("skipping state %u\n", i);
515                         centrino_model[cpu]->op_points[i].frequency = CPUFREQ_ENTRY_INVALID;
516                         continue;
517                 }
518                 
519                 if (extract_clock(centrino_model[cpu]->op_points[i].index, cpu, 0) !=
520                     (centrino_model[cpu]->op_points[i].frequency)) {
521                         dprintk("Invalid encoded frequency (%u vs. %u)\n",
522                                 extract_clock(centrino_model[cpu]->op_points[i].index, cpu, 0),
523                                 centrino_model[cpu]->op_points[i].frequency);
524                         result = -EINVAL;
525                         goto err_kfree_all;
526                 }
527
528                 if (cur_freq == centrino_model[cpu]->op_points[i].frequency)
529                         p->state = i;
530         }
531
532         /* notify BIOS that we exist */
533         acpi_processor_notify_smm(THIS_MODULE);
534
535         return 0;
536
537  err_kfree_all:
538         kfree(centrino_model[cpu]->op_points);
539  err_kfree:
540         kfree(centrino_model[cpu]);
541  err_unreg:
542         acpi_processor_unregister_performance(p, cpu);
543         dprintk(PFX "invalid ACPI data\n");
544         return (result);
545 }
546 #else
547 static inline int centrino_cpu_init_acpi(struct cpufreq_policy *policy) { return -ENODEV; }
548 static inline int centrino_cpu_early_init_acpi(void) { return 0; }
549 #endif
550
551 static int centrino_cpu_init(struct cpufreq_policy *policy)
552 {
553         struct cpuinfo_x86 *cpu = &cpu_data[policy->cpu];
554         unsigned freq;
555         unsigned l, h;
556         int ret;
557         int i;
558
559         /* Only Intel makes Enhanced Speedstep-capable CPUs */
560         if (cpu->x86_vendor != X86_VENDOR_INTEL || !cpu_has(cpu, X86_FEATURE_EST))
561                 return -ENODEV;
562
563         if (cpu_has(cpu, X86_FEATURE_CONSTANT_TSC))
564                 centrino_driver.flags |= CPUFREQ_CONST_LOOPS;
565
566         if (centrino_cpu_init_acpi(policy)) {
567                 if (policy->cpu != 0)
568                         return -ENODEV;
569
570                 for (i = 0; i < N_IDS; i++)
571                         if (centrino_verify_cpu_id(cpu, &cpu_ids[i]))
572                                 break;
573
574                 if (i != N_IDS)
575                         centrino_cpu[policy->cpu] = &cpu_ids[i];
576
577                 if (!centrino_cpu[policy->cpu]) {
578                         dprintk("found unsupported CPU with "
579                         "Enhanced SpeedStep: send /proc/cpuinfo to "
580                         MAINTAINER "\n");
581                         return -ENODEV;
582                 }
583
584                 if (centrino_cpu_init_table(policy)) {
585                         return -ENODEV;
586                 }
587         }
588
589         /* Check to see if Enhanced SpeedStep is enabled, and try to
590            enable it if not. */
591         rdmsr(MSR_IA32_MISC_ENABLE, l, h);
592
593         if (!(l & (1<<16))) {
594                 l |= (1<<16);
595                 dprintk("trying to enable Enhanced SpeedStep (%x)\n", l);
596                 wrmsr(MSR_IA32_MISC_ENABLE, l, h);
597
598                 /* check to see if it stuck */
599                 rdmsr(MSR_IA32_MISC_ENABLE, l, h);
600                 if (!(l & (1<<16))) {
601                         printk(KERN_INFO PFX "couldn't enable Enhanced SpeedStep\n");
602                         return -ENODEV;
603                 }
604         }
605
606         freq = get_cur_freq(policy->cpu);
607
608         policy->governor = CPUFREQ_DEFAULT_GOVERNOR;
609         policy->cpuinfo.transition_latency = 10000; /* 10uS transition latency */
610         policy->cur = freq;
611
612         dprintk("centrino_cpu_init: cur=%dkHz\n", policy->cur);
613
614         ret = cpufreq_frequency_table_cpuinfo(policy, centrino_model[policy->cpu]->op_points);
615         if (ret)
616                 return (ret);
617
618         cpufreq_frequency_table_get_attr(centrino_model[policy->cpu]->op_points, policy->cpu);
619
620         return 0;
621 }
622
623 static int centrino_cpu_exit(struct cpufreq_policy *policy)
624 {
625         unsigned int cpu = policy->cpu;
626
627         if (!centrino_model[cpu])
628                 return -ENODEV;
629
630         cpufreq_frequency_table_put_attr(cpu);
631
632 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
633         if (!centrino_model[cpu]->model_name) {
634                 static struct acpi_processor_performance *p;
635
636                 if (acpi_perf_data[cpu]) {
637                         p = acpi_perf_data[cpu];
638                         dprintk("unregistering and freeing ACPI data\n");
639                         acpi_processor_unregister_performance(p, cpu);
640                         kfree(centrino_model[cpu]->op_points);
641                         kfree(centrino_model[cpu]);
642                 }
643         }
644 #endif
645
646         centrino_model[cpu] = NULL;
647
648         return 0;
649 }
650
651 /**
652  * centrino_verify - verifies a new CPUFreq policy
653  * @policy: new policy
654  *
655  * Limit must be within this model's frequency range at least one
656  * border included.
657  */
658 static int centrino_verify (struct cpufreq_policy *policy)
659 {
660         return cpufreq_frequency_table_verify(policy, centrino_model[policy->cpu]->op_points);
661 }
662
663 /**
664  * centrino_setpolicy - set a new CPUFreq policy
665  * @policy: new policy
666  * @target_freq: the target frequency
667  * @relation: how that frequency relates to achieved frequency (CPUFREQ_RELATION_L or CPUFREQ_RELATION_H)
668  *
669  * Sets a new CPUFreq policy.
670  */
671 static int centrino_target (struct cpufreq_policy *policy,
672                             unsigned int target_freq,
673                             unsigned int relation)
674 {
675         unsigned int    newstate = 0;
676         unsigned int    msr, oldmsr = 0, h = 0, cpu = policy->cpu;
677         struct cpufreq_freqs    freqs;
678         cpumask_t               online_policy_cpus;
679         cpumask_t               saved_mask;
680         cpumask_t               set_mask;
681         cpumask_t               covered_cpus;
682         int                     retval = 0;
683         unsigned int            j, k, first_cpu, tmp;
684
685         if (unlikely(centrino_model[cpu] == NULL))
686                 return -ENODEV;
687
688         if (unlikely(cpufreq_frequency_table_target(policy,
689                         centrino_model[cpu]->op_points,
690                         target_freq,
691                         relation,
692                         &newstate))) {
693                 return -EINVAL;
694         }
695
696 #ifdef CONFIG_HOTPLUG_CPU
697         /* cpufreq holds the hotplug lock, so we are safe from here on */
698         cpus_and(online_policy_cpus, cpu_online_map, policy->cpus);
699 #else
700         online_policy_cpus = policy->cpus;
701 #endif
702
703         saved_mask = current->cpus_allowed;
704         first_cpu = 1;
705         cpus_clear(covered_cpus);
706         for_each_cpu_mask(j, online_policy_cpus) {
707                 /*
708                  * Support for SMP systems.
709                  * Make sure we are running on CPU that wants to change freq
710                  */
711                 cpus_clear(set_mask);
712                 if (policy->shared_type == CPUFREQ_SHARED_TYPE_ANY)
713                         cpus_or(set_mask, set_mask, online_policy_cpus);
714                 else
715                         cpu_set(j, set_mask);
716
717                 set_cpus_allowed(current, set_mask);
718                 if (unlikely(!cpu_isset(smp_processor_id(), set_mask))) {
719                         dprintk("couldn't limit to CPUs in this domain\n");
720                         retval = -EAGAIN;
721                         if (first_cpu) {
722                                 /* We haven't started the transition yet. */
723                                 goto migrate_end;
724                         }
725                         break;
726                 }
727
728                 msr = centrino_model[cpu]->op_points[newstate].index;
729
730                 if (first_cpu) {
731                         rdmsr(MSR_IA32_PERF_CTL, oldmsr, h);
732                         if (msr == (oldmsr & 0xffff)) {
733                                 dprintk("no change needed - msr was and needs "
734                                         "to be %x\n", oldmsr);
735                                 retval = 0;
736                                 goto migrate_end;
737                         }
738
739                         freqs.old = extract_clock(oldmsr, cpu, 0);
740                         freqs.new = extract_clock(msr, cpu, 0);
741
742                         dprintk("target=%dkHz old=%d new=%d msr=%04x\n",
743                                 target_freq, freqs.old, freqs.new, msr);
744
745                         for_each_cpu_mask(k, online_policy_cpus) {
746                                 freqs.cpu = k;
747                                 cpufreq_notify_transition(&freqs,
748                                         CPUFREQ_PRECHANGE);
749                         }
750
751                         first_cpu = 0;
752                         /* all but 16 LSB are reserved, treat them with care */
753                         oldmsr &= ~0xffff;
754                         msr &= 0xffff;
755                         oldmsr |= msr;
756                 }
757
758                 wrmsr(MSR_IA32_PERF_CTL, oldmsr, h);
759                 if (policy->shared_type == CPUFREQ_SHARED_TYPE_ANY)
760                         break;
761
762                 cpu_set(j, covered_cpus);
763         }
764
765         for_each_cpu_mask(k, online_policy_cpus) {
766                 freqs.cpu = k;
767                 cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
768         }
769
770         if (unlikely(retval)) {
771                 /*
772                  * We have failed halfway through the frequency change.
773                  * We have sent callbacks to policy->cpus and
774                  * MSRs have already been written on coverd_cpus.
775                  * Best effort undo..
776                  */
777
778                 if (!cpus_empty(covered_cpus)) {
779                         for_each_cpu_mask(j, covered_cpus) {
780                                 set_cpus_allowed(current, cpumask_of_cpu(j));
781                                 wrmsr(MSR_IA32_PERF_CTL, oldmsr, h);
782                         }
783                 }
784
785                 tmp = freqs.new;
786                 freqs.new = freqs.old;
787                 freqs.old = tmp;
788                 for_each_cpu_mask(j, online_policy_cpus) {
789                         freqs.cpu = j;
790                         cpufreq_notify_transition(&freqs, CPUFREQ_PRECHANGE);
791                         cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
792                 }
793         }
794
795 migrate_end:
796         set_cpus_allowed(current, saved_mask);
797         return 0;
798 }
799
800 static struct freq_attr* centrino_attr[] = {
801         &cpufreq_freq_attr_scaling_available_freqs,
802         NULL,
803 };
804
805 static struct cpufreq_driver centrino_driver = {
806         .name           = "centrino", /* should be speedstep-centrino,
807                                          but there's a 16 char limit */
808         .init           = centrino_cpu_init,
809         .exit           = centrino_cpu_exit,
810         .verify         = centrino_verify,
811         .target         = centrino_target,
812         .get            = get_cur_freq,
813         .attr           = centrino_attr,
814         .owner          = THIS_MODULE,
815 };
816
817
818 /**
819  * centrino_init - initializes the Enhanced SpeedStep CPUFreq driver
820  *
821  * Initializes the Enhanced SpeedStep support. Returns -ENODEV on
822  * unsupported devices, -ENOENT if there's no voltage table for this
823  * particular CPU model, -EINVAL on problems during initiatization,
824  * and zero on success.
825  *
826  * This is quite picky.  Not only does the CPU have to advertise the
827  * "est" flag in the cpuid capability flags, we look for a specific
828  * CPU model and stepping, and we need to have the exact model name in
829  * our voltage tables.  That is, be paranoid about not releasing
830  * someone's valuable magic smoke.
831  */
832 static int __init centrino_init(void)
833 {
834         struct cpuinfo_x86 *cpu = cpu_data;
835
836         if (!cpu_has(cpu, X86_FEATURE_EST))
837                 return -ENODEV;
838
839         centrino_cpu_early_init_acpi();
840
841         return cpufreq_register_driver(&centrino_driver);
842 }
843
844 static void __exit centrino_exit(void)
845 {
846 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
847         unsigned int j;
848 #endif
849         
850         cpufreq_unregister_driver(&centrino_driver);
851
852 #ifdef CONFIG_X86_SPEEDSTEP_CENTRINO_ACPI
853         for_each_possible_cpu(j) {
854                 kfree(acpi_perf_data[j]);
855                 acpi_perf_data[j] = NULL;
856         }
857 #endif
858 }
859
860 MODULE_AUTHOR ("Jeremy Fitzhardinge <jeremy@goop.org>");
861 MODULE_DESCRIPTION ("Enhanced SpeedStep driver for Intel Pentium M processors.");
862 MODULE_LICENSE ("GPL");
863
864 late_initcall(centrino_init);
865 module_exit(centrino_exit);