]>
Commit | Line | Data |
---|---|---|
1da177e4 LT |
1 | /* |
2 | * Pentium 4/Xeon CPU on demand clock modulation/speed scaling | |
3 | * (C) 2002 - 2003 Dominik Brodowski <[email protected]> | |
4 | * (C) 2002 Zwane Mwaikambo <[email protected]> | |
5 | * (C) 2002 Arjan van de Ven <[email protected]> | |
6 | * (C) 2002 Tora T. Engstad | |
7 | * All Rights Reserved | |
8 | * | |
9 | * This program is free software; you can redistribute it and/or | |
10 | * modify it under the terms of the GNU General Public License | |
11 | * as published by the Free Software Foundation; either version | |
12 | * 2 of the License, or (at your option) any later version. | |
13 | * | |
14 | * The author(s) of this software shall not be held liable for damages | |
15 | * of any nature resulting due to the use of this software. This | |
16 | * software is provided AS-IS with no warranties. | |
32ee8c3e | 17 | * |
1da177e4 LT |
18 | * Date Errata Description |
19 | * 20020525 N44, O17 12.5% or 25% DC causes lockup | |
20 | * | |
21 | */ | |
22 | ||
1c5864e2 JP |
23 | #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt |
24 | ||
1da177e4 | 25 | #include <linux/kernel.h> |
32ee8c3e | 26 | #include <linux/module.h> |
1da177e4 LT |
27 | #include <linux/init.h> |
28 | #include <linux/smp.h> | |
29 | #include <linux/cpufreq.h> | |
1da177e4 | 30 | #include <linux/cpumask.h> |
bbfebd66 | 31 | #include <linux/timex.h> |
1da177e4 | 32 | |
32ee8c3e | 33 | #include <asm/processor.h> |
1da177e4 | 34 | #include <asm/msr.h> |
199785ea | 35 | #include <asm/timer.h> |
fa8031ae | 36 | #include <asm/cpu_device_id.h> |
1da177e4 LT |
37 | |
38 | #include "speedstep-lib.h" | |
39 | ||
1da177e4 LT |
40 | /* |
41 | * Duty Cycle (3bits), note DC_DISABLE is not specified in | |
42 | * intel docs i just use it to mean disable | |
43 | */ | |
44 | enum { | |
45 | DC_RESV, DC_DFLT, DC_25PT, DC_38PT, DC_50PT, | |
46 | DC_64PT, DC_75PT, DC_88PT, DC_DISABLE | |
47 | }; | |
48 | ||
49 | #define DC_ENTRIES 8 | |
50 | ||
51 | ||
52 | static int has_N44_O17_errata[NR_CPUS]; | |
53 | static unsigned int stock_freq; | |
54 | static struct cpufreq_driver p4clockmod_driver; | |
55 | static unsigned int cpufreq_p4_get(unsigned int cpu); | |
56 | ||
57 | static int cpufreq_p4_setdc(unsigned int cpu, unsigned int newstate) | |
58 | { | |
59 | u32 l, h; | |
60 | ||
e9f51837 | 61 | if ((newstate > DC_DISABLE) || (newstate == DC_RESV)) |
1da177e4 LT |
62 | return -EINVAL; |
63 | ||
551948bc | 64 | rdmsr_on_cpu(cpu, MSR_IA32_THERM_STATUS, &l, &h); |
1da177e4 LT |
65 | |
66 | if (l & 0x01) | |
2d06d8c4 | 67 | pr_debug("CPU#%d currently thermal throttled\n", cpu); |
1da177e4 | 68 | |
bbfebd66 DJ |
69 | if (has_N44_O17_errata[cpu] && |
70 | (newstate == DC_25PT || newstate == DC_DFLT)) | |
1da177e4 LT |
71 | newstate = DC_38PT; |
72 | ||
551948bc | 73 | rdmsr_on_cpu(cpu, MSR_IA32_THERM_CONTROL, &l, &h); |
1da177e4 | 74 | if (newstate == DC_DISABLE) { |
2d06d8c4 | 75 | pr_debug("CPU#%d disabling modulation\n", cpu); |
551948bc | 76 | wrmsr_on_cpu(cpu, MSR_IA32_THERM_CONTROL, l & ~(1<<4), h); |
1da177e4 | 77 | } else { |
2d06d8c4 | 78 | pr_debug("CPU#%d setting duty cycle to %d%%\n", |
1da177e4 | 79 | cpu, ((125 * newstate) / 10)); |
32ee8c3e | 80 | /* bits 63 - 5 : reserved |
1da177e4 LT |
81 | * bit 4 : enable/disable |
82 | * bits 3-1 : duty cycle | |
83 | * bit 0 : reserved | |
84 | */ | |
85 | l = (l & ~14); | |
86 | l = l | (1<<4) | ((newstate & 0x7)<<1); | |
551948bc | 87 | wrmsr_on_cpu(cpu, MSR_IA32_THERM_CONTROL, l, h); |
1da177e4 LT |
88 | } |
89 | ||
90 | return 0; | |
91 | } | |
92 | ||
93 | ||
94 | static struct cpufreq_frequency_table p4clockmod_table[] = { | |
7f4b0461 VK |
95 | {0, DC_RESV, CPUFREQ_ENTRY_INVALID}, |
96 | {0, DC_DFLT, 0}, | |
97 | {0, DC_25PT, 0}, | |
98 | {0, DC_38PT, 0}, | |
99 | {0, DC_50PT, 0}, | |
100 | {0, DC_64PT, 0}, | |
101 | {0, DC_75PT, 0}, | |
102 | {0, DC_88PT, 0}, | |
103 | {0, DC_DISABLE, 0}, | |
104 | {0, DC_RESV, CPUFREQ_TABLE_END}, | |
1da177e4 LT |
105 | }; |
106 | ||
107 | ||
9c0ebcf7 | 108 | static int cpufreq_p4_target(struct cpufreq_policy *policy, unsigned int index) |
1da177e4 | 109 | { |
1da177e4 LT |
110 | int i; |
111 | ||
bbfebd66 DJ |
112 | /* run on each logical CPU, |
113 | * see section 13.15.3 of IA32 Intel Architecture Software | |
32ee8c3e | 114 | * Developer's Manual, Volume 3 |
1da177e4 | 115 | */ |
835481d9 | 116 | for_each_cpu(i, policy->cpus) |
9c0ebcf7 | 117 | cpufreq_p4_setdc(i, p4clockmod_table[index].driver_data); |
1da177e4 | 118 | |
1da177e4 LT |
119 | return 0; |
120 | } | |
121 | ||
122 | ||
1da177e4 LT |
123 | static unsigned int cpufreq_p4_get_frequency(struct cpuinfo_x86 *c) |
124 | { | |
4e74663c DB |
125 | if (c->x86 == 0x06) { |
126 | if (cpu_has(c, X86_FEATURE_EST)) | |
1c5864e2 | 127 | pr_warn_once("Warning: EST-capable CPU detected. The acpi-cpufreq module offers voltage scaling in addition to frequency scaling. You should use that instead of p4-clockmod, if possible.\n"); |
4e74663c DB |
128 | switch (c->x86_model) { |
129 | case 0x0E: /* Core */ | |
130 | case 0x0F: /* Core Duo */ | |
8529154e | 131 | case 0x16: /* Celeron Core */ |
43195037 | 132 | case 0x1C: /* Atom */ |
4e74663c | 133 | p4clockmod_driver.flags |= CPUFREQ_CONST_LOOPS; |
bbfebd66 | 134 | return speedstep_get_frequency(SPEEDSTEP_CPU_PCORE); |
4e74663c DB |
135 | case 0x0D: /* Pentium M (Dothan) */ |
136 | p4clockmod_driver.flags |= CPUFREQ_CONST_LOOPS; | |
137 | /* fall through */ | |
138 | case 0x09: /* Pentium M (Banias) */ | |
bbfebd66 | 139 | return speedstep_get_frequency(SPEEDSTEP_CPU_PM); |
4e74663c | 140 | } |
1da177e4 LT |
141 | } |
142 | ||
9d1f44ee | 143 | if (c->x86 != 0xF) |
1da177e4 | 144 | return 0; |
1da177e4 LT |
145 | |
146 | /* on P-4s, the TSC runs with constant frequency independent whether | |
147 | * throttling is active or not. */ | |
148 | p4clockmod_driver.flags |= CPUFREQ_CONST_LOOPS; | |
149 | ||
bbfebd66 | 150 | if (speedstep_detect_processor() == SPEEDSTEP_CPU_P4M) { |
1c5864e2 | 151 | pr_warn("Warning: Pentium 4-M detected. The speedstep-ich or acpi cpufreq modules offer voltage scaling in addition of frequency scaling. You should use either one instead of p4-clockmod, if possible.\n"); |
bbfebd66 | 152 | return speedstep_get_frequency(SPEEDSTEP_CPU_P4M); |
1da177e4 LT |
153 | } |
154 | ||
bbfebd66 | 155 | return speedstep_get_frequency(SPEEDSTEP_CPU_P4D); |
1da177e4 LT |
156 | } |
157 | ||
32ee8c3e | 158 | |
1da177e4 LT |
159 | |
160 | static int cpufreq_p4_cpu_init(struct cpufreq_policy *policy) | |
161 | { | |
92cb7612 | 162 | struct cpuinfo_x86 *c = &cpu_data(policy->cpu); |
1da177e4 LT |
163 | int cpuid = 0; |
164 | unsigned int i; | |
165 | ||
166 | #ifdef CONFIG_SMP | |
b60f9a7e | 167 | cpumask_copy(policy->cpus, topology_sibling_cpumask(policy->cpu)); |
1da177e4 LT |
168 | #endif |
169 | ||
170 | /* Errata workaround */ | |
b399151c | 171 | cpuid = (c->x86 << 8) | (c->x86_model << 4) | c->x86_stepping; |
1da177e4 LT |
172 | switch (cpuid) { |
173 | case 0x0f07: | |
174 | case 0x0f0a: | |
175 | case 0x0f11: | |
176 | case 0x0f12: | |
177 | has_N44_O17_errata[policy->cpu] = 1; | |
2d06d8c4 | 178 | pr_debug("has errata -- disabling low frequencies\n"); |
1da177e4 | 179 | } |
32ee8c3e | 180 | |
199785ea MCO |
181 | if (speedstep_detect_processor() == SPEEDSTEP_CPU_P4D && |
182 | c->x86_model < 2) { | |
183 | /* switch to maximum frequency and measure result */ | |
184 | cpufreq_p4_setdc(policy->cpu, DC_DISABLE); | |
185 | recalibrate_cpu_khz(); | |
186 | } | |
1da177e4 LT |
187 | /* get max frequency */ |
188 | stock_freq = cpufreq_p4_get_frequency(c); | |
189 | if (!stock_freq) | |
190 | return -EINVAL; | |
191 | ||
192 | /* table init */ | |
bbfebd66 DJ |
193 | for (i = 1; (p4clockmod_table[i].frequency != CPUFREQ_TABLE_END); i++) { |
194 | if ((i < 2) && (has_N44_O17_errata[policy->cpu])) | |
1da177e4 LT |
195 | p4clockmod_table[i].frequency = CPUFREQ_ENTRY_INVALID; |
196 | else | |
197 | p4clockmod_table[i].frequency = (stock_freq * i)/8; | |
198 | } | |
32ee8c3e | 199 | |
1da177e4 | 200 | /* cpuinfo and default policy values */ |
36e8abf3 DJ |
201 | |
202 | /* the transition latency is set to be 1 higher than the maximum | |
203 | * transition latency of the ondemand governor */ | |
204 | policy->cpuinfo.transition_latency = 10000001; | |
b01b531f | 205 | policy->freq_table = &p4clockmod_table[0]; |
1da177e4 | 206 | |
b01b531f | 207 | return 0; |
1da177e4 LT |
208 | } |
209 | ||
210 | ||
1da177e4 LT |
211 | static unsigned int cpufreq_p4_get(unsigned int cpu) |
212 | { | |
1da177e4 LT |
213 | u32 l, h; |
214 | ||
551948bc | 215 | rdmsr_on_cpu(cpu, MSR_IA32_THERM_CONTROL, &l, &h); |
1da177e4 LT |
216 | |
217 | if (l & 0x10) { | |
218 | l = l >> 1; | |
219 | l &= 0x7; | |
220 | } else | |
221 | l = DC_DISABLE; | |
222 | ||
223 | if (l != DC_DISABLE) | |
bbfebd66 | 224 | return stock_freq * l / 8; |
1da177e4 LT |
225 | |
226 | return stock_freq; | |
227 | } | |
228 | ||
1da177e4 | 229 | static struct cpufreq_driver p4clockmod_driver = { |
522f70ce | 230 | .verify = cpufreq_generic_frequency_table_verify, |
9c0ebcf7 | 231 | .target_index = cpufreq_p4_target, |
1da177e4 | 232 | .init = cpufreq_p4_cpu_init, |
1da177e4 LT |
233 | .get = cpufreq_p4_get, |
234 | .name = "p4-clockmod", | |
522f70ce | 235 | .attr = cpufreq_generic_attr, |
1da177e4 LT |
236 | }; |
237 | ||
fa8031ae AK |
238 | static const struct x86_cpu_id cpufreq_p4_id[] = { |
239 | { X86_VENDOR_INTEL, X86_FAMILY_ANY, X86_MODEL_ANY, X86_FEATURE_ACC }, | |
240 | {} | |
241 | }; | |
242 | ||
243 | /* | |
244 | * Intentionally no MODULE_DEVICE_TABLE here: this driver should not | |
245 | * be auto loaded. Please don't add one. | |
246 | */ | |
1da177e4 LT |
247 | |
248 | static int __init cpufreq_p4_init(void) | |
32ee8c3e | 249 | { |
1da177e4 LT |
250 | int ret; |
251 | ||
252 | /* | |
32ee8c3e | 253 | * THERM_CONTROL is architectural for IA32 now, so |
1da177e4 LT |
254 | * we can rely on the capability checks |
255 | */ | |
fa8031ae | 256 | if (!x86_match_cpu(cpufreq_p4_id) || !boot_cpu_has(X86_FEATURE_ACPI)) |
1da177e4 LT |
257 | return -ENODEV; |
258 | ||
259 | ret = cpufreq_register_driver(&p4clockmod_driver); | |
260 | if (!ret) | |
1c5864e2 | 261 | pr_info("P4/Xeon(TM) CPU On-Demand Clock Modulation available\n"); |
1da177e4 | 262 | |
bbfebd66 | 263 | return ret; |
1da177e4 LT |
264 | } |
265 | ||
266 | ||
267 | static void __exit cpufreq_p4_exit(void) | |
268 | { | |
269 | cpufreq_unregister_driver(&p4clockmod_driver); | |
270 | } | |
271 | ||
272 | ||
bbfebd66 DJ |
273 | MODULE_AUTHOR("Zwane Mwaikambo <[email protected]>"); |
274 | MODULE_DESCRIPTION("cpufreq driver for Pentium(TM) 4/Xeon(TM)"); | |
275 | MODULE_LICENSE("GPL"); | |
1da177e4 LT |
276 | |
277 | late_initcall(cpufreq_p4_init); | |
278 | module_exit(cpufreq_p4_exit); |