Merge tag 'iommu-updates-v5.4' of git://git.kernel.org/pub/scm/linux/kernel/git/joro...
[sfrench/cifs-2.6.git] / arch / x86 / kernel / amd_nb.c
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * Shared support code for AMD K8 northbridges and derivates.
4  * Copyright 2006 Andi Kleen, SUSE Labs.
5  */
6
7 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
8
9 #include <linux/types.h>
10 #include <linux/slab.h>
11 #include <linux/init.h>
12 #include <linux/errno.h>
13 #include <linux/export.h>
14 #include <linux/spinlock.h>
15 #include <linux/pci_ids.h>
16 #include <asm/amd_nb.h>
17
18 #define PCI_DEVICE_ID_AMD_17H_ROOT      0x1450
19 #define PCI_DEVICE_ID_AMD_17H_M10H_ROOT 0x15d0
20 #define PCI_DEVICE_ID_AMD_17H_M30H_ROOT 0x1480
21 #define PCI_DEVICE_ID_AMD_17H_DF_F4     0x1464
22 #define PCI_DEVICE_ID_AMD_17H_M10H_DF_F4 0x15ec
23 #define PCI_DEVICE_ID_AMD_17H_M30H_DF_F4 0x1494
24 #define PCI_DEVICE_ID_AMD_17H_M70H_DF_F4 0x1444
25
26 /* Protect the PCI config register pairs used for SMN and DF indirect access. */
27 static DEFINE_MUTEX(smn_mutex);
28
29 static u32 *flush_words;
30
31 static const struct pci_device_id amd_root_ids[] = {
32         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_ROOT) },
33         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_ROOT) },
34         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_ROOT) },
35         {}
36 };
37
38
39 #define PCI_DEVICE_ID_AMD_CNB17H_F4     0x1704
40
41 const struct pci_device_id amd_nb_misc_ids[] = {
42         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_K8_NB_MISC) },
43         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_10H_NB_MISC) },
44         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_NB_F3) },
45         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M10H_F3) },
46         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M30H_NB_F3) },
47         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M60H_NB_F3) },
48         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_NB_F3) },
49         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_M30H_NB_F3) },
50         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_DF_F3) },
51         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_DF_F3) },
52         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_DF_F3) },
53         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_CNB17H_F3) },
54         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M70H_DF_F3) },
55         {}
56 };
57 EXPORT_SYMBOL_GPL(amd_nb_misc_ids);
58
59 static const struct pci_device_id amd_nb_link_ids[] = {
60         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_NB_F4) },
61         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M30H_NB_F4) },
62         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_15H_M60H_NB_F4) },
63         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_NB_F4) },
64         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_16H_M30H_NB_F4) },
65         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_DF_F4) },
66         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M10H_DF_F4) },
67         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M30H_DF_F4) },
68         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_17H_M70H_DF_F4) },
69         { PCI_DEVICE(PCI_VENDOR_ID_AMD, PCI_DEVICE_ID_AMD_CNB17H_F4) },
70         {}
71 };
72
73 static const struct pci_device_id hygon_root_ids[] = {
74         { PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_ROOT) },
75         {}
76 };
77
78 static const struct pci_device_id hygon_nb_misc_ids[] = {
79         { PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_DF_F3) },
80         {}
81 };
82
83 static const struct pci_device_id hygon_nb_link_ids[] = {
84         { PCI_DEVICE(PCI_VENDOR_ID_HYGON, PCI_DEVICE_ID_AMD_17H_DF_F4) },
85         {}
86 };
87
88 const struct amd_nb_bus_dev_range amd_nb_bus_dev_ranges[] __initconst = {
89         { 0x00, 0x18, 0x20 },
90         { 0xff, 0x00, 0x20 },
91         { 0xfe, 0x00, 0x20 },
92         { }
93 };
94
95 static struct amd_northbridge_info amd_northbridges;
96
97 u16 amd_nb_num(void)
98 {
99         return amd_northbridges.num;
100 }
101 EXPORT_SYMBOL_GPL(amd_nb_num);
102
103 bool amd_nb_has_feature(unsigned int feature)
104 {
105         return ((amd_northbridges.flags & feature) == feature);
106 }
107 EXPORT_SYMBOL_GPL(amd_nb_has_feature);
108
109 struct amd_northbridge *node_to_amd_nb(int node)
110 {
111         return (node < amd_northbridges.num) ? &amd_northbridges.nb[node] : NULL;
112 }
113 EXPORT_SYMBOL_GPL(node_to_amd_nb);
114
115 static struct pci_dev *next_northbridge(struct pci_dev *dev,
116                                         const struct pci_device_id *ids)
117 {
118         do {
119                 dev = pci_get_device(PCI_ANY_ID, PCI_ANY_ID, dev);
120                 if (!dev)
121                         break;
122         } while (!pci_match_id(ids, dev));
123         return dev;
124 }
125
126 static int __amd_smn_rw(u16 node, u32 address, u32 *value, bool write)
127 {
128         struct pci_dev *root;
129         int err = -ENODEV;
130
131         if (node >= amd_northbridges.num)
132                 goto out;
133
134         root = node_to_amd_nb(node)->root;
135         if (!root)
136                 goto out;
137
138         mutex_lock(&smn_mutex);
139
140         err = pci_write_config_dword(root, 0x60, address);
141         if (err) {
142                 pr_warn("Error programming SMN address 0x%x.\n", address);
143                 goto out_unlock;
144         }
145
146         err = (write ? pci_write_config_dword(root, 0x64, *value)
147                      : pci_read_config_dword(root, 0x64, value));
148         if (err)
149                 pr_warn("Error %s SMN address 0x%x.\n",
150                         (write ? "writing to" : "reading from"), address);
151
152 out_unlock:
153         mutex_unlock(&smn_mutex);
154
155 out:
156         return err;
157 }
158
159 int amd_smn_read(u16 node, u32 address, u32 *value)
160 {
161         return __amd_smn_rw(node, address, value, false);
162 }
163 EXPORT_SYMBOL_GPL(amd_smn_read);
164
165 int amd_smn_write(u16 node, u32 address, u32 value)
166 {
167         return __amd_smn_rw(node, address, &value, true);
168 }
169 EXPORT_SYMBOL_GPL(amd_smn_write);
170
171 /*
172  * Data Fabric Indirect Access uses FICAA/FICAD.
173  *
174  * Fabric Indirect Configuration Access Address (FICAA): Constructed based
175  * on the device's Instance Id and the PCI function and register offset of
176  * the desired register.
177  *
178  * Fabric Indirect Configuration Access Data (FICAD): There are FICAD LO
179  * and FICAD HI registers but so far we only need the LO register.
180  */
181 int amd_df_indirect_read(u16 node, u8 func, u16 reg, u8 instance_id, u32 *lo)
182 {
183         struct pci_dev *F4;
184         u32 ficaa;
185         int err = -ENODEV;
186
187         if (node >= amd_northbridges.num)
188                 goto out;
189
190         F4 = node_to_amd_nb(node)->link;
191         if (!F4)
192                 goto out;
193
194         ficaa  = 1;
195         ficaa |= reg & 0x3FC;
196         ficaa |= (func & 0x7) << 11;
197         ficaa |= instance_id << 16;
198
199         mutex_lock(&smn_mutex);
200
201         err = pci_write_config_dword(F4, 0x5C, ficaa);
202         if (err) {
203                 pr_warn("Error writing DF Indirect FICAA, FICAA=0x%x\n", ficaa);
204                 goto out_unlock;
205         }
206
207         err = pci_read_config_dword(F4, 0x98, lo);
208         if (err)
209                 pr_warn("Error reading DF Indirect FICAD LO, FICAA=0x%x.\n", ficaa);
210
211 out_unlock:
212         mutex_unlock(&smn_mutex);
213
214 out:
215         return err;
216 }
217 EXPORT_SYMBOL_GPL(amd_df_indirect_read);
218
219 int amd_cache_northbridges(void)
220 {
221         const struct pci_device_id *misc_ids = amd_nb_misc_ids;
222         const struct pci_device_id *link_ids = amd_nb_link_ids;
223         const struct pci_device_id *root_ids = amd_root_ids;
224         struct pci_dev *root, *misc, *link;
225         struct amd_northbridge *nb;
226         u16 roots_per_misc = 0;
227         u16 misc_count = 0;
228         u16 root_count = 0;
229         u16 i, j;
230
231         if (amd_northbridges.num)
232                 return 0;
233
234         if (boot_cpu_data.x86_vendor == X86_VENDOR_HYGON) {
235                 root_ids = hygon_root_ids;
236                 misc_ids = hygon_nb_misc_ids;
237                 link_ids = hygon_nb_link_ids;
238         }
239
240         misc = NULL;
241         while ((misc = next_northbridge(misc, misc_ids)) != NULL)
242                 misc_count++;
243
244         if (!misc_count)
245                 return -ENODEV;
246
247         root = NULL;
248         while ((root = next_northbridge(root, root_ids)) != NULL)
249                 root_count++;
250
251         if (root_count) {
252                 roots_per_misc = root_count / misc_count;
253
254                 /*
255                  * There should be _exactly_ N roots for each DF/SMN
256                  * interface.
257                  */
258                 if (!roots_per_misc || (root_count % roots_per_misc)) {
259                         pr_info("Unsupported AMD DF/PCI configuration found\n");
260                         return -ENODEV;
261                 }
262         }
263
264         nb = kcalloc(misc_count, sizeof(struct amd_northbridge), GFP_KERNEL);
265         if (!nb)
266                 return -ENOMEM;
267
268         amd_northbridges.nb = nb;
269         amd_northbridges.num = misc_count;
270
271         link = misc = root = NULL;
272         for (i = 0; i < amd_northbridges.num; i++) {
273                 node_to_amd_nb(i)->root = root =
274                         next_northbridge(root, root_ids);
275                 node_to_amd_nb(i)->misc = misc =
276                         next_northbridge(misc, misc_ids);
277                 node_to_amd_nb(i)->link = link =
278                         next_northbridge(link, link_ids);
279
280                 /*
281                  * If there are more PCI root devices than data fabric/
282                  * system management network interfaces, then the (N)
283                  * PCI roots per DF/SMN interface are functionally the
284                  * same (for DF/SMN access) and N-1 are redundant.  N-1
285                  * PCI roots should be skipped per DF/SMN interface so
286                  * the following DF/SMN interfaces get mapped to
287                  * correct PCI roots.
288                  */
289                 for (j = 1; j < roots_per_misc; j++)
290                         root = next_northbridge(root, root_ids);
291         }
292
293         if (amd_gart_present())
294                 amd_northbridges.flags |= AMD_NB_GART;
295
296         /*
297          * Check for L3 cache presence.
298          */
299         if (!cpuid_edx(0x80000006))
300                 return 0;
301
302         /*
303          * Some CPU families support L3 Cache Index Disable. There are some
304          * limitations because of E382 and E388 on family 0x10.
305          */
306         if (boot_cpu_data.x86 == 0x10 &&
307             boot_cpu_data.x86_model >= 0x8 &&
308             (boot_cpu_data.x86_model > 0x9 ||
309              boot_cpu_data.x86_stepping >= 0x1))
310                 amd_northbridges.flags |= AMD_NB_L3_INDEX_DISABLE;
311
312         if (boot_cpu_data.x86 == 0x15)
313                 amd_northbridges.flags |= AMD_NB_L3_INDEX_DISABLE;
314
315         /* L3 cache partitioning is supported on family 0x15 */
316         if (boot_cpu_data.x86 == 0x15)
317                 amd_northbridges.flags |= AMD_NB_L3_PARTITIONING;
318
319         return 0;
320 }
321 EXPORT_SYMBOL_GPL(amd_cache_northbridges);
322
323 /*
324  * Ignores subdevice/subvendor but as far as I can figure out
325  * they're useless anyways
326  */
327 bool __init early_is_amd_nb(u32 device)
328 {
329         const struct pci_device_id *misc_ids = amd_nb_misc_ids;
330         const struct pci_device_id *id;
331         u32 vendor = device & 0xffff;
332
333         if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD &&
334             boot_cpu_data.x86_vendor != X86_VENDOR_HYGON)
335                 return false;
336
337         if (boot_cpu_data.x86_vendor == X86_VENDOR_HYGON)
338                 misc_ids = hygon_nb_misc_ids;
339
340         device >>= 16;
341         for (id = misc_ids; id->vendor; id++)
342                 if (vendor == id->vendor && device == id->device)
343                         return true;
344         return false;
345 }
346
347 struct resource *amd_get_mmconfig_range(struct resource *res)
348 {
349         u32 address;
350         u64 base, msr;
351         unsigned int segn_busn_bits;
352
353         if (boot_cpu_data.x86_vendor != X86_VENDOR_AMD &&
354             boot_cpu_data.x86_vendor != X86_VENDOR_HYGON)
355                 return NULL;
356
357         /* assume all cpus from fam10h have mmconfig */
358         if (boot_cpu_data.x86 < 0x10)
359                 return NULL;
360
361         address = MSR_FAM10H_MMIO_CONF_BASE;
362         rdmsrl(address, msr);
363
364         /* mmconfig is not enabled */
365         if (!(msr & FAM10H_MMIO_CONF_ENABLE))
366                 return NULL;
367
368         base = msr & (FAM10H_MMIO_CONF_BASE_MASK<<FAM10H_MMIO_CONF_BASE_SHIFT);
369
370         segn_busn_bits = (msr >> FAM10H_MMIO_CONF_BUSRANGE_SHIFT) &
371                          FAM10H_MMIO_CONF_BUSRANGE_MASK;
372
373         res->flags = IORESOURCE_MEM;
374         res->start = base;
375         res->end = base + (1ULL<<(segn_busn_bits + 20)) - 1;
376         return res;
377 }
378
379 int amd_get_subcaches(int cpu)
380 {
381         struct pci_dev *link = node_to_amd_nb(amd_get_nb_id(cpu))->link;
382         unsigned int mask;
383
384         if (!amd_nb_has_feature(AMD_NB_L3_PARTITIONING))
385                 return 0;
386
387         pci_read_config_dword(link, 0x1d4, &mask);
388
389         return (mask >> (4 * cpu_data(cpu).cpu_core_id)) & 0xf;
390 }
391
392 int amd_set_subcaches(int cpu, unsigned long mask)
393 {
394         static unsigned int reset, ban;
395         struct amd_northbridge *nb = node_to_amd_nb(amd_get_nb_id(cpu));
396         unsigned int reg;
397         int cuid;
398
399         if (!amd_nb_has_feature(AMD_NB_L3_PARTITIONING) || mask > 0xf)
400                 return -EINVAL;
401
402         /* if necessary, collect reset state of L3 partitioning and BAN mode */
403         if (reset == 0) {
404                 pci_read_config_dword(nb->link, 0x1d4, &reset);
405                 pci_read_config_dword(nb->misc, 0x1b8, &ban);
406                 ban &= 0x180000;
407         }
408
409         /* deactivate BAN mode if any subcaches are to be disabled */
410         if (mask != 0xf) {
411                 pci_read_config_dword(nb->misc, 0x1b8, &reg);
412                 pci_write_config_dword(nb->misc, 0x1b8, reg & ~0x180000);
413         }
414
415         cuid = cpu_data(cpu).cpu_core_id;
416         mask <<= 4 * cuid;
417         mask |= (0xf ^ (1 << cuid)) << 26;
418
419         pci_write_config_dword(nb->link, 0x1d4, mask);
420
421         /* reset BAN mode if L3 partitioning returned to reset state */
422         pci_read_config_dword(nb->link, 0x1d4, &reg);
423         if (reg == reset) {
424                 pci_read_config_dword(nb->misc, 0x1b8, &reg);
425                 reg &= ~0x180000;
426                 pci_write_config_dword(nb->misc, 0x1b8, reg | ban);
427         }
428
429         return 0;
430 }
431
432 static void amd_cache_gart(void)
433 {
434         u16 i;
435
436         if (!amd_nb_has_feature(AMD_NB_GART))
437                 return;
438
439         flush_words = kmalloc_array(amd_northbridges.num, sizeof(u32), GFP_KERNEL);
440         if (!flush_words) {
441                 amd_northbridges.flags &= ~AMD_NB_GART;
442                 pr_notice("Cannot initialize GART flush words, GART support disabled\n");
443                 return;
444         }
445
446         for (i = 0; i != amd_northbridges.num; i++)
447                 pci_read_config_dword(node_to_amd_nb(i)->misc, 0x9c, &flush_words[i]);
448 }
449
450 void amd_flush_garts(void)
451 {
452         int flushed, i;
453         unsigned long flags;
454         static DEFINE_SPINLOCK(gart_lock);
455
456         if (!amd_nb_has_feature(AMD_NB_GART))
457                 return;
458
459         /*
460          * Avoid races between AGP and IOMMU. In theory it's not needed
461          * but I'm not sure if the hardware won't lose flush requests
462          * when another is pending. This whole thing is so expensive anyways
463          * that it doesn't matter to serialize more. -AK
464          */
465         spin_lock_irqsave(&gart_lock, flags);
466         flushed = 0;
467         for (i = 0; i < amd_northbridges.num; i++) {
468                 pci_write_config_dword(node_to_amd_nb(i)->misc, 0x9c,
469                                        flush_words[i] | 1);
470                 flushed++;
471         }
472         for (i = 0; i < amd_northbridges.num; i++) {
473                 u32 w;
474                 /* Make sure the hardware actually executed the flush*/
475                 for (;;) {
476                         pci_read_config_dword(node_to_amd_nb(i)->misc,
477                                               0x9c, &w);
478                         if (!(w & 1))
479                                 break;
480                         cpu_relax();
481                 }
482         }
483         spin_unlock_irqrestore(&gart_lock, flags);
484         if (!flushed)
485                 pr_notice("nothing to flush?\n");
486 }
487 EXPORT_SYMBOL_GPL(amd_flush_garts);
488
489 static void __fix_erratum_688(void *info)
490 {
491 #define MSR_AMD64_IC_CFG 0xC0011021
492
493         msr_set_bit(MSR_AMD64_IC_CFG, 3);
494         msr_set_bit(MSR_AMD64_IC_CFG, 14);
495 }
496
497 /* Apply erratum 688 fix so machines without a BIOS fix work. */
498 static __init void fix_erratum_688(void)
499 {
500         struct pci_dev *F4;
501         u32 val;
502
503         if (boot_cpu_data.x86 != 0x14)
504                 return;
505
506         if (!amd_northbridges.num)
507                 return;
508
509         F4 = node_to_amd_nb(0)->link;
510         if (!F4)
511                 return;
512
513         if (pci_read_config_dword(F4, 0x164, &val))
514                 return;
515
516         if (val & BIT(2))
517                 return;
518
519         on_each_cpu(__fix_erratum_688, NULL, 0);
520
521         pr_info("x86/cpu/AMD: CPU erratum 688 worked around\n");
522 }
523
524 static __init int init_amd_nbs(void)
525 {
526         amd_cache_northbridges();
527         amd_cache_gart();
528
529         fix_erratum_688();
530
531         return 0;
532 }
533
534 /* This has to go after the PCI subsystem */
535 fs_initcall(init_amd_nbs);