1 | /* $NetBSD: nouveau_subdev_ltcg_gf100.c,v 1.1.1.1 2014/08/06 12:36:31 riastradh Exp $ */ |
2 | |
3 | /* |
4 | * Copyright 2012 Red Hat Inc. |
5 | * |
6 | * Permission is hereby granted, free of charge, to any person obtaining a |
7 | * copy of this software and associated documentation files (the "Software"), |
8 | * to deal in the Software without restriction, including without limitation |
9 | * the rights to use, copy, modify, merge, publish, distribute, sublicense, |
10 | * and/or sell copies of the Software, and to permit persons to whom the |
11 | * Software is furnished to do so, subject to the following conditions: |
12 | * |
13 | * The above copyright notice and this permission notice shall be included in |
14 | * all copies or substantial portions of the Software. |
15 | * |
16 | * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR |
17 | * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, |
18 | * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL |
19 | * THE COPYRIGHT HOLDER(S) OR AUTHOR(S) BE LIABLE FOR ANY CLAIM, DAMAGES OR |
20 | * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, |
21 | * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR |
22 | * OTHER DEALINGS IN THE SOFTWARE. |
23 | * |
24 | * Authors: Ben Skeggs |
25 | */ |
26 | |
27 | #include <sys/cdefs.h> |
28 | __KERNEL_RCSID(0, "$NetBSD: nouveau_subdev_ltcg_gf100.c,v 1.1.1.1 2014/08/06 12:36:31 riastradh Exp $" ); |
29 | |
30 | #include <subdev/fb.h> |
31 | #include <subdev/timer.h> |
32 | |
33 | #include "gf100.h" |
34 | |
35 | static void |
36 | gf100_ltcg_lts_isr(struct gf100_ltcg_priv *priv, int ltc, int lts) |
37 | { |
38 | u32 base = 0x141000 + (ltc * 0x2000) + (lts * 0x400); |
39 | u32 stat = nv_rd32(priv, base + 0x020); |
40 | |
41 | if (stat) { |
42 | nv_info(priv, "LTC%d_LTS%d: 0x%08x\n" , ltc, lts, stat); |
43 | nv_wr32(priv, base + 0x020, stat); |
44 | } |
45 | } |
46 | |
47 | static void |
48 | gf100_ltcg_intr(struct nouveau_subdev *subdev) |
49 | { |
50 | struct gf100_ltcg_priv *priv = (void *)subdev; |
51 | u32 mask; |
52 | |
53 | mask = nv_rd32(priv, 0x00017c); |
54 | while (mask) { |
55 | u32 lts, ltc = __ffs(mask); |
56 | for (lts = 0; lts < priv->lts_nr; lts++) |
57 | gf100_ltcg_lts_isr(priv, ltc, lts); |
58 | mask &= ~(1 << ltc); |
59 | } |
60 | |
61 | /* we do something horribly wrong and upset PMFB a lot, so mask off |
62 | * interrupts from it after the first one until it's fixed |
63 | */ |
64 | nv_mask(priv, 0x000640, 0x02000000, 0x00000000); |
65 | } |
66 | |
67 | int |
68 | gf100_ltcg_tags_alloc(struct nouveau_ltcg *ltcg, u32 n, |
69 | struct nouveau_mm_node **pnode) |
70 | { |
71 | struct gf100_ltcg_priv *priv = (struct gf100_ltcg_priv *)ltcg; |
72 | int ret; |
73 | |
74 | ret = nouveau_mm_head(&priv->tags, 1, n, n, 1, pnode); |
75 | if (ret) |
76 | *pnode = NULL; |
77 | |
78 | return ret; |
79 | } |
80 | |
81 | void |
82 | gf100_ltcg_tags_free(struct nouveau_ltcg *ltcg, struct nouveau_mm_node **pnode) |
83 | { |
84 | struct gf100_ltcg_priv *priv = (struct gf100_ltcg_priv *)ltcg; |
85 | |
86 | nouveau_mm_free(&priv->tags, pnode); |
87 | } |
88 | |
89 | static void |
90 | gf100_ltcg_tags_clear(struct nouveau_ltcg *ltcg, u32 first, u32 count) |
91 | { |
92 | struct gf100_ltcg_priv *priv = (struct gf100_ltcg_priv *)ltcg; |
93 | u32 last = first + count - 1; |
94 | int p, i; |
95 | |
96 | BUG_ON((first > last) || (last >= priv->num_tags)); |
97 | |
98 | nv_wr32(priv, 0x17e8cc, first); |
99 | nv_wr32(priv, 0x17e8d0, last); |
100 | nv_wr32(priv, 0x17e8c8, 0x4); /* trigger clear */ |
101 | |
102 | /* wait until it's finished with clearing */ |
103 | for (p = 0; p < priv->ltc_nr; ++p) { |
104 | for (i = 0; i < priv->lts_nr; ++i) |
105 | nv_wait(priv, 0x1410c8 + p * 0x2000 + i * 0x400, ~0, 0); |
106 | } |
107 | } |
108 | |
109 | /* TODO: Figure out tag memory details and drop the over-cautious allocation. |
110 | */ |
111 | int |
112 | gf100_ltcg_init_tag_ram(struct nouveau_fb *pfb, struct gf100_ltcg_priv *priv) |
113 | { |
114 | u32 tag_size, tag_margin, tag_align; |
115 | int ret; |
116 | |
117 | /* tags for 1/4 of VRAM should be enough (8192/4 per GiB of VRAM) */ |
118 | priv->num_tags = (pfb->ram->size >> 17) / 4; |
119 | if (priv->num_tags > (1 << 17)) |
120 | priv->num_tags = 1 << 17; /* we have 17 bits in PTE */ |
121 | priv->num_tags = (priv->num_tags + 63) & ~63; /* round up to 64 */ |
122 | |
123 | tag_align = priv->ltc_nr * 0x800; |
124 | tag_margin = (tag_align < 0x6000) ? 0x6000 : tag_align; |
125 | |
126 | /* 4 part 4 sub: 0x2000 bytes for 56 tags */ |
127 | /* 3 part 4 sub: 0x6000 bytes for 168 tags */ |
128 | /* |
129 | * About 147 bytes per tag. Let's be safe and allocate x2, which makes |
130 | * 0x4980 bytes for 64 tags, and round up to 0x6000 bytes for 64 tags. |
131 | * |
132 | * For 4 GiB of memory we'll have 8192 tags which makes 3 MiB, < 0.1 %. |
133 | */ |
134 | tag_size = (priv->num_tags / 64) * 0x6000 + tag_margin; |
135 | tag_size += tag_align; |
136 | tag_size = (tag_size + 0xfff) >> 12; /* round up */ |
137 | |
138 | ret = nouveau_mm_tail(&pfb->vram, 1, tag_size, tag_size, 1, |
139 | &priv->tag_ram); |
140 | if (ret) { |
141 | priv->num_tags = 0; |
142 | } else { |
143 | u64 tag_base = (priv->tag_ram->offset << 12) + tag_margin; |
144 | |
145 | tag_base += tag_align - 1; |
146 | ret = do_div(tag_base, tag_align); |
147 | |
148 | priv->tag_base = tag_base; |
149 | } |
150 | ret = nouveau_mm_init(&priv->tags, 0, priv->num_tags, 1); |
151 | |
152 | return ret; |
153 | } |
154 | |
155 | static int |
156 | gf100_ltcg_ctor(struct nouveau_object *parent, struct nouveau_object *engine, |
157 | struct nouveau_oclass *oclass, void *data, u32 size, |
158 | struct nouveau_object **pobject) |
159 | { |
160 | struct gf100_ltcg_priv *priv; |
161 | struct nouveau_fb *pfb = nouveau_fb(parent); |
162 | u32 parts, mask; |
163 | int ret, i; |
164 | |
165 | ret = nouveau_ltcg_create(parent, engine, oclass, &priv); |
166 | *pobject = nv_object(priv); |
167 | if (ret) |
168 | return ret; |
169 | |
170 | parts = nv_rd32(priv, 0x022438); |
171 | mask = nv_rd32(priv, 0x022554); |
172 | for (i = 0; i < parts; i++) { |
173 | if (!(mask & (1 << i))) |
174 | priv->ltc_nr++; |
175 | } |
176 | priv->lts_nr = nv_rd32(priv, 0x17e8dc) >> 28; |
177 | |
178 | ret = gf100_ltcg_init_tag_ram(pfb, priv); |
179 | if (ret) |
180 | return ret; |
181 | |
182 | priv->base.tags_alloc = gf100_ltcg_tags_alloc; |
183 | priv->base.tags_free = gf100_ltcg_tags_free; |
184 | priv->base.tags_clear = gf100_ltcg_tags_clear; |
185 | |
186 | nv_subdev(priv)->intr = gf100_ltcg_intr; |
187 | return 0; |
188 | } |
189 | |
190 | void |
191 | gf100_ltcg_dtor(struct nouveau_object *object) |
192 | { |
193 | struct nouveau_ltcg *ltcg = (struct nouveau_ltcg *)object; |
194 | struct gf100_ltcg_priv *priv = (struct gf100_ltcg_priv *)ltcg; |
195 | struct nouveau_fb *pfb = nouveau_fb(ltcg->base.base.parent); |
196 | |
197 | nouveau_mm_fini(&priv->tags); |
198 | nouveau_mm_free(&pfb->vram, &priv->tag_ram); |
199 | |
200 | nouveau_ltcg_destroy(ltcg); |
201 | } |
202 | |
203 | static int |
204 | gf100_ltcg_init(struct nouveau_object *object) |
205 | { |
206 | struct nouveau_ltcg *ltcg = (struct nouveau_ltcg *)object; |
207 | struct gf100_ltcg_priv *priv = (struct gf100_ltcg_priv *)ltcg; |
208 | int ret; |
209 | |
210 | ret = nouveau_ltcg_init(ltcg); |
211 | if (ret) |
212 | return ret; |
213 | |
214 | nv_mask(priv, 0x17e820, 0x00100000, 0x00000000); /* INTR_EN &= ~0x10 */ |
215 | nv_wr32(priv, 0x17e8d8, priv->ltc_nr); |
216 | if (nv_device(ltcg)->card_type >= NV_E0) |
217 | nv_wr32(priv, 0x17e000, priv->ltc_nr); |
218 | nv_wr32(priv, 0x17e8d4, priv->tag_base); |
219 | return 0; |
220 | } |
221 | |
222 | struct nouveau_oclass * |
223 | gf100_ltcg_oclass = &(struct nouveau_oclass) { |
224 | .handle = NV_SUBDEV(LTCG, 0xc0), |
225 | .ofuncs = &(struct nouveau_ofuncs) { |
226 | .ctor = gf100_ltcg_ctor, |
227 | .dtor = gf100_ltcg_dtor, |
228 | .init = gf100_ltcg_init, |
229 | .fini = _nouveau_ltcg_fini, |
230 | }, |
231 | }; |
232 | |