riva_hw.c 76 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237
  1. /***************************************************************************\
  2. |* *|
  3. |* Copyright 1993-1999 NVIDIA, Corporation. All rights reserved. *|
  4. |* *|
  5. |* NOTICE TO USER: The source code is copyrighted under U.S. and *|
  6. |* international laws. Users and possessors of this source code are *|
  7. |* hereby granted a nonexclusive, royalty-free copyright license to *|
  8. |* use this code in individual and commercial software. *|
  9. |* *|
  10. |* Any use of this source code must include, in the user documenta- *|
  11. |* tion and internal comments to the code, notices to the end user *|
  12. |* as follows: *|
  13. |* *|
  14. |* Copyright 1993-1999 NVIDIA, Corporation. All rights reserved. *|
  15. |* *|
  16. |* NVIDIA, CORPORATION MAKES NO REPRESENTATION ABOUT THE SUITABILITY *|
  17. |* OF THIS SOURCE CODE FOR ANY PURPOSE. IT IS PROVIDED "AS IS" *|
  18. |* WITHOUT EXPRESS OR IMPLIED WARRANTY OF ANY KIND. NVIDIA, CORPOR- *|
  19. |* ATION DISCLAIMS ALL WARRANTIES WITH REGARD TO THIS SOURCE CODE, *|
  20. |* INCLUDING ALL IMPLIED WARRANTIES OF MERCHANTABILITY, NONINFRINGE- *|
  21. |* MENT, AND FITNESS FOR A PARTICULAR PURPOSE. IN NO EVENT SHALL *|
  22. |* NVIDIA, CORPORATION BE LIABLE FOR ANY SPECIAL, INDIRECT, INCI- *|
  23. |* DENTAL, OR CONSEQUENTIAL DAMAGES, OR ANY DAMAGES WHATSOEVER RE- *|
  24. |* SULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION *|
  25. |* OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF *|
  26. |* OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOURCE CODE. *|
  27. |* *|
  28. |* U.S. Government End Users. This source code is a "commercial *|
  29. |* item," as that term is defined at 48 C.F.R. 2.101 (OCT 1995), *|
  30. |* consisting of "commercial computer software" and "commercial *|
  31. |* computer software documentation," as such terms are used in *|
  32. |* 48 C.F.R. 12.212 (SEPT 1995) and is provided to the U.S. Govern- *|
  33. |* ment only as a commercial end item. Consistent with 48 C.F.R. *|
  34. |* 12.212 and 48 C.F.R. 227.7202-1 through 227.7202-4 (JUNE 1995), *|
  35. |* all U.S. Government End Users acquire the source code with only *|
  36. |* those rights set forth herein. *|
  37. |* *|
  38. \***************************************************************************/
  39. /*
  40. * GPL licensing note -- nVidia is allowing a liberal interpretation of
  41. * the documentation restriction above, to merely say that this nVidia's
  42. * copyright and disclaimer should be included with all code derived
  43. * from this source. -- Jeff Garzik <jgarzik@pobox.com>, 01/Nov/99
  44. */
  45. /* $XFree86: xc/programs/Xserver/hw/xfree86/drivers/nv/riva_hw.c,v 1.33 2002/08/05 20:47:06 mvojkovi Exp $ */
  46. #include <linux/kernel.h>
  47. #include <linux/pci.h>
  48. #include <linux/pci_ids.h>
  49. #include "riva_hw.h"
  50. #include "riva_tbl.h"
  51. #include "nv_type.h"
  52. /*
  53. * This file is an OS-agnostic file used to make RIVA 128 and RIVA TNT
  54. * operate identically (except TNT has more memory and better 3D quality.
  55. */
  56. static int nv3Busy
  57. (
  58. RIVA_HW_INST *chip
  59. )
  60. {
  61. return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
  62. NV_RD32(&chip->PGRAPH[0x000006B0/4], 0) & 0x01);
  63. }
  64. static int nv4Busy
  65. (
  66. RIVA_HW_INST *chip
  67. )
  68. {
  69. return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
  70. NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
  71. }
  72. static int nv10Busy
  73. (
  74. RIVA_HW_INST *chip
  75. )
  76. {
  77. return ((NV_RD32(&chip->Rop->FifoFree, 0) < chip->FifoEmptyCount) ||
  78. NV_RD32(&chip->PGRAPH[0x00000700/4], 0) & 0x01);
  79. }
  80. static void vgaLockUnlock
  81. (
  82. RIVA_HW_INST *chip,
  83. int Lock
  84. )
  85. {
  86. U008 cr11;
  87. VGA_WR08(chip->PCIO, 0x3D4, 0x11);
  88. cr11 = VGA_RD08(chip->PCIO, 0x3D5);
  89. if(Lock) cr11 |= 0x80;
  90. else cr11 &= ~0x80;
  91. VGA_WR08(chip->PCIO, 0x3D5, cr11);
  92. }
  93. static void nv3LockUnlock
  94. (
  95. RIVA_HW_INST *chip,
  96. int Lock
  97. )
  98. {
  99. VGA_WR08(chip->PVIO, 0x3C4, 0x06);
  100. VGA_WR08(chip->PVIO, 0x3C5, Lock ? 0x99 : 0x57);
  101. vgaLockUnlock(chip, Lock);
  102. }
  103. static void nv4LockUnlock
  104. (
  105. RIVA_HW_INST *chip,
  106. int Lock
  107. )
  108. {
  109. VGA_WR08(chip->PCIO, 0x3D4, 0x1F);
  110. VGA_WR08(chip->PCIO, 0x3D5, Lock ? 0x99 : 0x57);
  111. vgaLockUnlock(chip, Lock);
  112. }
  113. static int ShowHideCursor
  114. (
  115. RIVA_HW_INST *chip,
  116. int ShowHide
  117. )
  118. {
  119. int cursor;
  120. cursor = chip->CurrentState->cursor1;
  121. chip->CurrentState->cursor1 = (chip->CurrentState->cursor1 & 0xFE) |
  122. (ShowHide & 0x01);
  123. VGA_WR08(chip->PCIO, 0x3D4, 0x31);
  124. VGA_WR08(chip->PCIO, 0x3D5, chip->CurrentState->cursor1);
  125. return (cursor & 0x01);
  126. }
  127. /****************************************************************************\
  128. * *
  129. * The video arbitration routines calculate some "magic" numbers. Fixes *
  130. * the snow seen when accessing the framebuffer without it. *
  131. * It just works (I hope). *
  132. * *
  133. \****************************************************************************/
  134. #define DEFAULT_GR_LWM 100
  135. #define DEFAULT_VID_LWM 100
  136. #define DEFAULT_GR_BURST_SIZE 256
  137. #define DEFAULT_VID_BURST_SIZE 128
  138. #define VIDEO 0
  139. #define GRAPHICS 1
  140. #define MPORT 2
  141. #define ENGINE 3
  142. #define GFIFO_SIZE 320
  143. #define GFIFO_SIZE_128 256
  144. #define MFIFO_SIZE 120
  145. #define VFIFO_SIZE 256
  146. typedef struct {
  147. int gdrain_rate;
  148. int vdrain_rate;
  149. int mdrain_rate;
  150. int gburst_size;
  151. int vburst_size;
  152. char vid_en;
  153. char gr_en;
  154. int wcmocc, wcgocc, wcvocc, wcvlwm, wcglwm;
  155. int by_gfacc;
  156. char vid_only_once;
  157. char gr_only_once;
  158. char first_vacc;
  159. char first_gacc;
  160. char first_macc;
  161. int vocc;
  162. int gocc;
  163. int mocc;
  164. char cur;
  165. char engine_en;
  166. char converged;
  167. int priority;
  168. } nv3_arb_info;
  169. typedef struct {
  170. int graphics_lwm;
  171. int video_lwm;
  172. int graphics_burst_size;
  173. int video_burst_size;
  174. int graphics_hi_priority;
  175. int media_hi_priority;
  176. int rtl_values;
  177. int valid;
  178. } nv3_fifo_info;
  179. typedef struct {
  180. char pix_bpp;
  181. char enable_video;
  182. char gr_during_vid;
  183. char enable_mp;
  184. int memory_width;
  185. int video_scale;
  186. int pclk_khz;
  187. int mclk_khz;
  188. int mem_page_miss;
  189. int mem_latency;
  190. char mem_aligned;
  191. } nv3_sim_state;
  192. typedef struct {
  193. int graphics_lwm;
  194. int video_lwm;
  195. int graphics_burst_size;
  196. int video_burst_size;
  197. int valid;
  198. } nv4_fifo_info;
  199. typedef struct {
  200. int pclk_khz;
  201. int mclk_khz;
  202. int nvclk_khz;
  203. char mem_page_miss;
  204. char mem_latency;
  205. int memory_width;
  206. char enable_video;
  207. char gr_during_vid;
  208. char pix_bpp;
  209. char mem_aligned;
  210. char enable_mp;
  211. } nv4_sim_state;
  212. typedef struct {
  213. int graphics_lwm;
  214. int video_lwm;
  215. int graphics_burst_size;
  216. int video_burst_size;
  217. int valid;
  218. } nv10_fifo_info;
  219. typedef struct {
  220. int pclk_khz;
  221. int mclk_khz;
  222. int nvclk_khz;
  223. char mem_page_miss;
  224. char mem_latency;
  225. u32 memory_type;
  226. int memory_width;
  227. char enable_video;
  228. char gr_during_vid;
  229. char pix_bpp;
  230. char mem_aligned;
  231. char enable_mp;
  232. } nv10_sim_state;
  233. static int nv3_iterate(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
  234. {
  235. int iter = 0;
  236. int tmp;
  237. int vfsize, mfsize, gfsize;
  238. int mburst_size = 32;
  239. int mmisses, gmisses, vmisses;
  240. int misses;
  241. int vlwm, glwm;
  242. int last, next, cur;
  243. int max_gfsize ;
  244. long ns;
  245. vlwm = 0;
  246. glwm = 0;
  247. vfsize = 0;
  248. gfsize = 0;
  249. cur = ainfo->cur;
  250. mmisses = 2;
  251. gmisses = 2;
  252. vmisses = 2;
  253. if (ainfo->gburst_size == 128) max_gfsize = GFIFO_SIZE_128;
  254. else max_gfsize = GFIFO_SIZE;
  255. max_gfsize = GFIFO_SIZE;
  256. while (1)
  257. {
  258. if (ainfo->vid_en)
  259. {
  260. if (ainfo->wcvocc > ainfo->vocc) ainfo->wcvocc = ainfo->vocc;
  261. if (ainfo->wcvlwm > vlwm) ainfo->wcvlwm = vlwm ;
  262. ns = 1000000 * ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
  263. vfsize = ns * ainfo->vdrain_rate / 1000000;
  264. vfsize = ainfo->wcvlwm - ainfo->vburst_size + vfsize;
  265. }
  266. if (state->enable_mp)
  267. {
  268. if (ainfo->wcmocc > ainfo->mocc) ainfo->wcmocc = ainfo->mocc;
  269. }
  270. if (ainfo->gr_en)
  271. {
  272. if (ainfo->wcglwm > glwm) ainfo->wcglwm = glwm ;
  273. if (ainfo->wcgocc > ainfo->gocc) ainfo->wcgocc = ainfo->gocc;
  274. ns = 1000000 * (ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
  275. gfsize = (ns * (long) ainfo->gdrain_rate)/1000000;
  276. gfsize = ainfo->wcglwm - ainfo->gburst_size + gfsize;
  277. }
  278. mfsize = 0;
  279. if (!state->gr_during_vid && ainfo->vid_en)
  280. if (ainfo->vid_en && (ainfo->vocc < 0) && !ainfo->vid_only_once)
  281. next = VIDEO;
  282. else if (ainfo->mocc < 0)
  283. next = MPORT;
  284. else if (ainfo->gocc< ainfo->by_gfacc)
  285. next = GRAPHICS;
  286. else return (0);
  287. else switch (ainfo->priority)
  288. {
  289. case VIDEO:
  290. if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
  291. next = VIDEO;
  292. else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
  293. next = GRAPHICS;
  294. else if (ainfo->mocc<0)
  295. next = MPORT;
  296. else return (0);
  297. break;
  298. case GRAPHICS:
  299. if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
  300. next = GRAPHICS;
  301. else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
  302. next = VIDEO;
  303. else if (ainfo->mocc<0)
  304. next = MPORT;
  305. else return (0);
  306. break;
  307. default:
  308. if (ainfo->mocc<0)
  309. next = MPORT;
  310. else if (ainfo->gr_en && ainfo->gocc<0 && !ainfo->gr_only_once)
  311. next = GRAPHICS;
  312. else if (ainfo->vid_en && ainfo->vocc<0 && !ainfo->vid_only_once)
  313. next = VIDEO;
  314. else return (0);
  315. break;
  316. }
  317. last = cur;
  318. cur = next;
  319. iter++;
  320. switch (cur)
  321. {
  322. case VIDEO:
  323. if (last==cur) misses = 0;
  324. else if (ainfo->first_vacc) misses = vmisses;
  325. else misses = 1;
  326. ainfo->first_vacc = 0;
  327. if (last!=cur)
  328. {
  329. ns = 1000000 * (vmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
  330. vlwm = ns * ainfo->vdrain_rate/ 1000000;
  331. vlwm = ainfo->vocc - vlwm;
  332. }
  333. ns = 1000000*(misses*state->mem_page_miss + ainfo->vburst_size)/(state->memory_width/8)/state->mclk_khz;
  334. ainfo->vocc = ainfo->vocc + ainfo->vburst_size - ns*ainfo->vdrain_rate/1000000;
  335. ainfo->gocc = ainfo->gocc - ns*ainfo->gdrain_rate/1000000;
  336. ainfo->mocc = ainfo->mocc - ns*ainfo->mdrain_rate/1000000;
  337. break;
  338. case GRAPHICS:
  339. if (last==cur) misses = 0;
  340. else if (ainfo->first_gacc) misses = gmisses;
  341. else misses = 1;
  342. ainfo->first_gacc = 0;
  343. if (last!=cur)
  344. {
  345. ns = 1000000*(gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz ;
  346. glwm = ns * ainfo->gdrain_rate/1000000;
  347. glwm = ainfo->gocc - glwm;
  348. }
  349. ns = 1000000*(misses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8))/state->mclk_khz;
  350. ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
  351. ainfo->gocc = ainfo->gocc + ainfo->gburst_size - ns*ainfo->gdrain_rate/1000000;
  352. ainfo->mocc = ainfo->mocc + 0 - ns*ainfo->mdrain_rate/1000000;
  353. break;
  354. default:
  355. if (last==cur) misses = 0;
  356. else if (ainfo->first_macc) misses = mmisses;
  357. else misses = 1;
  358. ainfo->first_macc = 0;
  359. ns = 1000000*(misses*state->mem_page_miss + mburst_size/(state->memory_width/8))/state->mclk_khz;
  360. ainfo->vocc = ainfo->vocc + 0 - ns*ainfo->vdrain_rate/1000000;
  361. ainfo->gocc = ainfo->gocc + 0 - ns*ainfo->gdrain_rate/1000000;
  362. ainfo->mocc = ainfo->mocc + mburst_size - ns*ainfo->mdrain_rate/1000000;
  363. break;
  364. }
  365. if (iter>100)
  366. {
  367. ainfo->converged = 0;
  368. return (1);
  369. }
  370. ns = 1000000*ainfo->gburst_size/(state->memory_width/8)/state->mclk_khz;
  371. tmp = ns * ainfo->gdrain_rate/1000000;
  372. if (abs(ainfo->gburst_size) + ((abs(ainfo->wcglwm) + 16 ) & ~0x7) - tmp > max_gfsize)
  373. {
  374. ainfo->converged = 0;
  375. return (1);
  376. }
  377. ns = 1000000*ainfo->vburst_size/(state->memory_width/8)/state->mclk_khz;
  378. tmp = ns * ainfo->vdrain_rate/1000000;
  379. if (abs(ainfo->vburst_size) + (abs(ainfo->wcvlwm + 32) & ~0xf) - tmp> VFIFO_SIZE)
  380. {
  381. ainfo->converged = 0;
  382. return (1);
  383. }
  384. if (abs(ainfo->gocc) > max_gfsize)
  385. {
  386. ainfo->converged = 0;
  387. return (1);
  388. }
  389. if (abs(ainfo->vocc) > VFIFO_SIZE)
  390. {
  391. ainfo->converged = 0;
  392. return (1);
  393. }
  394. if (abs(ainfo->mocc) > MFIFO_SIZE)
  395. {
  396. ainfo->converged = 0;
  397. return (1);
  398. }
  399. if (abs(vfsize) > VFIFO_SIZE)
  400. {
  401. ainfo->converged = 0;
  402. return (1);
  403. }
  404. if (abs(gfsize) > max_gfsize)
  405. {
  406. ainfo->converged = 0;
  407. return (1);
  408. }
  409. if (abs(mfsize) > MFIFO_SIZE)
  410. {
  411. ainfo->converged = 0;
  412. return (1);
  413. }
  414. }
  415. }
  416. static char nv3_arb(nv3_fifo_info * res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
  417. {
  418. long ens, vns, mns, gns;
  419. int mmisses, gmisses, vmisses, eburst_size, mburst_size;
  420. int refresh_cycle;
  421. refresh_cycle = 2*(state->mclk_khz/state->pclk_khz) + 5;
  422. mmisses = 2;
  423. if (state->mem_aligned) gmisses = 2;
  424. else gmisses = 3;
  425. vmisses = 2;
  426. eburst_size = state->memory_width * 1;
  427. mburst_size = 32;
  428. if (!state->mclk_khz)
  429. return (0);
  430. gns = 1000000 * (gmisses*state->mem_page_miss + state->mem_latency)/state->mclk_khz;
  431. ainfo->by_gfacc = gns*ainfo->gdrain_rate/1000000;
  432. ainfo->wcmocc = 0;
  433. ainfo->wcgocc = 0;
  434. ainfo->wcvocc = 0;
  435. ainfo->wcvlwm = 0;
  436. ainfo->wcglwm = 0;
  437. ainfo->engine_en = 1;
  438. ainfo->converged = 1;
  439. if (ainfo->engine_en)
  440. {
  441. ens = 1000000*(state->mem_page_miss + eburst_size/(state->memory_width/8) +refresh_cycle)/state->mclk_khz;
  442. ainfo->mocc = state->enable_mp ? 0-ens*ainfo->mdrain_rate/1000000 : 0;
  443. ainfo->vocc = ainfo->vid_en ? 0-ens*ainfo->vdrain_rate/1000000 : 0;
  444. ainfo->gocc = ainfo->gr_en ? 0-ens*ainfo->gdrain_rate/1000000 : 0;
  445. ainfo->cur = ENGINE;
  446. ainfo->first_vacc = 1;
  447. ainfo->first_gacc = 1;
  448. ainfo->first_macc = 1;
  449. nv3_iterate(res_info, state,ainfo);
  450. }
  451. if (state->enable_mp)
  452. {
  453. mns = 1000000 * (mmisses*state->mem_page_miss + mburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
  454. ainfo->mocc = state->enable_mp ? 0 : mburst_size - mns*ainfo->mdrain_rate/1000000;
  455. ainfo->vocc = ainfo->vid_en ? 0 : 0- mns*ainfo->vdrain_rate/1000000;
  456. ainfo->gocc = ainfo->gr_en ? 0: 0- mns*ainfo->gdrain_rate/1000000;
  457. ainfo->cur = MPORT;
  458. ainfo->first_vacc = 1;
  459. ainfo->first_gacc = 1;
  460. ainfo->first_macc = 0;
  461. nv3_iterate(res_info, state,ainfo);
  462. }
  463. if (ainfo->gr_en)
  464. {
  465. ainfo->first_vacc = 1;
  466. ainfo->first_gacc = 0;
  467. ainfo->first_macc = 1;
  468. gns = 1000000*(gmisses*state->mem_page_miss + ainfo->gburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
  469. ainfo->gocc = ainfo->gburst_size - gns*ainfo->gdrain_rate/1000000;
  470. ainfo->vocc = ainfo->vid_en? 0-gns*ainfo->vdrain_rate/1000000 : 0;
  471. ainfo->mocc = state->enable_mp ? 0-gns*ainfo->mdrain_rate/1000000: 0;
  472. ainfo->cur = GRAPHICS;
  473. nv3_iterate(res_info, state,ainfo);
  474. }
  475. if (ainfo->vid_en)
  476. {
  477. ainfo->first_vacc = 0;
  478. ainfo->first_gacc = 1;
  479. ainfo->first_macc = 1;
  480. vns = 1000000*(vmisses*state->mem_page_miss + ainfo->vburst_size/(state->memory_width/8) + refresh_cycle)/state->mclk_khz;
  481. ainfo->vocc = ainfo->vburst_size - vns*ainfo->vdrain_rate/1000000;
  482. ainfo->gocc = ainfo->gr_en? (0-vns*ainfo->gdrain_rate/1000000) : 0;
  483. ainfo->mocc = state->enable_mp? 0-vns*ainfo->mdrain_rate/1000000 :0 ;
  484. ainfo->cur = VIDEO;
  485. nv3_iterate(res_info, state, ainfo);
  486. }
  487. if (ainfo->converged)
  488. {
  489. res_info->graphics_lwm = (int)abs(ainfo->wcglwm) + 16;
  490. res_info->video_lwm = (int)abs(ainfo->wcvlwm) + 32;
  491. res_info->graphics_burst_size = ainfo->gburst_size;
  492. res_info->video_burst_size = ainfo->vburst_size;
  493. res_info->graphics_hi_priority = (ainfo->priority == GRAPHICS);
  494. res_info->media_hi_priority = (ainfo->priority == MPORT);
  495. if (res_info->video_lwm > 160)
  496. {
  497. res_info->graphics_lwm = 256;
  498. res_info->video_lwm = 128;
  499. res_info->graphics_burst_size = 64;
  500. res_info->video_burst_size = 64;
  501. res_info->graphics_hi_priority = 0;
  502. res_info->media_hi_priority = 0;
  503. ainfo->converged = 0;
  504. return (0);
  505. }
  506. if (res_info->video_lwm > 128)
  507. {
  508. res_info->video_lwm = 128;
  509. }
  510. return (1);
  511. }
  512. else
  513. {
  514. res_info->graphics_lwm = 256;
  515. res_info->video_lwm = 128;
  516. res_info->graphics_burst_size = 64;
  517. res_info->video_burst_size = 64;
  518. res_info->graphics_hi_priority = 0;
  519. res_info->media_hi_priority = 0;
  520. return (0);
  521. }
  522. }
  523. static char nv3_get_param(nv3_fifo_info *res_info, nv3_sim_state * state, nv3_arb_info *ainfo)
  524. {
  525. int done, g,v, p;
  526. done = 0;
  527. for (p=0; p < 2; p++)
  528. {
  529. for (g=128 ; g > 32; g= g>> 1)
  530. {
  531. for (v=128; v >=32; v = v>> 1)
  532. {
  533. ainfo->priority = p;
  534. ainfo->gburst_size = g;
  535. ainfo->vburst_size = v;
  536. done = nv3_arb(res_info, state,ainfo);
  537. if (done && (g==128))
  538. if ((res_info->graphics_lwm + g) > 256)
  539. done = 0;
  540. if (done)
  541. goto Done;
  542. }
  543. }
  544. }
  545. Done:
  546. return done;
  547. }
  548. static void nv3CalcArbitration
  549. (
  550. nv3_fifo_info * res_info,
  551. nv3_sim_state * state
  552. )
  553. {
  554. nv3_fifo_info save_info;
  555. nv3_arb_info ainfo;
  556. char res_gr, res_vid;
  557. ainfo.gr_en = 1;
  558. ainfo.vid_en = state->enable_video;
  559. ainfo.vid_only_once = 0;
  560. ainfo.gr_only_once = 0;
  561. ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
  562. ainfo.vdrain_rate = (int) state->pclk_khz * 2;
  563. if (state->video_scale != 0)
  564. ainfo.vdrain_rate = ainfo.vdrain_rate/state->video_scale;
  565. ainfo.mdrain_rate = 33000;
  566. res_info->rtl_values = 0;
  567. if (!state->gr_during_vid && state->enable_video)
  568. {
  569. ainfo.gr_only_once = 1;
  570. ainfo.gr_en = 1;
  571. ainfo.gdrain_rate = 0;
  572. res_vid = nv3_get_param(res_info, state, &ainfo);
  573. res_vid = ainfo.converged;
  574. save_info.video_lwm = res_info->video_lwm;
  575. save_info.video_burst_size = res_info->video_burst_size;
  576. ainfo.vid_en = 1;
  577. ainfo.vid_only_once = 1;
  578. ainfo.gr_en = 1;
  579. ainfo.gdrain_rate = (int) state->pclk_khz * (state->pix_bpp/8);
  580. ainfo.vdrain_rate = 0;
  581. res_gr = nv3_get_param(res_info, state, &ainfo);
  582. res_gr = ainfo.converged;
  583. res_info->video_lwm = save_info.video_lwm;
  584. res_info->video_burst_size = save_info.video_burst_size;
  585. res_info->valid = res_gr & res_vid;
  586. }
  587. else
  588. {
  589. if (!ainfo.gr_en) ainfo.gdrain_rate = 0;
  590. if (!ainfo.vid_en) ainfo.vdrain_rate = 0;
  591. res_gr = nv3_get_param(res_info, state, &ainfo);
  592. res_info->valid = ainfo.converged;
  593. }
  594. }
  595. static void nv3UpdateArbitrationSettings
  596. (
  597. unsigned VClk,
  598. unsigned pixelDepth,
  599. unsigned *burst,
  600. unsigned *lwm,
  601. RIVA_HW_INST *chip
  602. )
  603. {
  604. nv3_fifo_info fifo_data;
  605. nv3_sim_state sim_data;
  606. unsigned int M, N, P, pll, MClk;
  607. pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
  608. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  609. MClk = (N * chip->CrystalFreqKHz / M) >> P;
  610. sim_data.pix_bpp = (char)pixelDepth;
  611. sim_data.enable_video = 0;
  612. sim_data.enable_mp = 0;
  613. sim_data.video_scale = 1;
  614. sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
  615. 128 : 64;
  616. sim_data.memory_width = 128;
  617. sim_data.mem_latency = 9;
  618. sim_data.mem_aligned = 1;
  619. sim_data.mem_page_miss = 11;
  620. sim_data.gr_during_vid = 0;
  621. sim_data.pclk_khz = VClk;
  622. sim_data.mclk_khz = MClk;
  623. nv3CalcArbitration(&fifo_data, &sim_data);
  624. if (fifo_data.valid)
  625. {
  626. int b = fifo_data.graphics_burst_size >> 4;
  627. *burst = 0;
  628. while (b >>= 1)
  629. (*burst)++;
  630. *lwm = fifo_data.graphics_lwm >> 3;
  631. }
  632. else
  633. {
  634. *lwm = 0x24;
  635. *burst = 0x2;
  636. }
  637. }
  638. static void nv4CalcArbitration
  639. (
  640. nv4_fifo_info *fifo,
  641. nv4_sim_state *arb
  642. )
  643. {
  644. int data, pagemiss, cas,width, video_enable, bpp;
  645. int nvclks, mclks, pclks, vpagemiss, crtpagemiss, vbs;
  646. int found, mclk_extra, mclk_loop, cbs, m1, p1;
  647. int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
  648. int us_m, us_n, us_p, video_drain_rate, crtc_drain_rate;
  649. int vpm_us, us_video, vlwm, video_fill_us, cpm_us, us_crt,clwm;
  650. fifo->valid = 1;
  651. pclk_freq = arb->pclk_khz;
  652. mclk_freq = arb->mclk_khz;
  653. nvclk_freq = arb->nvclk_khz;
  654. pagemiss = arb->mem_page_miss;
  655. cas = arb->mem_latency;
  656. width = arb->memory_width >> 6;
  657. video_enable = arb->enable_video;
  658. bpp = arb->pix_bpp;
  659. mp_enable = arb->enable_mp;
  660. clwm = 0;
  661. vlwm = 0;
  662. cbs = 128;
  663. pclks = 2;
  664. nvclks = 2;
  665. nvclks += 2;
  666. nvclks += 1;
  667. mclks = 5;
  668. mclks += 3;
  669. mclks += 1;
  670. mclks += cas;
  671. mclks += 1;
  672. mclks += 1;
  673. mclks += 1;
  674. mclks += 1;
  675. mclk_extra = 3;
  676. nvclks += 2;
  677. nvclks += 1;
  678. nvclks += 1;
  679. nvclks += 1;
  680. if (mp_enable)
  681. mclks+=4;
  682. nvclks += 0;
  683. pclks += 0;
  684. found = 0;
  685. vbs = 0;
  686. while (found != 1)
  687. {
  688. fifo->valid = 1;
  689. found = 1;
  690. mclk_loop = mclks+mclk_extra;
  691. us_m = mclk_loop *1000*1000 / mclk_freq;
  692. us_n = nvclks*1000*1000 / nvclk_freq;
  693. us_p = nvclks*1000*1000 / pclk_freq;
  694. if (video_enable)
  695. {
  696. video_drain_rate = pclk_freq * 2;
  697. crtc_drain_rate = pclk_freq * bpp/8;
  698. vpagemiss = 2;
  699. vpagemiss += 1;
  700. crtpagemiss = 2;
  701. vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
  702. if (nvclk_freq * 2 > mclk_freq * width)
  703. video_fill_us = cbs*1000*1000 / 16 / nvclk_freq ;
  704. else
  705. video_fill_us = cbs*1000*1000 / (8 * width) / mclk_freq;
  706. us_video = vpm_us + us_m + us_n + us_p + video_fill_us;
  707. vlwm = us_video * video_drain_rate/(1000*1000);
  708. vlwm++;
  709. vbs = 128;
  710. if (vlwm > 128) vbs = 64;
  711. if (vlwm > (256-64)) vbs = 32;
  712. if (nvclk_freq * 2 > mclk_freq * width)
  713. video_fill_us = vbs *1000*1000/ 16 / nvclk_freq ;
  714. else
  715. video_fill_us = vbs*1000*1000 / (8 * width) / mclk_freq;
  716. cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
  717. us_crt =
  718. us_video
  719. +video_fill_us
  720. +cpm_us
  721. +us_m + us_n +us_p
  722. ;
  723. clwm = us_crt * crtc_drain_rate/(1000*1000);
  724. clwm++;
  725. }
  726. else
  727. {
  728. crtc_drain_rate = pclk_freq * bpp/8;
  729. crtpagemiss = 2;
  730. crtpagemiss += 1;
  731. cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
  732. us_crt = cpm_us + us_m + us_n + us_p ;
  733. clwm = us_crt * crtc_drain_rate/(1000*1000);
  734. clwm++;
  735. }
  736. m1 = clwm + cbs - 512;
  737. p1 = m1 * pclk_freq / mclk_freq;
  738. p1 = p1 * bpp / 8;
  739. if ((p1 < m1) && (m1 > 0))
  740. {
  741. fifo->valid = 0;
  742. found = 0;
  743. if (mclk_extra ==0) found = 1;
  744. mclk_extra--;
  745. }
  746. else if (video_enable)
  747. {
  748. if ((clwm > 511) || (vlwm > 255))
  749. {
  750. fifo->valid = 0;
  751. found = 0;
  752. if (mclk_extra ==0) found = 1;
  753. mclk_extra--;
  754. }
  755. }
  756. else
  757. {
  758. if (clwm > 519)
  759. {
  760. fifo->valid = 0;
  761. found = 0;
  762. if (mclk_extra ==0) found = 1;
  763. mclk_extra--;
  764. }
  765. }
  766. if (clwm < 384) clwm = 384;
  767. if (vlwm < 128) vlwm = 128;
  768. data = (int)(clwm);
  769. fifo->graphics_lwm = data;
  770. fifo->graphics_burst_size = 128;
  771. data = (int)((vlwm+15));
  772. fifo->video_lwm = data;
  773. fifo->video_burst_size = vbs;
  774. }
  775. }
  776. static void nv4UpdateArbitrationSettings
  777. (
  778. unsigned VClk,
  779. unsigned pixelDepth,
  780. unsigned *burst,
  781. unsigned *lwm,
  782. RIVA_HW_INST *chip
  783. )
  784. {
  785. nv4_fifo_info fifo_data;
  786. nv4_sim_state sim_data;
  787. unsigned int M, N, P, pll, MClk, NVClk, cfg1;
  788. pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
  789. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  790. MClk = (N * chip->CrystalFreqKHz / M) >> P;
  791. pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
  792. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  793. NVClk = (N * chip->CrystalFreqKHz / M) >> P;
  794. cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
  795. sim_data.pix_bpp = (char)pixelDepth;
  796. sim_data.enable_video = 0;
  797. sim_data.enable_mp = 0;
  798. sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
  799. 128 : 64;
  800. sim_data.mem_latency = (char)cfg1 & 0x0F;
  801. sim_data.mem_aligned = 1;
  802. sim_data.mem_page_miss = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
  803. sim_data.gr_during_vid = 0;
  804. sim_data.pclk_khz = VClk;
  805. sim_data.mclk_khz = MClk;
  806. sim_data.nvclk_khz = NVClk;
  807. nv4CalcArbitration(&fifo_data, &sim_data);
  808. if (fifo_data.valid)
  809. {
  810. int b = fifo_data.graphics_burst_size >> 4;
  811. *burst = 0;
  812. while (b >>= 1)
  813. (*burst)++;
  814. *lwm = fifo_data.graphics_lwm >> 3;
  815. }
  816. }
  817. static void nv10CalcArbitration
  818. (
  819. nv10_fifo_info *fifo,
  820. nv10_sim_state *arb
  821. )
  822. {
  823. int data, pagemiss, width, video_enable, bpp;
  824. int nvclks, mclks, pclks, vpagemiss, crtpagemiss;
  825. int nvclk_fill;
  826. int found, mclk_extra, mclk_loop, cbs, m1;
  827. int mclk_freq, pclk_freq, nvclk_freq, mp_enable;
  828. int us_m, us_m_min, us_n, us_p, crtc_drain_rate;
  829. int vus_m;
  830. int vpm_us, us_video, cpm_us, us_crt,clwm;
  831. int clwm_rnd_down;
  832. int m2us, us_pipe_min, p1clk, p2;
  833. int min_mclk_extra;
  834. int us_min_mclk_extra;
  835. fifo->valid = 1;
  836. pclk_freq = arb->pclk_khz; /* freq in KHz */
  837. mclk_freq = arb->mclk_khz;
  838. nvclk_freq = arb->nvclk_khz;
  839. pagemiss = arb->mem_page_miss;
  840. width = arb->memory_width/64;
  841. video_enable = arb->enable_video;
  842. bpp = arb->pix_bpp;
  843. mp_enable = arb->enable_mp;
  844. clwm = 0;
  845. cbs = 512;
  846. pclks = 4; /* lwm detect. */
  847. nvclks = 3; /* lwm -> sync. */
  848. nvclks += 2; /* fbi bus cycles (1 req + 1 busy) */
  849. mclks = 1; /* 2 edge sync. may be very close to edge so just put one. */
  850. mclks += 1; /* arb_hp_req */
  851. mclks += 5; /* ap_hp_req tiling pipeline */
  852. mclks += 2; /* tc_req latency fifo */
  853. mclks += 2; /* fb_cas_n_ memory request to fbio block */
  854. mclks += 7; /* sm_d_rdv data returned from fbio block */
  855. /* fb.rd.d.Put_gc need to accumulate 256 bits for read */
  856. if (arb->memory_type == 0)
  857. if (arb->memory_width == 64) /* 64 bit bus */
  858. mclks += 4;
  859. else
  860. mclks += 2;
  861. else
  862. if (arb->memory_width == 64) /* 64 bit bus */
  863. mclks += 2;
  864. else
  865. mclks += 1;
  866. if ((!video_enable) && (arb->memory_width == 128))
  867. {
  868. mclk_extra = (bpp == 32) ? 31 : 42; /* Margin of error */
  869. min_mclk_extra = 17;
  870. }
  871. else
  872. {
  873. mclk_extra = (bpp == 32) ? 8 : 4; /* Margin of error */
  874. /* mclk_extra = 4; */ /* Margin of error */
  875. min_mclk_extra = 18;
  876. }
  877. nvclks += 1; /* 2 edge sync. may be very close to edge so just put one. */
  878. nvclks += 1; /* fbi_d_rdv_n */
  879. nvclks += 1; /* Fbi_d_rdata */
  880. nvclks += 1; /* crtfifo load */
  881. if(mp_enable)
  882. mclks+=4; /* Mp can get in with a burst of 8. */
  883. /* Extra clocks determined by heuristics */
  884. nvclks += 0;
  885. pclks += 0;
  886. found = 0;
  887. while(found != 1) {
  888. fifo->valid = 1;
  889. found = 1;
  890. mclk_loop = mclks+mclk_extra;
  891. us_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
  892. us_m_min = mclks * 1000*1000 / mclk_freq; /* Minimum Mclk latency in us */
  893. us_min_mclk_extra = min_mclk_extra *1000*1000 / mclk_freq;
  894. us_n = nvclks*1000*1000 / nvclk_freq;/* nvclk latency in us */
  895. us_p = pclks*1000*1000 / pclk_freq;/* nvclk latency in us */
  896. us_pipe_min = us_m_min + us_n + us_p;
  897. vus_m = mclk_loop *1000*1000 / mclk_freq; /* Mclk latency in us */
  898. if(video_enable) {
  899. crtc_drain_rate = pclk_freq * bpp/8; /* MB/s */
  900. vpagemiss = 1; /* self generating page miss */
  901. vpagemiss += 1; /* One higher priority before */
  902. crtpagemiss = 2; /* self generating page miss */
  903. if(mp_enable)
  904. crtpagemiss += 1; /* if MA0 conflict */
  905. vpm_us = (vpagemiss * pagemiss)*1000*1000/mclk_freq;
  906. us_video = vpm_us + vus_m; /* Video has separate read return path */
  907. cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
  908. us_crt =
  909. us_video /* Wait for video */
  910. +cpm_us /* CRT Page miss */
  911. +us_m + us_n +us_p /* other latency */
  912. ;
  913. clwm = us_crt * crtc_drain_rate/(1000*1000);
  914. clwm++; /* fixed point <= float_point - 1. Fixes that */
  915. } else {
  916. crtc_drain_rate = pclk_freq * bpp/8; /* bpp * pclk/8 */
  917. crtpagemiss = 1; /* self generating page miss */
  918. crtpagemiss += 1; /* MA0 page miss */
  919. if(mp_enable)
  920. crtpagemiss += 1; /* if MA0 conflict */
  921. cpm_us = crtpagemiss * pagemiss *1000*1000/ mclk_freq;
  922. us_crt = cpm_us + us_m + us_n + us_p ;
  923. clwm = us_crt * crtc_drain_rate/(1000*1000);
  924. clwm++; /* fixed point <= float_point - 1. Fixes that */
  925. /*
  926. //
  927. // Another concern, only for high pclks so don't do this
  928. // with video:
  929. // What happens if the latency to fetch the cbs is so large that
  930. // fifo empties. In that case we need to have an alternate clwm value
  931. // based off the total burst fetch
  932. //
  933. us_crt = (cbs * 1000 * 1000)/ (8*width)/mclk_freq ;
  934. us_crt = us_crt + us_m + us_n + us_p + (4 * 1000 * 1000)/mclk_freq;
  935. clwm_mt = us_crt * crtc_drain_rate/(1000*1000);
  936. clwm_mt ++;
  937. if(clwm_mt > clwm)
  938. clwm = clwm_mt;
  939. */
  940. /* Finally, a heuristic check when width == 64 bits */
  941. if(width == 1){
  942. nvclk_fill = nvclk_freq * 8;
  943. if(crtc_drain_rate * 100 >= nvclk_fill * 102)
  944. clwm = 0xfff; /*Large number to fail */
  945. else if(crtc_drain_rate * 100 >= nvclk_fill * 98) {
  946. clwm = 1024;
  947. cbs = 512;
  948. }
  949. }
  950. }
  951. /*
  952. Overfill check:
  953. */
  954. clwm_rnd_down = ((int)clwm/8)*8;
  955. if (clwm_rnd_down < clwm)
  956. clwm += 8;
  957. m1 = clwm + cbs - 1024; /* Amount of overfill */
  958. m2us = us_pipe_min + us_min_mclk_extra;
  959. /* pclk cycles to drain */
  960. p1clk = m2us * pclk_freq/(1000*1000);
  961. p2 = p1clk * bpp / 8; /* bytes drained. */
  962. if((p2 < m1) && (m1 > 0)) {
  963. fifo->valid = 0;
  964. found = 0;
  965. if(min_mclk_extra == 0) {
  966. if(cbs <= 32) {
  967. found = 1; /* Can't adjust anymore! */
  968. } else {
  969. cbs = cbs/2; /* reduce the burst size */
  970. }
  971. } else {
  972. min_mclk_extra--;
  973. }
  974. } else {
  975. if (clwm > 1023){ /* Have some margin */
  976. fifo->valid = 0;
  977. found = 0;
  978. if(min_mclk_extra == 0)
  979. found = 1; /* Can't adjust anymore! */
  980. else
  981. min_mclk_extra--;
  982. }
  983. }
  984. if(clwm < (1024-cbs+8)) clwm = 1024-cbs+8;
  985. data = (int)(clwm);
  986. /* printf("CRT LWM: %f bytes, prog: 0x%x, bs: 256\n", clwm, data ); */
  987. fifo->graphics_lwm = data; fifo->graphics_burst_size = cbs;
  988. /* printf("VID LWM: %f bytes, prog: 0x%x, bs: %d\n, ", vlwm, data, vbs ); */
  989. fifo->video_lwm = 1024; fifo->video_burst_size = 512;
  990. }
  991. }
  992. static void nv10UpdateArbitrationSettings
  993. (
  994. unsigned VClk,
  995. unsigned pixelDepth,
  996. unsigned *burst,
  997. unsigned *lwm,
  998. RIVA_HW_INST *chip
  999. )
  1000. {
  1001. nv10_fifo_info fifo_data;
  1002. nv10_sim_state sim_data;
  1003. unsigned int M, N, P, pll, MClk, NVClk, cfg1;
  1004. pll = NV_RD32(&chip->PRAMDAC0[0x00000504/4], 0);
  1005. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  1006. MClk = (N * chip->CrystalFreqKHz / M) >> P;
  1007. pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
  1008. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  1009. NVClk = (N * chip->CrystalFreqKHz / M) >> P;
  1010. cfg1 = NV_RD32(&chip->PFB[0x00000204/4], 0);
  1011. sim_data.pix_bpp = (char)pixelDepth;
  1012. sim_data.enable_video = 0;
  1013. sim_data.enable_mp = 0;
  1014. sim_data.memory_type = (NV_RD32(&chip->PFB[0x00000200/4], 0) & 0x01) ?
  1015. 1 : 0;
  1016. sim_data.memory_width = (NV_RD32(&chip->PEXTDEV[0x00000000/4], 0) & 0x10) ?
  1017. 128 : 64;
  1018. sim_data.mem_latency = (char)cfg1 & 0x0F;
  1019. sim_data.mem_aligned = 1;
  1020. sim_data.mem_page_miss = (char)(((cfg1 >> 4) &0x0F) + ((cfg1 >> 31) & 0x01));
  1021. sim_data.gr_during_vid = 0;
  1022. sim_data.pclk_khz = VClk;
  1023. sim_data.mclk_khz = MClk;
  1024. sim_data.nvclk_khz = NVClk;
  1025. nv10CalcArbitration(&fifo_data, &sim_data);
  1026. if (fifo_data.valid)
  1027. {
  1028. int b = fifo_data.graphics_burst_size >> 4;
  1029. *burst = 0;
  1030. while (b >>= 1)
  1031. (*burst)++;
  1032. *lwm = fifo_data.graphics_lwm >> 3;
  1033. }
  1034. }
  1035. static void nForceUpdateArbitrationSettings
  1036. (
  1037. unsigned VClk,
  1038. unsigned pixelDepth,
  1039. unsigned *burst,
  1040. unsigned *lwm,
  1041. RIVA_HW_INST *chip,
  1042. struct pci_dev *pdev
  1043. )
  1044. {
  1045. nv10_fifo_info fifo_data;
  1046. nv10_sim_state sim_data;
  1047. unsigned int M, N, P, pll, MClk, NVClk;
  1048. unsigned int uMClkPostDiv;
  1049. struct pci_dev *dev;
  1050. int domain = pci_domain_nr(pdev->bus);
  1051. dev = pci_get_domain_bus_and_slot(domain, 0, 3);
  1052. pci_read_config_dword(dev, 0x6C, &uMClkPostDiv);
  1053. pci_dev_put(dev);
  1054. uMClkPostDiv = (uMClkPostDiv >> 8) & 0xf;
  1055. if(!uMClkPostDiv) uMClkPostDiv = 4;
  1056. MClk = 400000 / uMClkPostDiv;
  1057. pll = NV_RD32(&chip->PRAMDAC0[0x00000500/4], 0);
  1058. M = (pll >> 0) & 0xFF; N = (pll >> 8) & 0xFF; P = (pll >> 16) & 0x0F;
  1059. NVClk = (N * chip->CrystalFreqKHz / M) >> P;
  1060. sim_data.pix_bpp = (char)pixelDepth;
  1061. sim_data.enable_video = 0;
  1062. sim_data.enable_mp = 0;
  1063. dev = pci_get_domain_bus_and_slot(domain, 0, 1);
  1064. pci_read_config_dword(dev, 0x7C, &sim_data.memory_type);
  1065. pci_dev_put(dev);
  1066. sim_data.memory_type = (sim_data.memory_type >> 12) & 1;
  1067. sim_data.memory_width = 64;
  1068. sim_data.mem_latency = 3;
  1069. sim_data.mem_aligned = 1;
  1070. sim_data.mem_page_miss = 10;
  1071. sim_data.gr_during_vid = 0;
  1072. sim_data.pclk_khz = VClk;
  1073. sim_data.mclk_khz = MClk;
  1074. sim_data.nvclk_khz = NVClk;
  1075. nv10CalcArbitration(&fifo_data, &sim_data);
  1076. if (fifo_data.valid)
  1077. {
  1078. int b = fifo_data.graphics_burst_size >> 4;
  1079. *burst = 0;
  1080. while (b >>= 1)
  1081. (*burst)++;
  1082. *lwm = fifo_data.graphics_lwm >> 3;
  1083. }
  1084. }
  1085. /****************************************************************************\
  1086. * *
  1087. * RIVA Mode State Routines *
  1088. * *
  1089. \****************************************************************************/
  1090. /*
  1091. * Calculate the Video Clock parameters for the PLL.
  1092. */
  1093. static int CalcVClock
  1094. (
  1095. int clockIn,
  1096. int *clockOut,
  1097. int *mOut,
  1098. int *nOut,
  1099. int *pOut,
  1100. RIVA_HW_INST *chip
  1101. )
  1102. {
  1103. unsigned lowM, highM, highP;
  1104. unsigned DeltaNew, DeltaOld;
  1105. unsigned VClk, Freq;
  1106. unsigned M, N, P;
  1107. DeltaOld = 0xFFFFFFFF;
  1108. VClk = (unsigned)clockIn;
  1109. if (chip->CrystalFreqKHz == 13500)
  1110. {
  1111. lowM = 7;
  1112. highM = 13 - (chip->Architecture == NV_ARCH_03);
  1113. }
  1114. else
  1115. {
  1116. lowM = 8;
  1117. highM = 14 - (chip->Architecture == NV_ARCH_03);
  1118. }
  1119. highP = 4 - (chip->Architecture == NV_ARCH_03);
  1120. for (P = 0; P <= highP; P ++)
  1121. {
  1122. Freq = VClk << P;
  1123. if ((Freq >= 128000) && (Freq <= chip->MaxVClockFreqKHz))
  1124. {
  1125. for (M = lowM; M <= highM; M++)
  1126. {
  1127. N = (VClk << P) * M / chip->CrystalFreqKHz;
  1128. if(N <= 255) {
  1129. Freq = (chip->CrystalFreqKHz * N / M) >> P;
  1130. if (Freq > VClk)
  1131. DeltaNew = Freq - VClk;
  1132. else
  1133. DeltaNew = VClk - Freq;
  1134. if (DeltaNew < DeltaOld)
  1135. {
  1136. *mOut = M;
  1137. *nOut = N;
  1138. *pOut = P;
  1139. *clockOut = Freq;
  1140. DeltaOld = DeltaNew;
  1141. }
  1142. }
  1143. }
  1144. }
  1145. }
  1146. /* non-zero: M/N/P/clock values assigned. zero: error (not set) */
  1147. return (DeltaOld != 0xFFFFFFFF);
  1148. }
  1149. /*
  1150. * Calculate extended mode parameters (SVGA) and save in a
  1151. * mode state structure.
  1152. */
  1153. int CalcStateExt
  1154. (
  1155. RIVA_HW_INST *chip,
  1156. RIVA_HW_STATE *state,
  1157. struct pci_dev *pdev,
  1158. int bpp,
  1159. int width,
  1160. int hDisplaySize,
  1161. int height,
  1162. int dotClock
  1163. )
  1164. {
  1165. int pixelDepth;
  1166. int VClk, m, n, p;
  1167. /*
  1168. * Save mode parameters.
  1169. */
  1170. state->bpp = bpp; /* this is not bitsPerPixel, it's 8,15,16,32 */
  1171. state->width = width;
  1172. state->height = height;
  1173. /*
  1174. * Extended RIVA registers.
  1175. */
  1176. pixelDepth = (bpp + 1)/8;
  1177. if (!CalcVClock(dotClock, &VClk, &m, &n, &p, chip))
  1178. return -EINVAL;
  1179. switch (chip->Architecture)
  1180. {
  1181. case NV_ARCH_03:
  1182. nv3UpdateArbitrationSettings(VClk,
  1183. pixelDepth * 8,
  1184. &(state->arbitration0),
  1185. &(state->arbitration1),
  1186. chip);
  1187. state->cursor0 = 0x00;
  1188. state->cursor1 = 0x78;
  1189. state->cursor2 = 0x00000000;
  1190. state->pllsel = 0x10010100;
  1191. state->config = ((width + 31)/32)
  1192. | (((pixelDepth > 2) ? 3 : pixelDepth) << 8)
  1193. | 0x1000;
  1194. state->general = 0x00100100;
  1195. state->repaint1 = hDisplaySize < 1280 ? 0x06 : 0x02;
  1196. break;
  1197. case NV_ARCH_04:
  1198. nv4UpdateArbitrationSettings(VClk,
  1199. pixelDepth * 8,
  1200. &(state->arbitration0),
  1201. &(state->arbitration1),
  1202. chip);
  1203. state->cursor0 = 0x00;
  1204. state->cursor1 = 0xFC;
  1205. state->cursor2 = 0x00000000;
  1206. state->pllsel = 0x10000700;
  1207. state->config = 0x00001114;
  1208. state->general = bpp == 16 ? 0x00101100 : 0x00100100;
  1209. state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
  1210. break;
  1211. case NV_ARCH_10:
  1212. case NV_ARCH_20:
  1213. case NV_ARCH_30:
  1214. if((chip->Chipset == NV_CHIP_IGEFORCE2) ||
  1215. (chip->Chipset == NV_CHIP_0x01F0))
  1216. {
  1217. nForceUpdateArbitrationSettings(VClk,
  1218. pixelDepth * 8,
  1219. &(state->arbitration0),
  1220. &(state->arbitration1),
  1221. chip, pdev);
  1222. } else {
  1223. nv10UpdateArbitrationSettings(VClk,
  1224. pixelDepth * 8,
  1225. &(state->arbitration0),
  1226. &(state->arbitration1),
  1227. chip);
  1228. }
  1229. state->cursor0 = 0x80 | (chip->CursorStart >> 17);
  1230. state->cursor1 = (chip->CursorStart >> 11) << 2;
  1231. state->cursor2 = chip->CursorStart >> 24;
  1232. state->pllsel = 0x10000700;
  1233. state->config = NV_RD32(&chip->PFB[0x00000200/4], 0);
  1234. state->general = bpp == 16 ? 0x00101100 : 0x00100100;
  1235. state->repaint1 = hDisplaySize < 1280 ? 0x04 : 0x00;
  1236. break;
  1237. }
  1238. /* Paul Richards: below if block borks things in kernel for some reason */
  1239. /* Tony: Below is needed to set hardware in DirectColor */
  1240. if((bpp != 8) && (chip->Architecture != NV_ARCH_03))
  1241. state->general |= 0x00000030;
  1242. state->vpll = (p << 16) | (n << 8) | m;
  1243. state->repaint0 = (((width/8)*pixelDepth) & 0x700) >> 3;
  1244. state->pixel = pixelDepth > 2 ? 3 : pixelDepth;
  1245. state->offset0 =
  1246. state->offset1 =
  1247. state->offset2 =
  1248. state->offset3 = 0;
  1249. state->pitch0 =
  1250. state->pitch1 =
  1251. state->pitch2 =
  1252. state->pitch3 = pixelDepth * width;
  1253. return 0;
  1254. }
  1255. /*
  1256. * Load fixed function state and pre-calculated/stored state.
  1257. */
  1258. #define LOAD_FIXED_STATE(tbl,dev) \
  1259. for (i = 0; i < sizeof(tbl##Table##dev)/8; i++) \
  1260. NV_WR32(&chip->dev[tbl##Table##dev[i][0]], 0, tbl##Table##dev[i][1])
  1261. #define LOAD_FIXED_STATE_8BPP(tbl,dev) \
  1262. for (i = 0; i < sizeof(tbl##Table##dev##_8BPP)/8; i++) \
  1263. NV_WR32(&chip->dev[tbl##Table##dev##_8BPP[i][0]], 0, tbl##Table##dev##_8BPP[i][1])
  1264. #define LOAD_FIXED_STATE_15BPP(tbl,dev) \
  1265. for (i = 0; i < sizeof(tbl##Table##dev##_15BPP)/8; i++) \
  1266. NV_WR32(&chip->dev[tbl##Table##dev##_15BPP[i][0]], 0, tbl##Table##dev##_15BPP[i][1])
  1267. #define LOAD_FIXED_STATE_16BPP(tbl,dev) \
  1268. for (i = 0; i < sizeof(tbl##Table##dev##_16BPP)/8; i++) \
  1269. NV_WR32(&chip->dev[tbl##Table##dev##_16BPP[i][0]], 0, tbl##Table##dev##_16BPP[i][1])
  1270. #define LOAD_FIXED_STATE_32BPP(tbl,dev) \
  1271. for (i = 0; i < sizeof(tbl##Table##dev##_32BPP)/8; i++) \
  1272. NV_WR32(&chip->dev[tbl##Table##dev##_32BPP[i][0]], 0, tbl##Table##dev##_32BPP[i][1])
  1273. static void UpdateFifoState
  1274. (
  1275. RIVA_HW_INST *chip
  1276. )
  1277. {
  1278. int i;
  1279. switch (chip->Architecture)
  1280. {
  1281. case NV_ARCH_04:
  1282. LOAD_FIXED_STATE(nv4,FIFO);
  1283. chip->Tri03 = NULL;
  1284. chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1285. break;
  1286. case NV_ARCH_10:
  1287. case NV_ARCH_20:
  1288. case NV_ARCH_30:
  1289. /*
  1290. * Initialize state for the RivaTriangle3D05 routines.
  1291. */
  1292. LOAD_FIXED_STATE(nv10tri05,PGRAPH);
  1293. LOAD_FIXED_STATE(nv10,FIFO);
  1294. chip->Tri03 = NULL;
  1295. chip->Tri05 = (RivaTexturedTriangle05 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1296. break;
  1297. }
  1298. }
  1299. static void LoadStateExt
  1300. (
  1301. RIVA_HW_INST *chip,
  1302. RIVA_HW_STATE *state
  1303. )
  1304. {
  1305. int i;
  1306. /*
  1307. * Load HW fixed function state.
  1308. */
  1309. LOAD_FIXED_STATE(Riva,PMC);
  1310. LOAD_FIXED_STATE(Riva,PTIMER);
  1311. switch (chip->Architecture)
  1312. {
  1313. case NV_ARCH_03:
  1314. /*
  1315. * Make sure frame buffer config gets set before loading PRAMIN.
  1316. */
  1317. NV_WR32(chip->PFB, 0x00000200, state->config);
  1318. LOAD_FIXED_STATE(nv3,PFIFO);
  1319. LOAD_FIXED_STATE(nv3,PRAMIN);
  1320. LOAD_FIXED_STATE(nv3,PGRAPH);
  1321. switch (state->bpp)
  1322. {
  1323. case 15:
  1324. case 16:
  1325. LOAD_FIXED_STATE_15BPP(nv3,PRAMIN);
  1326. LOAD_FIXED_STATE_15BPP(nv3,PGRAPH);
  1327. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1328. break;
  1329. case 24:
  1330. case 32:
  1331. LOAD_FIXED_STATE_32BPP(nv3,PRAMIN);
  1332. LOAD_FIXED_STATE_32BPP(nv3,PGRAPH);
  1333. chip->Tri03 = NULL;
  1334. break;
  1335. case 8:
  1336. default:
  1337. LOAD_FIXED_STATE_8BPP(nv3,PRAMIN);
  1338. LOAD_FIXED_STATE_8BPP(nv3,PGRAPH);
  1339. chip->Tri03 = NULL;
  1340. break;
  1341. }
  1342. for (i = 0x00000; i < 0x00800; i++)
  1343. NV_WR32(&chip->PRAMIN[0x00000502 + i], 0, (i << 12) | 0x03);
  1344. NV_WR32(chip->PGRAPH, 0x00000630, state->offset0);
  1345. NV_WR32(chip->PGRAPH, 0x00000634, state->offset1);
  1346. NV_WR32(chip->PGRAPH, 0x00000638, state->offset2);
  1347. NV_WR32(chip->PGRAPH, 0x0000063C, state->offset3);
  1348. NV_WR32(chip->PGRAPH, 0x00000650, state->pitch0);
  1349. NV_WR32(chip->PGRAPH, 0x00000654, state->pitch1);
  1350. NV_WR32(chip->PGRAPH, 0x00000658, state->pitch2);
  1351. NV_WR32(chip->PGRAPH, 0x0000065C, state->pitch3);
  1352. break;
  1353. case NV_ARCH_04:
  1354. /*
  1355. * Make sure frame buffer config gets set before loading PRAMIN.
  1356. */
  1357. NV_WR32(chip->PFB, 0x00000200, state->config);
  1358. LOAD_FIXED_STATE(nv4,PFIFO);
  1359. LOAD_FIXED_STATE(nv4,PRAMIN);
  1360. LOAD_FIXED_STATE(nv4,PGRAPH);
  1361. switch (state->bpp)
  1362. {
  1363. case 15:
  1364. LOAD_FIXED_STATE_15BPP(nv4,PRAMIN);
  1365. LOAD_FIXED_STATE_15BPP(nv4,PGRAPH);
  1366. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1367. break;
  1368. case 16:
  1369. LOAD_FIXED_STATE_16BPP(nv4,PRAMIN);
  1370. LOAD_FIXED_STATE_16BPP(nv4,PGRAPH);
  1371. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1372. break;
  1373. case 24:
  1374. case 32:
  1375. LOAD_FIXED_STATE_32BPP(nv4,PRAMIN);
  1376. LOAD_FIXED_STATE_32BPP(nv4,PGRAPH);
  1377. chip->Tri03 = NULL;
  1378. break;
  1379. case 8:
  1380. default:
  1381. LOAD_FIXED_STATE_8BPP(nv4,PRAMIN);
  1382. LOAD_FIXED_STATE_8BPP(nv4,PGRAPH);
  1383. chip->Tri03 = NULL;
  1384. break;
  1385. }
  1386. NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
  1387. NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
  1388. NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
  1389. NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
  1390. NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
  1391. NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
  1392. NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
  1393. NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
  1394. break;
  1395. case NV_ARCH_10:
  1396. case NV_ARCH_20:
  1397. case NV_ARCH_30:
  1398. if(chip->twoHeads) {
  1399. VGA_WR08(chip->PCIO, 0x03D4, 0x44);
  1400. VGA_WR08(chip->PCIO, 0x03D5, state->crtcOwner);
  1401. chip->LockUnlock(chip, 0);
  1402. }
  1403. LOAD_FIXED_STATE(nv10,PFIFO);
  1404. LOAD_FIXED_STATE(nv10,PRAMIN);
  1405. LOAD_FIXED_STATE(nv10,PGRAPH);
  1406. switch (state->bpp)
  1407. {
  1408. case 15:
  1409. LOAD_FIXED_STATE_15BPP(nv10,PRAMIN);
  1410. LOAD_FIXED_STATE_15BPP(nv10,PGRAPH);
  1411. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1412. break;
  1413. case 16:
  1414. LOAD_FIXED_STATE_16BPP(nv10,PRAMIN);
  1415. LOAD_FIXED_STATE_16BPP(nv10,PGRAPH);
  1416. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  1417. break;
  1418. case 24:
  1419. case 32:
  1420. LOAD_FIXED_STATE_32BPP(nv10,PRAMIN);
  1421. LOAD_FIXED_STATE_32BPP(nv10,PGRAPH);
  1422. chip->Tri03 = NULL;
  1423. break;
  1424. case 8:
  1425. default:
  1426. LOAD_FIXED_STATE_8BPP(nv10,PRAMIN);
  1427. LOAD_FIXED_STATE_8BPP(nv10,PGRAPH);
  1428. chip->Tri03 = NULL;
  1429. break;
  1430. }
  1431. if(chip->Architecture == NV_ARCH_10) {
  1432. NV_WR32(chip->PGRAPH, 0x00000640, state->offset0);
  1433. NV_WR32(chip->PGRAPH, 0x00000644, state->offset1);
  1434. NV_WR32(chip->PGRAPH, 0x00000648, state->offset2);
  1435. NV_WR32(chip->PGRAPH, 0x0000064C, state->offset3);
  1436. NV_WR32(chip->PGRAPH, 0x00000670, state->pitch0);
  1437. NV_WR32(chip->PGRAPH, 0x00000674, state->pitch1);
  1438. NV_WR32(chip->PGRAPH, 0x00000678, state->pitch2);
  1439. NV_WR32(chip->PGRAPH, 0x0000067C, state->pitch3);
  1440. NV_WR32(chip->PGRAPH, 0x00000680, state->pitch3);
  1441. } else {
  1442. NV_WR32(chip->PGRAPH, 0x00000820, state->offset0);
  1443. NV_WR32(chip->PGRAPH, 0x00000824, state->offset1);
  1444. NV_WR32(chip->PGRAPH, 0x00000828, state->offset2);
  1445. NV_WR32(chip->PGRAPH, 0x0000082C, state->offset3);
  1446. NV_WR32(chip->PGRAPH, 0x00000850, state->pitch0);
  1447. NV_WR32(chip->PGRAPH, 0x00000854, state->pitch1);
  1448. NV_WR32(chip->PGRAPH, 0x00000858, state->pitch2);
  1449. NV_WR32(chip->PGRAPH, 0x0000085C, state->pitch3);
  1450. NV_WR32(chip->PGRAPH, 0x00000860, state->pitch3);
  1451. NV_WR32(chip->PGRAPH, 0x00000864, state->pitch3);
  1452. NV_WR32(chip->PGRAPH, 0x000009A4, NV_RD32(chip->PFB, 0x00000200));
  1453. NV_WR32(chip->PGRAPH, 0x000009A8, NV_RD32(chip->PFB, 0x00000204));
  1454. }
  1455. if(chip->twoHeads) {
  1456. NV_WR32(chip->PCRTC0, 0x00000860, state->head);
  1457. NV_WR32(chip->PCRTC0, 0x00002860, state->head2);
  1458. }
  1459. NV_WR32(chip->PRAMDAC, 0x00000404, NV_RD32(chip->PRAMDAC, 0x00000404) | (1 << 25));
  1460. NV_WR32(chip->PMC, 0x00008704, 1);
  1461. NV_WR32(chip->PMC, 0x00008140, 0);
  1462. NV_WR32(chip->PMC, 0x00008920, 0);
  1463. NV_WR32(chip->PMC, 0x00008924, 0);
  1464. NV_WR32(chip->PMC, 0x00008908, 0x01ffffff);
  1465. NV_WR32(chip->PMC, 0x0000890C, 0x01ffffff);
  1466. NV_WR32(chip->PMC, 0x00001588, 0);
  1467. NV_WR32(chip->PFB, 0x00000240, 0);
  1468. NV_WR32(chip->PFB, 0x00000250, 0);
  1469. NV_WR32(chip->PFB, 0x00000260, 0);
  1470. NV_WR32(chip->PFB, 0x00000270, 0);
  1471. NV_WR32(chip->PFB, 0x00000280, 0);
  1472. NV_WR32(chip->PFB, 0x00000290, 0);
  1473. NV_WR32(chip->PFB, 0x000002A0, 0);
  1474. NV_WR32(chip->PFB, 0x000002B0, 0);
  1475. NV_WR32(chip->PGRAPH, 0x00000B00, NV_RD32(chip->PFB, 0x00000240));
  1476. NV_WR32(chip->PGRAPH, 0x00000B04, NV_RD32(chip->PFB, 0x00000244));
  1477. NV_WR32(chip->PGRAPH, 0x00000B08, NV_RD32(chip->PFB, 0x00000248));
  1478. NV_WR32(chip->PGRAPH, 0x00000B0C, NV_RD32(chip->PFB, 0x0000024C));
  1479. NV_WR32(chip->PGRAPH, 0x00000B10, NV_RD32(chip->PFB, 0x00000250));
  1480. NV_WR32(chip->PGRAPH, 0x00000B14, NV_RD32(chip->PFB, 0x00000254));
  1481. NV_WR32(chip->PGRAPH, 0x00000B18, NV_RD32(chip->PFB, 0x00000258));
  1482. NV_WR32(chip->PGRAPH, 0x00000B1C, NV_RD32(chip->PFB, 0x0000025C));
  1483. NV_WR32(chip->PGRAPH, 0x00000B20, NV_RD32(chip->PFB, 0x00000260));
  1484. NV_WR32(chip->PGRAPH, 0x00000B24, NV_RD32(chip->PFB, 0x00000264));
  1485. NV_WR32(chip->PGRAPH, 0x00000B28, NV_RD32(chip->PFB, 0x00000268));
  1486. NV_WR32(chip->PGRAPH, 0x00000B2C, NV_RD32(chip->PFB, 0x0000026C));
  1487. NV_WR32(chip->PGRAPH, 0x00000B30, NV_RD32(chip->PFB, 0x00000270));
  1488. NV_WR32(chip->PGRAPH, 0x00000B34, NV_RD32(chip->PFB, 0x00000274));
  1489. NV_WR32(chip->PGRAPH, 0x00000B38, NV_RD32(chip->PFB, 0x00000278));
  1490. NV_WR32(chip->PGRAPH, 0x00000B3C, NV_RD32(chip->PFB, 0x0000027C));
  1491. NV_WR32(chip->PGRAPH, 0x00000B40, NV_RD32(chip->PFB, 0x00000280));
  1492. NV_WR32(chip->PGRAPH, 0x00000B44, NV_RD32(chip->PFB, 0x00000284));
  1493. NV_WR32(chip->PGRAPH, 0x00000B48, NV_RD32(chip->PFB, 0x00000288));
  1494. NV_WR32(chip->PGRAPH, 0x00000B4C, NV_RD32(chip->PFB, 0x0000028C));
  1495. NV_WR32(chip->PGRAPH, 0x00000B50, NV_RD32(chip->PFB, 0x00000290));
  1496. NV_WR32(chip->PGRAPH, 0x00000B54, NV_RD32(chip->PFB, 0x00000294));
  1497. NV_WR32(chip->PGRAPH, 0x00000B58, NV_RD32(chip->PFB, 0x00000298));
  1498. NV_WR32(chip->PGRAPH, 0x00000B5C, NV_RD32(chip->PFB, 0x0000029C));
  1499. NV_WR32(chip->PGRAPH, 0x00000B60, NV_RD32(chip->PFB, 0x000002A0));
  1500. NV_WR32(chip->PGRAPH, 0x00000B64, NV_RD32(chip->PFB, 0x000002A4));
  1501. NV_WR32(chip->PGRAPH, 0x00000B68, NV_RD32(chip->PFB, 0x000002A8));
  1502. NV_WR32(chip->PGRAPH, 0x00000B6C, NV_RD32(chip->PFB, 0x000002AC));
  1503. NV_WR32(chip->PGRAPH, 0x00000B70, NV_RD32(chip->PFB, 0x000002B0));
  1504. NV_WR32(chip->PGRAPH, 0x00000B74, NV_RD32(chip->PFB, 0x000002B4));
  1505. NV_WR32(chip->PGRAPH, 0x00000B78, NV_RD32(chip->PFB, 0x000002B8));
  1506. NV_WR32(chip->PGRAPH, 0x00000B7C, NV_RD32(chip->PFB, 0x000002BC));
  1507. NV_WR32(chip->PGRAPH, 0x00000F40, 0x10000000);
  1508. NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000000);
  1509. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
  1510. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000008);
  1511. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000200);
  1512. for (i = 0; i < (3*16); i++)
  1513. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1514. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
  1515. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1516. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000800);
  1517. for (i = 0; i < (16*16); i++)
  1518. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1519. NV_WR32(chip->PGRAPH, 0x00000F40, 0x30000000);
  1520. NV_WR32(chip->PGRAPH, 0x00000F44, 0x00000004);
  1521. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006400);
  1522. for (i = 0; i < (59*4); i++)
  1523. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1524. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006800);
  1525. for (i = 0; i < (47*4); i++)
  1526. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1527. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00006C00);
  1528. for (i = 0; i < (3*4); i++)
  1529. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1530. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007000);
  1531. for (i = 0; i < (19*4); i++)
  1532. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1533. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007400);
  1534. for (i = 0; i < (12*4); i++)
  1535. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1536. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00007800);
  1537. for (i = 0; i < (12*4); i++)
  1538. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1539. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00004400);
  1540. for (i = 0; i < (8*4); i++)
  1541. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1542. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000000);
  1543. for (i = 0; i < 16; i++)
  1544. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1545. NV_WR32(chip->PGRAPH, 0x00000F50, 0x00000040);
  1546. for (i = 0; i < 4; i++)
  1547. NV_WR32(chip->PGRAPH, 0x00000F54, 0x00000000);
  1548. NV_WR32(chip->PCRTC, 0x00000810, state->cursorConfig);
  1549. if(chip->flatPanel) {
  1550. if((chip->Chipset & 0x0ff0) == 0x0110) {
  1551. NV_WR32(chip->PRAMDAC, 0x0528, state->dither);
  1552. } else
  1553. if((chip->Chipset & 0x0ff0) >= 0x0170) {
  1554. NV_WR32(chip->PRAMDAC, 0x083C, state->dither);
  1555. }
  1556. VGA_WR08(chip->PCIO, 0x03D4, 0x53);
  1557. VGA_WR08(chip->PCIO, 0x03D5, 0);
  1558. VGA_WR08(chip->PCIO, 0x03D4, 0x54);
  1559. VGA_WR08(chip->PCIO, 0x03D5, 0);
  1560. VGA_WR08(chip->PCIO, 0x03D4, 0x21);
  1561. VGA_WR08(chip->PCIO, 0x03D5, 0xfa);
  1562. }
  1563. VGA_WR08(chip->PCIO, 0x03D4, 0x41);
  1564. VGA_WR08(chip->PCIO, 0x03D5, state->extra);
  1565. }
  1566. LOAD_FIXED_STATE(Riva,FIFO);
  1567. UpdateFifoState(chip);
  1568. /*
  1569. * Load HW mode state.
  1570. */
  1571. VGA_WR08(chip->PCIO, 0x03D4, 0x19);
  1572. VGA_WR08(chip->PCIO, 0x03D5, state->repaint0);
  1573. VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
  1574. VGA_WR08(chip->PCIO, 0x03D5, state->repaint1);
  1575. VGA_WR08(chip->PCIO, 0x03D4, 0x25);
  1576. VGA_WR08(chip->PCIO, 0x03D5, state->screen);
  1577. VGA_WR08(chip->PCIO, 0x03D4, 0x28);
  1578. VGA_WR08(chip->PCIO, 0x03D5, state->pixel);
  1579. VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
  1580. VGA_WR08(chip->PCIO, 0x03D5, state->horiz);
  1581. VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
  1582. VGA_WR08(chip->PCIO, 0x03D5, state->arbitration0);
  1583. VGA_WR08(chip->PCIO, 0x03D4, 0x20);
  1584. VGA_WR08(chip->PCIO, 0x03D5, state->arbitration1);
  1585. VGA_WR08(chip->PCIO, 0x03D4, 0x30);
  1586. VGA_WR08(chip->PCIO, 0x03D5, state->cursor0);
  1587. VGA_WR08(chip->PCIO, 0x03D4, 0x31);
  1588. VGA_WR08(chip->PCIO, 0x03D5, state->cursor1);
  1589. VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
  1590. VGA_WR08(chip->PCIO, 0x03D5, state->cursor2);
  1591. VGA_WR08(chip->PCIO, 0x03D4, 0x39);
  1592. VGA_WR08(chip->PCIO, 0x03D5, state->interlace);
  1593. if(!chip->flatPanel) {
  1594. NV_WR32(chip->PRAMDAC0, 0x00000508, state->vpll);
  1595. NV_WR32(chip->PRAMDAC0, 0x0000050C, state->pllsel);
  1596. if(chip->twoHeads)
  1597. NV_WR32(chip->PRAMDAC0, 0x00000520, state->vpll2);
  1598. } else {
  1599. NV_WR32(chip->PRAMDAC, 0x00000848 , state->scale);
  1600. }
  1601. NV_WR32(chip->PRAMDAC, 0x00000600 , state->general);
  1602. /*
  1603. * Turn off VBlank enable and reset.
  1604. */
  1605. NV_WR32(chip->PCRTC, 0x00000140, 0);
  1606. NV_WR32(chip->PCRTC, 0x00000100, chip->VBlankBit);
  1607. /*
  1608. * Set interrupt enable.
  1609. */
  1610. NV_WR32(chip->PMC, 0x00000140, chip->EnableIRQ & 0x01);
  1611. /*
  1612. * Set current state pointer.
  1613. */
  1614. chip->CurrentState = state;
  1615. /*
  1616. * Reset FIFO free and empty counts.
  1617. */
  1618. chip->FifoFreeCount = 0;
  1619. /* Free count from first subchannel */
  1620. chip->FifoEmptyCount = NV_RD32(&chip->Rop->FifoFree, 0);
  1621. }
  1622. static void UnloadStateExt
  1623. (
  1624. RIVA_HW_INST *chip,
  1625. RIVA_HW_STATE *state
  1626. )
  1627. {
  1628. /*
  1629. * Save current HW state.
  1630. */
  1631. VGA_WR08(chip->PCIO, 0x03D4, 0x19);
  1632. state->repaint0 = VGA_RD08(chip->PCIO, 0x03D5);
  1633. VGA_WR08(chip->PCIO, 0x03D4, 0x1A);
  1634. state->repaint1 = VGA_RD08(chip->PCIO, 0x03D5);
  1635. VGA_WR08(chip->PCIO, 0x03D4, 0x25);
  1636. state->screen = VGA_RD08(chip->PCIO, 0x03D5);
  1637. VGA_WR08(chip->PCIO, 0x03D4, 0x28);
  1638. state->pixel = VGA_RD08(chip->PCIO, 0x03D5);
  1639. VGA_WR08(chip->PCIO, 0x03D4, 0x2D);
  1640. state->horiz = VGA_RD08(chip->PCIO, 0x03D5);
  1641. VGA_WR08(chip->PCIO, 0x03D4, 0x1B);
  1642. state->arbitration0 = VGA_RD08(chip->PCIO, 0x03D5);
  1643. VGA_WR08(chip->PCIO, 0x03D4, 0x20);
  1644. state->arbitration1 = VGA_RD08(chip->PCIO, 0x03D5);
  1645. VGA_WR08(chip->PCIO, 0x03D4, 0x30);
  1646. state->cursor0 = VGA_RD08(chip->PCIO, 0x03D5);
  1647. VGA_WR08(chip->PCIO, 0x03D4, 0x31);
  1648. state->cursor1 = VGA_RD08(chip->PCIO, 0x03D5);
  1649. VGA_WR08(chip->PCIO, 0x03D4, 0x2F);
  1650. state->cursor2 = VGA_RD08(chip->PCIO, 0x03D5);
  1651. VGA_WR08(chip->PCIO, 0x03D4, 0x39);
  1652. state->interlace = VGA_RD08(chip->PCIO, 0x03D5);
  1653. state->vpll = NV_RD32(chip->PRAMDAC0, 0x00000508);
  1654. state->vpll2 = NV_RD32(chip->PRAMDAC0, 0x00000520);
  1655. state->pllsel = NV_RD32(chip->PRAMDAC0, 0x0000050C);
  1656. state->general = NV_RD32(chip->PRAMDAC, 0x00000600);
  1657. state->scale = NV_RD32(chip->PRAMDAC, 0x00000848);
  1658. state->config = NV_RD32(chip->PFB, 0x00000200);
  1659. switch (chip->Architecture)
  1660. {
  1661. case NV_ARCH_03:
  1662. state->offset0 = NV_RD32(chip->PGRAPH, 0x00000630);
  1663. state->offset1 = NV_RD32(chip->PGRAPH, 0x00000634);
  1664. state->offset2 = NV_RD32(chip->PGRAPH, 0x00000638);
  1665. state->offset3 = NV_RD32(chip->PGRAPH, 0x0000063C);
  1666. state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000650);
  1667. state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000654);
  1668. state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000658);
  1669. state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000065C);
  1670. break;
  1671. case NV_ARCH_04:
  1672. state->offset0 = NV_RD32(chip->PGRAPH, 0x00000640);
  1673. state->offset1 = NV_RD32(chip->PGRAPH, 0x00000644);
  1674. state->offset2 = NV_RD32(chip->PGRAPH, 0x00000648);
  1675. state->offset3 = NV_RD32(chip->PGRAPH, 0x0000064C);
  1676. state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000670);
  1677. state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000674);
  1678. state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000678);
  1679. state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000067C);
  1680. break;
  1681. case NV_ARCH_10:
  1682. case NV_ARCH_20:
  1683. case NV_ARCH_30:
  1684. state->offset0 = NV_RD32(chip->PGRAPH, 0x00000640);
  1685. state->offset1 = NV_RD32(chip->PGRAPH, 0x00000644);
  1686. state->offset2 = NV_RD32(chip->PGRAPH, 0x00000648);
  1687. state->offset3 = NV_RD32(chip->PGRAPH, 0x0000064C);
  1688. state->pitch0 = NV_RD32(chip->PGRAPH, 0x00000670);
  1689. state->pitch1 = NV_RD32(chip->PGRAPH, 0x00000674);
  1690. state->pitch2 = NV_RD32(chip->PGRAPH, 0x00000678);
  1691. state->pitch3 = NV_RD32(chip->PGRAPH, 0x0000067C);
  1692. if(chip->twoHeads) {
  1693. state->head = NV_RD32(chip->PCRTC0, 0x00000860);
  1694. state->head2 = NV_RD32(chip->PCRTC0, 0x00002860);
  1695. VGA_WR08(chip->PCIO, 0x03D4, 0x44);
  1696. state->crtcOwner = VGA_RD08(chip->PCIO, 0x03D5);
  1697. }
  1698. VGA_WR08(chip->PCIO, 0x03D4, 0x41);
  1699. state->extra = VGA_RD08(chip->PCIO, 0x03D5);
  1700. state->cursorConfig = NV_RD32(chip->PCRTC, 0x00000810);
  1701. if((chip->Chipset & 0x0ff0) == 0x0110) {
  1702. state->dither = NV_RD32(chip->PRAMDAC, 0x0528);
  1703. } else
  1704. if((chip->Chipset & 0x0ff0) >= 0x0170) {
  1705. state->dither = NV_RD32(chip->PRAMDAC, 0x083C);
  1706. }
  1707. break;
  1708. }
  1709. }
  1710. static void SetStartAddress
  1711. (
  1712. RIVA_HW_INST *chip,
  1713. unsigned start
  1714. )
  1715. {
  1716. NV_WR32(chip->PCRTC, 0x800, start);
  1717. }
  1718. static void SetStartAddress3
  1719. (
  1720. RIVA_HW_INST *chip,
  1721. unsigned start
  1722. )
  1723. {
  1724. int offset = start >> 2;
  1725. int pan = (start & 3) << 1;
  1726. unsigned char tmp;
  1727. /*
  1728. * Unlock extended registers.
  1729. */
  1730. chip->LockUnlock(chip, 0);
  1731. /*
  1732. * Set start address.
  1733. */
  1734. VGA_WR08(chip->PCIO, 0x3D4, 0x0D); VGA_WR08(chip->PCIO, 0x3D5, offset);
  1735. offset >>= 8;
  1736. VGA_WR08(chip->PCIO, 0x3D4, 0x0C); VGA_WR08(chip->PCIO, 0x3D5, offset);
  1737. offset >>= 8;
  1738. VGA_WR08(chip->PCIO, 0x3D4, 0x19); tmp = VGA_RD08(chip->PCIO, 0x3D5);
  1739. VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x01F) | (tmp & ~0x1F));
  1740. VGA_WR08(chip->PCIO, 0x3D4, 0x2D); tmp = VGA_RD08(chip->PCIO, 0x3D5);
  1741. VGA_WR08(chip->PCIO, 0x3D5, (offset & 0x60) | (tmp & ~0x60));
  1742. /*
  1743. * 4 pixel pan register.
  1744. */
  1745. offset = VGA_RD08(chip->PCIO, chip->IO + 0x0A);
  1746. VGA_WR08(chip->PCIO, 0x3C0, 0x13);
  1747. VGA_WR08(chip->PCIO, 0x3C0, pan);
  1748. }
  1749. static void nv3SetSurfaces2D
  1750. (
  1751. RIVA_HW_INST *chip,
  1752. unsigned surf0,
  1753. unsigned surf1
  1754. )
  1755. {
  1756. RivaSurface __iomem *Surface =
  1757. (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
  1758. RIVA_FIFO_FREE(*chip,Tri03,5);
  1759. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
  1760. NV_WR32(&Surface->Offset, 0, surf0);
  1761. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
  1762. NV_WR32(&Surface->Offset, 0, surf1);
  1763. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
  1764. }
  1765. static void nv4SetSurfaces2D
  1766. (
  1767. RIVA_HW_INST *chip,
  1768. unsigned surf0,
  1769. unsigned surf1
  1770. )
  1771. {
  1772. RivaSurface __iomem *Surface =
  1773. (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
  1774. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
  1775. NV_WR32(&Surface->Offset, 0, surf0);
  1776. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
  1777. NV_WR32(&Surface->Offset, 0, surf1);
  1778. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
  1779. }
  1780. static void nv10SetSurfaces2D
  1781. (
  1782. RIVA_HW_INST *chip,
  1783. unsigned surf0,
  1784. unsigned surf1
  1785. )
  1786. {
  1787. RivaSurface __iomem *Surface =
  1788. (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
  1789. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000003);
  1790. NV_WR32(&Surface->Offset, 0, surf0);
  1791. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000004);
  1792. NV_WR32(&Surface->Offset, 0, surf1);
  1793. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
  1794. }
  1795. static void nv3SetSurfaces3D
  1796. (
  1797. RIVA_HW_INST *chip,
  1798. unsigned surf0,
  1799. unsigned surf1
  1800. )
  1801. {
  1802. RivaSurface __iomem *Surface =
  1803. (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
  1804. RIVA_FIFO_FREE(*chip,Tri03,5);
  1805. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
  1806. NV_WR32(&Surface->Offset, 0, surf0);
  1807. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
  1808. NV_WR32(&Surface->Offset, 0, surf1);
  1809. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000013);
  1810. }
  1811. static void nv4SetSurfaces3D
  1812. (
  1813. RIVA_HW_INST *chip,
  1814. unsigned surf0,
  1815. unsigned surf1
  1816. )
  1817. {
  1818. RivaSurface __iomem *Surface =
  1819. (RivaSurface __iomem *)&(chip->FIFO[0x0000E000/4]);
  1820. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000005);
  1821. NV_WR32(&Surface->Offset, 0, surf0);
  1822. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000006);
  1823. NV_WR32(&Surface->Offset, 0, surf1);
  1824. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
  1825. }
  1826. static void nv10SetSurfaces3D
  1827. (
  1828. RIVA_HW_INST *chip,
  1829. unsigned surf0,
  1830. unsigned surf1
  1831. )
  1832. {
  1833. RivaSurface3D __iomem *Surfaces3D =
  1834. (RivaSurface3D __iomem *)&(chip->FIFO[0x0000E000/4]);
  1835. RIVA_FIFO_FREE(*chip,Tri03,4);
  1836. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000007);
  1837. NV_WR32(&Surfaces3D->RenderBufferOffset, 0, surf0);
  1838. NV_WR32(&Surfaces3D->ZBufferOffset, 0, surf1);
  1839. NV_WR32(&chip->FIFO[0x00003800], 0, 0x80000014);
  1840. }
  1841. /****************************************************************************\
  1842. * *
  1843. * Probe RIVA Chip Configuration *
  1844. * *
  1845. \****************************************************************************/
  1846. static void nv3GetConfig
  1847. (
  1848. RIVA_HW_INST *chip
  1849. )
  1850. {
  1851. /*
  1852. * Fill in chip configuration.
  1853. */
  1854. if (NV_RD32(&chip->PFB[0x00000000/4], 0) & 0x00000020)
  1855. {
  1856. if (((NV_RD32(chip->PMC, 0x00000000) & 0xF0) == 0x20)
  1857. && ((NV_RD32(chip->PMC, 0x00000000) & 0x0F) >= 0x02))
  1858. {
  1859. /*
  1860. * SDRAM 128 ZX.
  1861. */
  1862. chip->RamBandwidthKBytesPerSec = 800000;
  1863. switch (NV_RD32(chip->PFB, 0x00000000) & 0x03)
  1864. {
  1865. case 2:
  1866. chip->RamAmountKBytes = 1024 * 4;
  1867. break;
  1868. case 1:
  1869. chip->RamAmountKBytes = 1024 * 2;
  1870. break;
  1871. default:
  1872. chip->RamAmountKBytes = 1024 * 8;
  1873. break;
  1874. }
  1875. }
  1876. else
  1877. {
  1878. chip->RamBandwidthKBytesPerSec = 1000000;
  1879. chip->RamAmountKBytes = 1024 * 8;
  1880. }
  1881. }
  1882. else
  1883. {
  1884. /*
  1885. * SGRAM 128.
  1886. */
  1887. chip->RamBandwidthKBytesPerSec = 1000000;
  1888. switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
  1889. {
  1890. case 0:
  1891. chip->RamAmountKBytes = 1024 * 8;
  1892. break;
  1893. case 2:
  1894. chip->RamAmountKBytes = 1024 * 4;
  1895. break;
  1896. default:
  1897. chip->RamAmountKBytes = 1024 * 2;
  1898. break;
  1899. }
  1900. }
  1901. chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
  1902. chip->CURSOR = &(chip->PRAMIN[0x00008000/4 - 0x0800/4]);
  1903. chip->VBlankBit = 0x00000100;
  1904. chip->MaxVClockFreqKHz = 256000;
  1905. /*
  1906. * Set chip functions.
  1907. */
  1908. chip->Busy = nv3Busy;
  1909. chip->ShowHideCursor = ShowHideCursor;
  1910. chip->LoadStateExt = LoadStateExt;
  1911. chip->UnloadStateExt = UnloadStateExt;
  1912. chip->SetStartAddress = SetStartAddress3;
  1913. chip->SetSurfaces2D = nv3SetSurfaces2D;
  1914. chip->SetSurfaces3D = nv3SetSurfaces3D;
  1915. chip->LockUnlock = nv3LockUnlock;
  1916. }
  1917. static void nv4GetConfig
  1918. (
  1919. RIVA_HW_INST *chip
  1920. )
  1921. {
  1922. /*
  1923. * Fill in chip configuration.
  1924. */
  1925. if (NV_RD32(chip->PFB, 0x00000000) & 0x00000100)
  1926. {
  1927. chip->RamAmountKBytes = ((NV_RD32(chip->PFB, 0x00000000) >> 12) & 0x0F) * 1024 * 2
  1928. + 1024 * 2;
  1929. }
  1930. else
  1931. {
  1932. switch (NV_RD32(chip->PFB, 0x00000000) & 0x00000003)
  1933. {
  1934. case 0:
  1935. chip->RamAmountKBytes = 1024 * 32;
  1936. break;
  1937. case 1:
  1938. chip->RamAmountKBytes = 1024 * 4;
  1939. break;
  1940. case 2:
  1941. chip->RamAmountKBytes = 1024 * 8;
  1942. break;
  1943. case 3:
  1944. default:
  1945. chip->RamAmountKBytes = 1024 * 16;
  1946. break;
  1947. }
  1948. }
  1949. switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
  1950. {
  1951. case 3:
  1952. chip->RamBandwidthKBytesPerSec = 800000;
  1953. break;
  1954. default:
  1955. chip->RamBandwidthKBytesPerSec = 1000000;
  1956. break;
  1957. }
  1958. chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x00000000) & 0x00000040) ? 14318 : 13500;
  1959. chip->CURSOR = &(chip->PRAMIN[0x00010000/4 - 0x0800/4]);
  1960. chip->VBlankBit = 0x00000001;
  1961. chip->MaxVClockFreqKHz = 350000;
  1962. /*
  1963. * Set chip functions.
  1964. */
  1965. chip->Busy = nv4Busy;
  1966. chip->ShowHideCursor = ShowHideCursor;
  1967. chip->LoadStateExt = LoadStateExt;
  1968. chip->UnloadStateExt = UnloadStateExt;
  1969. chip->SetStartAddress = SetStartAddress;
  1970. chip->SetSurfaces2D = nv4SetSurfaces2D;
  1971. chip->SetSurfaces3D = nv4SetSurfaces3D;
  1972. chip->LockUnlock = nv4LockUnlock;
  1973. }
  1974. static void nv10GetConfig
  1975. (
  1976. RIVA_HW_INST *chip,
  1977. struct pci_dev *pdev,
  1978. unsigned int chipset
  1979. )
  1980. {
  1981. struct pci_dev* dev;
  1982. int domain = pci_domain_nr(pdev->bus);
  1983. u32 amt;
  1984. #ifdef __BIG_ENDIAN
  1985. /* turn on big endian register access */
  1986. if(!(NV_RD32(chip->PMC, 0x00000004) & 0x01000001))
  1987. NV_WR32(chip->PMC, 0x00000004, 0x01000001);
  1988. #endif
  1989. /*
  1990. * Fill in chip configuration.
  1991. */
  1992. if(chipset == NV_CHIP_IGEFORCE2) {
  1993. dev = pci_get_domain_bus_and_slot(domain, 0, 1);
  1994. pci_read_config_dword(dev, 0x7C, &amt);
  1995. pci_dev_put(dev);
  1996. chip->RamAmountKBytes = (((amt >> 6) & 31) + 1) * 1024;
  1997. } else if(chipset == NV_CHIP_0x01F0) {
  1998. dev = pci_get_domain_bus_and_slot(domain, 0, 1);
  1999. pci_read_config_dword(dev, 0x84, &amt);
  2000. pci_dev_put(dev);
  2001. chip->RamAmountKBytes = (((amt >> 4) & 127) + 1) * 1024;
  2002. } else {
  2003. switch ((NV_RD32(chip->PFB, 0x0000020C) >> 20) & 0x000000FF)
  2004. {
  2005. case 0x02:
  2006. chip->RamAmountKBytes = 1024 * 2;
  2007. break;
  2008. case 0x04:
  2009. chip->RamAmountKBytes = 1024 * 4;
  2010. break;
  2011. case 0x08:
  2012. chip->RamAmountKBytes = 1024 * 8;
  2013. break;
  2014. case 0x10:
  2015. chip->RamAmountKBytes = 1024 * 16;
  2016. break;
  2017. case 0x20:
  2018. chip->RamAmountKBytes = 1024 * 32;
  2019. break;
  2020. case 0x40:
  2021. chip->RamAmountKBytes = 1024 * 64;
  2022. break;
  2023. case 0x80:
  2024. chip->RamAmountKBytes = 1024 * 128;
  2025. break;
  2026. default:
  2027. chip->RamAmountKBytes = 1024 * 16;
  2028. break;
  2029. }
  2030. }
  2031. switch ((NV_RD32(chip->PFB, 0x00000000) >> 3) & 0x00000003)
  2032. {
  2033. case 3:
  2034. chip->RamBandwidthKBytesPerSec = 800000;
  2035. break;
  2036. default:
  2037. chip->RamBandwidthKBytesPerSec = 1000000;
  2038. break;
  2039. }
  2040. chip->CrystalFreqKHz = (NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 6)) ?
  2041. 14318 : 13500;
  2042. switch (chipset & 0x0ff0) {
  2043. case 0x0170:
  2044. case 0x0180:
  2045. case 0x01F0:
  2046. case 0x0250:
  2047. case 0x0280:
  2048. case 0x0300:
  2049. case 0x0310:
  2050. case 0x0320:
  2051. case 0x0330:
  2052. case 0x0340:
  2053. if(NV_RD32(chip->PEXTDEV, 0x0000) & (1 << 22))
  2054. chip->CrystalFreqKHz = 27000;
  2055. break;
  2056. default:
  2057. break;
  2058. }
  2059. chip->CursorStart = (chip->RamAmountKBytes - 128) * 1024;
  2060. chip->CURSOR = NULL; /* can't set this here */
  2061. chip->VBlankBit = 0x00000001;
  2062. chip->MaxVClockFreqKHz = 350000;
  2063. /*
  2064. * Set chip functions.
  2065. */
  2066. chip->Busy = nv10Busy;
  2067. chip->ShowHideCursor = ShowHideCursor;
  2068. chip->LoadStateExt = LoadStateExt;
  2069. chip->UnloadStateExt = UnloadStateExt;
  2070. chip->SetStartAddress = SetStartAddress;
  2071. chip->SetSurfaces2D = nv10SetSurfaces2D;
  2072. chip->SetSurfaces3D = nv10SetSurfaces3D;
  2073. chip->LockUnlock = nv4LockUnlock;
  2074. switch(chipset & 0x0ff0) {
  2075. case 0x0110:
  2076. case 0x0170:
  2077. case 0x0180:
  2078. case 0x01F0:
  2079. case 0x0250:
  2080. case 0x0280:
  2081. case 0x0300:
  2082. case 0x0310:
  2083. case 0x0320:
  2084. case 0x0330:
  2085. case 0x0340:
  2086. chip->twoHeads = TRUE;
  2087. break;
  2088. default:
  2089. chip->twoHeads = FALSE;
  2090. break;
  2091. }
  2092. }
  2093. int RivaGetConfig
  2094. (
  2095. RIVA_HW_INST *chip,
  2096. struct pci_dev *pdev,
  2097. unsigned int chipset
  2098. )
  2099. {
  2100. /*
  2101. * Save this so future SW know whats it's dealing with.
  2102. */
  2103. chip->Version = RIVA_SW_VERSION;
  2104. /*
  2105. * Chip specific configuration.
  2106. */
  2107. switch (chip->Architecture)
  2108. {
  2109. case NV_ARCH_03:
  2110. nv3GetConfig(chip);
  2111. break;
  2112. case NV_ARCH_04:
  2113. nv4GetConfig(chip);
  2114. break;
  2115. case NV_ARCH_10:
  2116. case NV_ARCH_20:
  2117. case NV_ARCH_30:
  2118. nv10GetConfig(chip, pdev, chipset);
  2119. break;
  2120. default:
  2121. return (-1);
  2122. }
  2123. chip->Chipset = chipset;
  2124. /*
  2125. * Fill in FIFO pointers.
  2126. */
  2127. chip->Rop = (RivaRop __iomem *)&(chip->FIFO[0x00000000/4]);
  2128. chip->Clip = (RivaClip __iomem *)&(chip->FIFO[0x00002000/4]);
  2129. chip->Patt = (RivaPattern __iomem *)&(chip->FIFO[0x00004000/4]);
  2130. chip->Pixmap = (RivaPixmap __iomem *)&(chip->FIFO[0x00006000/4]);
  2131. chip->Blt = (RivaScreenBlt __iomem *)&(chip->FIFO[0x00008000/4]);
  2132. chip->Bitmap = (RivaBitmap __iomem *)&(chip->FIFO[0x0000A000/4]);
  2133. chip->Line = (RivaLine __iomem *)&(chip->FIFO[0x0000C000/4]);
  2134. chip->Tri03 = (RivaTexturedTriangle03 __iomem *)&(chip->FIFO[0x0000E000/4]);
  2135. return (0);
  2136. }