1 /* 2 * CDDL HEADER START 3 * 4 * The contents of this file are subject to the terms of the 5 * Common Development and Distribution License, Version 1.0 only 6 * (the "License"). You may not use this file except in compliance 7 * with the License. 8 * 9 * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 10 * or http://www.opensolaris.org/os/licensing. 11 * See the License for the specific language governing permissions 12 * and limitations under the License. 13 * 14 * When distributing Covered Code, include this CDDL HEADER in each 15 * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 16 * If applicable, add the following below this CDDL HEADER, with the 17 * fields enclosed by brackets "[]" replaced with your own identifying 18 * information: Portions Copyright [yyyy] [name of copyright owner] 19 * 20 * CDDL HEADER END 21 */ 22 /* 23 * Copyright 2007 Sun Microsystems, Inc. All rights reserved. 24 * Use is subject to license terms. 25 * 26 * Assembly code support for the jalapeno module 27 */ 28 29 #pragma ident "%Z%%M% %I% %E% SMI" 30 31 #if !defined(lint) 32 #include "assym.h" 33 #endif /* lint */ 34 35 #include <sys/asm_linkage.h> 36 #include <sys/mmu.h> 37 #include <vm/hat_sfmmu.h> 38 #include <sys/machparam.h> 39 #include <sys/machcpuvar.h> 40 #include <sys/machthread.h> 41 #include <sys/machtrap.h> 42 #include <sys/privregs.h> 43 #include <sys/asm_linkage.h> 44 #include <sys/trap.h> 45 #include <sys/cheetahregs.h> 46 #include <sys/us3_module.h> 47 #include <sys/xc_impl.h> 48 #include <sys/intreg.h> 49 #include <sys/async.h> 50 #include <sys/clock.h> 51 #include <sys/cheetahasm.h> 52 53 #ifdef TRAPTRACE 54 #include <sys/traptrace.h> 55 #endif /* TRAPTRACE */ 56 57 #if !defined(lint) 58 59 /* BEGIN CSTYLED */ 60 61 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 62 63 #define CHK_JP_ERRATA85_ENABLED(scr, label) \ 64 ASM_LD(scr, jp_errata_85_active); \ 65 cmp scr, 1; \ 66 bne %icc, label; \ 67 nop 68 69 #define SET_64BIT_PA(dest, scr, hi32, lo32) \ 70 set hi32, scr; \ 71 sllx scr, 32, scr; \ 72 sethi %hi(lo32), dest; \ 73 or dest, %lo(lo32), dest; \ 74 or scr, dest, dest 75 76 /* 77 * Macro to trigger Jalapeno/Tomatillo speed change 78 * j_chng_pa - scratch register 79 * scr - scratch register 80 */ 81 #define JP_ESTAR_TRIGGER(j_chng_pa, scr) \ 82 SET_64BIT_PA(j_chng_pa, scr, TOM_HIGH_PA, M_T_J_CHNG_INIT_PA); \ 83 ldxa [j_chng_pa]ASI_IO, scr; \ 84 5: \ 85 and scr, TOM_TRIGGER_MASK, scr; \ 86 cmp scr, TOM_TRIGGER; \ 87 be,pt %icc, 5b; /* wait while 10 */ \ 88 ldxa [j_chng_pa]ASI_IO, scr; \ 89 andn scr, TOM_TRIGGER_MASK, scr; \ 90 stxa scr, [j_chng_pa]ASI_IO; /* clear j_chng[1:0] */ \ 91 or scr, TOM_TRIGGER, scr; \ 92 stxa scr, [j_chng_pa]ASI_IO; /* trigger j_chng */ \ 93 ldxa [j_chng_pa]ASI_IO, scr; \ 94 6: \ 95 and scr, TOM_TRIGGER_MASK, scr; \ 96 cmp scr, TOM_TRIGGER; \ 97 be,pt %icc, 6b; /* wait while 10 */ \ 98 ldxa [j_chng_pa]ASI_IO, scr; \ 99 andn scr, TOM_TRIGGER_MASK, scr; \ 100 stxa scr, [j_chng_pa]ASI_IO; /* deassert j_chng */ 101 102 /* 103 * Macro to set Jalapeno CPU speed 104 * speed - new speed constant 105 * scr1 - scratch register 106 * scr2 - scratch register 107 */ 108 #define SET_JP_SPEED(speed, scr1, scr2) \ 109 ldxa [%g0]ASI_JBUS_CONFIG, scr1; \ 110 set JBUS_CONFIG_ECLK_MASK, scr2; \ 111 andn scr1, scr2, scr1; \ 112 set speed, scr2; \ 113 or scr1, scr2, scr1; \ 114 stxa scr1, [%g0]ASI_JBUS_CONFIG; 115 116 /* 117 * macro to set Master Tomatillo speed 118 * speed - tomatillo speed constant 119 * tpa - tomatillo estar control register PA 120 * scr - scratch register 121 */ 122 #define SET_TOM_SPEED(speed, tpa, scr) \ 123 ldxa [tpa]ASI_IO, scr; \ 124 andn scr, TOM_ESTAR_ELCK_MASK, scr; \ 125 or scr, speed, scr; \ 126 stxa scr, [tpa]ASI_IO; 127 128 /* 129 * macro to check and set Slave Tomatillo speed 130 * speed - tomatillo speed constant 131 * scr1 - scratch register 132 * scr2 - scratch register 133 */ 134 135 #define SET_SLAVE_T_SPEED(speed, scr1, scr2) \ 136 ldxa [%g0]ASI_JBUS_CONFIG, scr2; \ 137 srlx scr2, JBUS_SLAVE_T_PORT_BIT, scr2; \ 138 btst 1, scr2; \ 139 bz,pt %icc, 4f; \ 140 nop; \ 141 SET_64BIT_PA(scr1, scr2, TOM_HIGH_PA, S_T_ESTAR_CTRL_PA); \ 142 SET_TOM_SPEED(speed, scr1, scr2); \ 143 4: 144 145 146 /* 147 * macro to adjust ASI_MCU_CTL_REG1[26:25] fsm bits according to 148 * new cpu speed: fsm[1:0]=11b for full speed, fsm[1:0]=0 for estar speed 149 * value - fsm bit value constant 150 * scr1 - scratch register 151 * scr2 - scratch register 152 */ 153 #define JP_ADJUST_FSM(value, scr1, scr2) \ 154 ldxa [%g0]ASI_MCU_CTRL, scr1; \ 155 set JP_MCU_FSM_MASK, scr2; \ 156 andn scr1, scr2, scr1; \ 157 set value, scr2; \ 158 or scr1, scr2, scr1; \ 159 stxa scr1, [%g0]ASI_MCU_CTRL; \ 160 membar #Sync; 161 162 /* 163 * JP_FORCE_FULL_SPEED and its fellow macros are for Jalapeno 164 * workstation to work around Errata 85. The front portion of 165 * it packs JP speed(14..13) and Tomatillo speed(5..0) into one 166 * register. 167 * 168 * Current code assumes that these two fields are non-overlapping. 169 * If that assumption changes, then this code won't work. If so, we 170 * force a compile time error by not defining the JP_FORCE_FULL_SPEED 171 * and JP_RESTORE_SPEED macros below. 172 */ 173 174 #if !(JBUS_CONFIG_ECLK_MASK & TOM_SPEED_MASK) 175 176 /* 177 * Macro to force Jalapeno/Tomatillo to full speed 178 * old_lvl - register used to save original cpu, tomatillo speed 179 * scr2 - scratch register 180 * scr3 - scratch register 181 * scr4 - scratch register 182 */ 183 #define JP_FORCE_FULL_SPEED(old_lvl, scr2, scr3, scr4) \ 184 ldxa [%g0]ASI_JBUS_CONFIG, old_lvl; \ 185 set JBUS_CONFIG_ECLK_MASK, scr4; \ 186 and old_lvl, scr4, old_lvl; \ 187 SET_64BIT_PA(scr2, scr3, TOM_HIGH_PA, M_T_ESTAR_CTRL_PA); \ 188 ldxa [scr2]ASI_IO, scr3; \ 189 set TOM_ESTAR_ELCK_MASK, scr4; \ 190 and scr3, scr4, scr3; \ 191 or old_lvl, scr3, old_lvl; \ 192 /* original jp and tomatillo speed saved in old_lvl */ \ 193 \ 194 /* either intended or currently at full speed */ \ 195 set JBUS_CONFIG_ECLK_MASK, scr4; \ 196 andcc old_lvl, scr4, %g0; \ 197 bz,pt %icc, 8f; \ 198 nop; \ 199 /* go through 1/2 speed. */ \ 200 SET_JP_SPEED(JBUS_CONFIG_ECLK_2, scr3, scr4); \ 201 SET_TOM_SPEED(TOM_HALF_SPEED, scr2, scr3); \ 202 SET_SLAVE_T_SPEED(TOM_HALF_SPEED, scr3, scr4); \ 203 JP_ADJUST_FSM(0, scr3, scr4); \ 204 set jp_estar_tl0_data, scr3; \ 205 ldx [scr3], %g0; \ 206 membar #Sync; /* or busy wait 1us */ \ 207 JP_ESTAR_TRIGGER(scr3, scr4); \ 208 8: \ 209 /* bring to 1:1 speed */ \ 210 SET_JP_SPEED(JBUS_CONFIG_ECLK_1, scr3, scr4); \ 211 SET_TOM_SPEED(TOM_FULL_SPEED, scr2, scr3); \ 212 SET_SLAVE_T_SPEED(TOM_FULL_SPEED, scr3, scr4); \ 213 JP_ADJUST_FSM(JP_MCU_FSM_MASK, scr3, scr4); \ 214 JP_ESTAR_TRIGGER(scr3, scr4) 215 216 217 /* 218 * Macro to restore Jalapeno/Tomatillo to original speed 219 * old_lvl - register contains saved original cpu, tomatillo speed 220 * scr2 - scratch register 221 * scr3 - scratch register 222 * scr4 - scratch register 223 * 224 * If trap had occured in the middle of ppm cpu speed transtion, then 225 * old_lvl[31:10] contains the intended new speed written into jbus_config. 226 * if old_lvl[9:0] is inconsistent with old_lvl[31:10], then the trap surely 227 * interrupted the ppm cpu speed transition, otherwise nothing for sure. 228 * We'll restore the intended/then-current speed, that should cause no 229 * trouble to subsequent ppm cpu speed change code. 230 */ 231 #define JP_RESTORE_SPEED(old_lvl, scr2, scr3, scr4) \ 232 srlx old_lvl, JBUS_CONFIG_ECLK_SHIFT, scr2; \ 233 and scr2, 3, scr2; \ 234 add scr2, 1, scr2; \ 235 cmp scr2, 3; \ 236 bne,pt %icc, 7f; \ 237 nop; \ 238 set TOM_SLOW_SPEED, scr2; \ 239 /* scr2 contains tom speed according to intended jp speed */ \ 240 7: \ 241 andn old_lvl, TOM_ESTAR_ELCK_MASK, old_lvl; \ 242 or scr2, old_lvl, old_lvl; \ 243 /* updated old_lvl to contain intended jp and tom speed */ \ 244 andcc old_lvl, TOM_FULL_SPEED, %g0; \ 245 bnz,pt %icc, 9f; /* intended full, already at full */ \ 246 nop; \ 247 \ 248 /* go to half speed */ \ 249 SET_JP_SPEED(JBUS_CONFIG_ECLK_2, scr3, scr4); \ 250 SET_64BIT_PA(scr2, scr3, TOM_HIGH_PA, M_T_ESTAR_CTRL_PA); \ 251 SET_TOM_SPEED(TOM_HALF_SPEED, scr2, scr3); \ 252 SET_SLAVE_T_SPEED(TOM_HALF_SPEED, scr3, scr4); \ 253 JP_ADJUST_FSM(0, scr3, scr4); \ 254 set jp_estar_tl0_data, scr3; \ 255 ldx [scr3], %g0; \ 256 membar #Sync; \ 257 JP_ESTAR_TRIGGER(scr3, scr4); \ 258 andcc old_lvl, TOM_SLOW_SPEED, %g0; \ 259 bz,pt %icc, 9f; /* intended 1:2, already at 1:2 */ \ 260 nop; \ 261 \ 262 /* go to 1:32 speed */ \ 263 SET_JP_SPEED(JBUS_CONFIG_ECLK_32, scr3, scr4); \ 264 SET_TOM_SPEED(TOM_SLOW_SPEED, scr2, scr3); \ 265 SET_SLAVE_T_SPEED(TOM_SLOW_SPEED, scr3, scr4); \ 266 JP_ESTAR_TRIGGER(scr3, scr4); \ 267 9: 268 269 #endif /* !(JBUS_CONFIG_ECLK_MASK & TOM_SPEED_MASK) */ 270 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 271 272 /* 273 * Jalapeno version to reflush an Ecache line by index. 274 * Will flush all 4 ways (with only one scratch register). 275 * Note that the code will be faster if we use 2 scratch registers. 276 */ 277 #define ECACHE_REFLUSH_LINE(ec_set_size, index, scr1) \ 278 JP_EC_DIAG_ACCESS_MEMBAR; \ 279 ldxa [index]ASI_EC_DIAG, %g0; \ 280 JP_EC_DIAG_ACCESS_MEMBAR; \ 281 mov 1, scr1; \ 282 sllx scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1; \ 283 add scr1, index, scr1; \ 284 JP_EC_DIAG_ACCESS_MEMBAR; \ 285 ldxa [scr1]ASI_EC_DIAG, %g0; \ 286 JP_EC_DIAG_ACCESS_MEMBAR; \ 287 mov 2, scr1; \ 288 sllx scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1; \ 289 add scr1, index, scr1; \ 290 JP_EC_DIAG_ACCESS_MEMBAR; \ 291 ldxa [scr1]ASI_EC_DIAG, %g0; \ 292 JP_EC_DIAG_ACCESS_MEMBAR; \ 293 mov 3, scr1; \ 294 sllx scr1, JP_ECFLUSH_EC_WAY_SHIFT, scr1; \ 295 add scr1, index, scr1; \ 296 JP_EC_DIAG_ACCESS_MEMBAR; \ 297 ldxa [scr1]ASI_EC_DIAG, %g0; \ 298 JP_EC_DIAG_ACCESS_MEMBAR 299 300 /* 301 * Jalapeno version of ecache_flush_line. Uses Jalapeno Ecache Displacement 302 * Flush feature to flush all 4 sets/ways. 303 */ 304 #define ECACHE_FLUSH_LINE(physaddr, ec_set_size, scr1, scr2) \ 305 CPU_INDEX(scr1, scr2); \ 306 sllx scr1, JP_ECFLUSH_PORTID_SHIFT, scr1; \ 307 set JP_ECACHE_IDX_DISP_FLUSH, scr2; \ 308 or scr2, scr1, scr2; \ 309 sub ec_set_size, 1, scr1; \ 310 and physaddr, scr1, scr1; \ 311 or scr2, scr1, scr1; \ 312 ECACHE_REFLUSH_LINE(ec_set_size, scr1, scr2) 313 314 /* 315 * Macro for getting ecache size from cpunodes structure 316 * scr1: Scratch, ecache size returned in this 317 * scr2: Scratch 318 */ 319 #define GET_ECACHE_SIZE(scr1, scr2) \ 320 CPU_INDEX(scr1, scr2); \ 321 mulx scr1, CPU_NODE_SIZE, scr1; \ 322 set cpunodes + ECACHE_SIZE, scr2; \ 323 ld [scr1 + scr2], scr1 324 325 /* END CSTYLED */ 326 327 #endif /* !lint */ 328 329 #if defined(lint) 330 331 /* ARGSUSED */ 332 void 333 shipit(int upaid, int bn) 334 { return; } 335 336 #else /* lint */ 337 338 /* 339 * Ship mondo to aid using implicit busy/nack pair (bn ignored) 340 */ 341 ENTRY_NP(shipit) 342 sll %o0, IDCR_PID_SHIFT, %g1 ! IDCR<18:14> = agent id 343 or %g1, IDCR_OFFSET, %g1 ! IDCR<13:0> = 0x70 344 stxa %g0, [%g1]ASI_INTR_DISPATCH ! interrupt vector dispatch 345 membar #Sync 346 retl 347 nop 348 SET_SIZE(shipit) 349 350 #endif /* lint */ 351 352 353 /* 354 * flush_ecache: 355 * %o0 - 64 bit physical address 356 * %o1 - ecache size 357 * %o2 - ecache linesize 358 */ 359 #if defined(lint) 360 361 /*ARGSUSED*/ 362 void 363 flush_ecache(uint64_t physaddr, size_t ecache_size, size_t ecache_linesize) 364 {} 365 366 #else /* !lint */ 367 368 ENTRY(flush_ecache) 369 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 370 CHK_JP_ERRATA85_ENABLED(%g1, flush_ecache_1); 371 JP_FORCE_FULL_SPEED(%o3, %g1, %g2, %g3); /* %o3: saved speed */ 372 flush_ecache_1: 373 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 374 375 /* 376 * Flush the entire Ecache using displacement flush. 377 */ 378 ECACHE_FLUSHALL(%o1, %o2, %o0, %o4) 379 380 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 381 CHK_JP_ERRATA85_ENABLED(%g1, flush_ecache_2); 382 JP_RESTORE_SPEED(%o3, %g1, %g2, %g3); /* %o3: saved speed */ 383 flush_ecache_2: 384 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 385 386 retl 387 nop 388 SET_SIZE(flush_ecache) 389 390 #endif /* lint */ 391 392 393 #if defined(lint) 394 395 void 396 fast_ecc_err(void) 397 {} 398 399 #else /* lint */ 400 401 .section ".text" 402 .align 64 403 ENTRY_NP(fast_ecc_err) 404 405 /* 406 * Turn off CEEN and NCEEN. 407 */ 408 ldxa [%g0]ASI_ESTATE_ERR, %g3 409 andn %g3, EN_REG_NCEEN + EN_REG_CEEN, %g4 410 stxa %g4, [%g0]ASI_ESTATE_ERR 411 membar #Sync ! membar sync required 412 413 /* 414 * Do the CPU log out capture. 415 * %g3 = "failed?" return value. 416 * %g2 = Input = AFAR. Output the clo_flags info which is passed 417 * into this macro via %g4. Output only valid if cpu_private 418 * struct has not been initialized. 419 * CHPR_FECCTL0_LOGOUT = cpu logout structure offset input 420 * %g4 = Trap information stored in the cpu logout flags field 421 * %g5 = scr1 422 * %g6 = scr2 423 * %g3 = scr3 424 * %g4 = scr4 425 */ 426 and %g3, EN_REG_CEEN, %g4 ! store the CEEN value, TL=0 427 set CHPR_FECCTL0_LOGOUT, %g6 428 DO_CPU_LOGOUT(%g3, %g2, %g6, %g4, %g5, %g6, %g3, %g4) 429 430 /* 431 * Flush the Ecache to get the error out of the Ecache. If the UCC 432 * or UCU is on a dirty line, then the following flush will turn 433 * that into a WDC or WDU, respectively. 434 */ 435 CPU_INDEX(%g4, %g5) 436 mulx %g4, CPU_NODE_SIZE, %g4 437 set cpunodes, %g5 438 add %g4, %g5, %g4 439 ld [%g4 + ECACHE_LINESIZE], %g5 440 ld [%g4 + ECACHE_SIZE], %g4 441 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 442 CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_err_1); 443 set jp_estar_tl0_data, %g6 444 stx %g2, [%g6 + 0] 445 stx %g3, [%g6 + 8] 446 JP_FORCE_FULL_SPEED(%g2, %g3, %g6, %g7) /* %g2: saved speed */ 447 fast_ecc_err_1: 448 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 449 ECACHE_FLUSHALL(%g4, %g5, %g6, %g7) 450 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 451 CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_err_2); 452 JP_RESTORE_SPEED(%g2, %g3, %g6, %g7) /* %g2: saved speed */ 453 set jp_estar_tl0_data, %g6 454 ldx [%g6 + 0], %g2 455 ldx [%g6 + 8], %g3 456 fast_ecc_err_2: 457 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 458 459 /* 460 * Flush the Dcache. Since bad data could have been installed in 461 * the Dcache we must flush it before re-enabling it. 462 */ 463 ASM_LD(%g5, dcache_size) 464 ASM_LD(%g6, dcache_linesize) 465 CH_DCACHE_FLUSHALL(%g5, %g6, %g7) 466 467 /* 468 * Flush the Icache. Since we turned off the Icache to capture the 469 * Icache line it is now stale or corrupted and we must flush it 470 * before re-enabling it. 471 */ 472 GET_CPU_PRIVATE_PTR(%g0, %g5, %g7, fast_ecc_err_4); 473 ld [%g5 + CHPR_ICACHE_LINESIZE], %g6 474 ba,pt %icc, 5f 475 ld [%g5 + CHPR_ICACHE_SIZE], %g5 476 fast_ecc_err_4: 477 ASM_LD(%g5, icache_size) 478 ASM_LD(%g6, icache_linesize) 479 5: 480 CH_ICACHE_FLUSHALL(%g5, %g6, %g7, %g4) 481 482 /* 483 * Restore the Dcache and Icache to the previous state. 484 */ 485 stxa %g1, [%g0]ASI_DCU 486 flush %g0 /* flush required after changing the IC bit */ 487 488 /* 489 * Make sure our CPU logout operation was successful. 490 */ 491 cmp %g3, %g0 492 be 8f 493 nop 494 495 /* 496 * If the logout structure had been busy, how many times have 497 * we tried to use it and failed (nesting count)? If we have 498 * already recursed a substantial number of times, then we can 499 * assume things are not going to get better by themselves and 500 * so it would be best to panic. 501 */ 502 cmp %g3, CLO_NESTING_MAX 503 blt 7f 504 nop 505 506 call ptl1_panic 507 mov PTL1_BAD_ECC, %g1 508 509 7: 510 /* 511 * Otherwise, if the logout structure was busy but we have not 512 * nested more times than our maximum value, then we simply 513 * issue a retry. Our TL=0 trap handler code will check and 514 * clear the AFSR after it is done logging what is currently 515 * in the logout struct and handle this event at that time. 516 */ 517 retry 518 8: 519 /* 520 * Call cpu_fast_ecc_error via systrap at PIL 14 unless we're 521 * already at PIL 15. 522 */ 523 set cpu_fast_ecc_error, %g1 524 rdpr %pil, %g4 525 cmp %g4, PIL_14 526 ba sys_trap 527 movl %icc, PIL_14, %g4 528 529 SET_SIZE(fast_ecc_err) 530 531 #endif /* lint */ 532 533 534 /* 535 * Fast ECC error at TL>0 handler 536 * We get here via trap 70 at TL>0->Software trap 0 at TL>0. We enter 537 * this routine with %g1 and %g2 already saved in %tpc, %tnpc and %tstate. 538 * For a complete description of the Fast ECC at TL>0 handling see the 539 * comment block "Cheetah/Cheetah+ Fast ECC at TL>0 trap strategy" in 540 * us3_common_asm.s 541 */ 542 #if defined(lint) 543 544 void 545 fast_ecc_tl1_err(void) 546 {} 547 548 #else /* lint */ 549 550 .section ".text" 551 .align 64 552 ENTRY_NP(fast_ecc_tl1_err) 553 554 /* 555 * This macro turns off the D$/I$ if they are on and saves their 556 * original state in ch_err_tl1_tmp, saves all the %g registers in the 557 * ch_err_tl1_data structure, updates the ch_err_tl1_flags and saves 558 * the %tpc in ch_err_tl1_tpc. At the end of this macro, %g1 will 559 * point to the ch_err_tl1_data structure and the original D$/I$ state 560 * will be saved in ch_err_tl1_tmp. All %g registers except for %g1 561 * will be available. 562 */ 563 CH_ERR_TL1_FECC_ENTER; 564 565 /* 566 * Get the diagnostic logout data. %g4 must be initialized to 567 * current CEEN state, %g5 must point to logout structure in 568 * ch_err_tl1_data_t. %g3 will contain the nesting count upon 569 * return. 570 */ 571 ldxa [%g0]ASI_ESTATE_ERR, %g4 572 and %g4, EN_REG_CEEN, %g4 573 add %g1, CH_ERR_TL1_LOGOUT, %g5 574 DO_TL1_CPU_LOGOUT(%g3, %g2, %g4, %g5, %g6, %g3, %g4) 575 576 /* 577 * If the logout nesting count is exceeded, we're probably 578 * not making any progress, try to panic instead. 579 */ 580 cmp %g3, CLO_NESTING_MAX 581 bge fecc_tl1_err 582 nop 583 584 /* 585 * Save the current CEEN and NCEEN state in %g7 and turn them off 586 * before flushing the Ecache. 587 */ 588 ldxa [%g0]ASI_ESTATE_ERR, %g7 589 andn %g7, EN_REG_CEEN | EN_REG_NCEEN, %g5 590 stxa %g5, [%g0]ASI_ESTATE_ERR 591 membar #Sync 592 593 /* 594 * Flush the Ecache, using the largest possible cache size with the 595 * smallest possible line size since we can't get the actual sizes 596 * from the cpu_node due to DTLB misses. 597 */ 598 set JP_ECACHE_MAX_SIZE, %g4 599 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 600 CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_tl1_err_1); 601 set jp_estar_tl1_data, %g6 602 stx %g2, [%g6 + 0] 603 stx %g3, [%g6 + 8] 604 JP_FORCE_FULL_SPEED(%g2, %g3, %g5, %g6) 605 fast_ecc_tl1_err_1: 606 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 607 ECACHE_FLUSHALL(%g4, JP_ECACHE_MAX_LSIZE, %g5, %g6) 608 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 609 CHK_JP_ERRATA85_ENABLED(%g6, fast_ecc_tl1_err_2); 610 JP_RESTORE_SPEED(%g2, %g3, %g5, %g6) 611 set jp_estar_tl1_data, %g6 612 ldx [%g6 + 0], %g2 613 ldx [%g6 + 8], %g3 614 fast_ecc_tl1_err_2: 615 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 616 617 /* 618 * Restore CEEN and NCEEN to the previous state. 619 */ 620 stxa %g7, [%g0]ASI_ESTATE_ERR 621 membar #Sync 622 623 /* 624 * If we turned off the D$, then flush it and turn it back on. 625 */ 626 ldxa [%g1 + CH_ERR_TL1_TMP]%asi, %g3 627 andcc %g3, CH_ERR_TSTATE_DC_ON, %g0 628 bz %xcc, 3f 629 nop 630 631 /* 632 * Flush the D$. 633 */ 634 ASM_LD(%g4, dcache_size) 635 ASM_LD(%g5, dcache_linesize) 636 CH_DCACHE_FLUSHALL(%g4, %g5, %g6) 637 638 /* 639 * Turn the D$ back on. 640 */ 641 ldxa [%g0]ASI_DCU, %g3 642 or %g3, DCU_DC, %g3 643 stxa %g3, [%g0]ASI_DCU 644 membar #Sync 645 3: 646 /* 647 * If we turned off the I$, then flush it and turn it back on. 648 */ 649 ldxa [%g1 + CH_ERR_TL1_TMP]%asi, %g3 650 andcc %g3, CH_ERR_TSTATE_IC_ON, %g0 651 bz %xcc, 4f 652 nop 653 654 /* 655 * Flush the I$. 656 */ 657 ASM_LD(%g4, icache_size) 658 ASM_LD(%g5, icache_linesize) 659 CH_ICACHE_FLUSHALL(%g4, %g5, %g6, %g3) 660 661 /* 662 * Turn the I$ back on. Changing DCU_IC requires flush. 663 */ 664 ldxa [%g0]ASI_DCU, %g3 665 or %g3, DCU_IC, %g3 666 stxa %g3, [%g0]ASI_DCU 667 flush %g0 668 4: 669 670 #ifdef TRAPTRACE 671 /* 672 * Get current trap trace entry physical pointer. 673 */ 674 CPU_INDEX(%g6, %g5) 675 sll %g6, TRAPTR_SIZE_SHIFT, %g6 676 set trap_trace_ctl, %g5 677 add %g6, %g5, %g6 678 ld [%g6 + TRAPTR_LIMIT], %g5 679 tst %g5 680 be %icc, skip_traptrace 681 nop 682 ldx [%g6 + TRAPTR_PBASE], %g5 683 ld [%g6 + TRAPTR_OFFSET], %g4 684 add %g5, %g4, %g5 685 686 /* 687 * Create trap trace entry. 688 */ 689 rd %asi, %g7 690 wr %g0, TRAPTR_ASI, %asi 691 rd STICK, %g4 692 stxa %g4, [%g5 + TRAP_ENT_TICK]%asi 693 rdpr %tl, %g4 694 stha %g4, [%g5 + TRAP_ENT_TL]%asi 695 rdpr %tt, %g4 696 stha %g4, [%g5 + TRAP_ENT_TT]%asi 697 rdpr %tpc, %g4 698 stna %g4, [%g5 + TRAP_ENT_TPC]%asi 699 rdpr %tstate, %g4 700 stxa %g4, [%g5 + TRAP_ENT_TSTATE]%asi 701 stna %sp, [%g5 + TRAP_ENT_SP]%asi 702 stna %g0, [%g5 + TRAP_ENT_TR]%asi 703 wr %g0, %g7, %asi 704 ldxa [%g1 + CH_ERR_TL1_SDW_AFAR]%asi, %g3 705 ldxa [%g1 + CH_ERR_TL1_SDW_AFSR]%asi, %g4 706 wr %g0, TRAPTR_ASI, %asi 707 stna %g3, [%g5 + TRAP_ENT_F1]%asi 708 stna %g4, [%g5 + TRAP_ENT_F2]%asi 709 wr %g0, %g7, %asi 710 ldxa [%g1 + CH_ERR_TL1_AFAR]%asi, %g3 711 ldxa [%g1 + CH_ERR_TL1_AFSR]%asi, %g4 712 wr %g0, TRAPTR_ASI, %asi 713 stna %g3, [%g5 + TRAP_ENT_F3]%asi 714 stna %g4, [%g5 + TRAP_ENT_F4]%asi 715 wr %g0, %g7, %asi 716 717 /* 718 * Advance trap trace pointer. 719 */ 720 ld [%g6 + TRAPTR_OFFSET], %g5 721 ld [%g6 + TRAPTR_LIMIT], %g4 722 st %g5, [%g6 + TRAPTR_LAST_OFFSET] 723 add %g5, TRAP_ENT_SIZE, %g5 724 sub %g4, TRAP_ENT_SIZE, %g4 725 cmp %g5, %g4 726 movge %icc, 0, %g5 727 st %g5, [%g6 + TRAPTR_OFFSET] 728 skip_traptrace: 729 #endif /* TRAPTRACE */ 730 731 /* 732 * If nesting count is not zero, skip all the AFSR/AFAR 733 * handling and just do the necessary cache-flushing. 734 */ 735 ldxa [%g1 + CH_ERR_TL1_NEST_CNT]%asi, %g2 736 brnz %g2, 6f 737 nop 738 739 /* 740 * If a UCU followed by a WDU has occurred go ahead and panic 741 * since a UE will occur (on the retry) before the UCU and WDU 742 * messages are enqueued. 743 */ 744 ldxa [%g1 + CH_ERR_TL1_AFSR]%asi, %g3 745 set 1, %g4 746 sllx %g4, C_AFSR_UCU_SHIFT, %g4 747 btst %g4, %g3 ! UCU in original AFSR? 748 bz %xcc, 6f 749 nop 750 ldxa [%g0]ASI_AFSR, %g4 ! current AFSR 751 or %g3, %g4, %g3 ! %g3 = original + current AFSR 752 set 1, %g4 753 sllx %g4, C_AFSR_WDU_SHIFT, %g4 754 btst %g4, %g3 ! WDU in original or current AFSR? 755 bnz %xcc, fecc_tl1_err 756 nop 757 758 6: 759 /* 760 * We fall into this macro if we've successfully logged the error in 761 * the ch_err_tl1_data structure and want the PIL15 softint to pick 762 * it up and log it. %g1 must point to the ch_err_tl1_data structure. 763 * Restores the %g registers and issues retry. 764 */ 765 CH_ERR_TL1_EXIT; 766 /* 767 * Establish panic exit label. 768 */ 769 CH_ERR_TL1_PANIC_EXIT(fecc_tl1_err); 770 771 SET_SIZE(fast_ecc_tl1_err) 772 773 #endif /* lint */ 774 775 776 #if defined(lint) 777 778 uint64_t 779 get_jbus_config(void) 780 { return (0); } 781 782 /* ARGSUSED */ 783 void 784 set_jbus_config(uint64_t jbus_config) 785 {} 786 787 /* ARGSUSED */ 788 void 789 set_mcu_ctl_reg1(uint64_t mcu_ctl) 790 {} 791 792 uint64_t 793 get_mcu_ctl_reg1(void) 794 { return (0); } 795 796 #else /* lint */ 797 798 ENTRY(get_jbus_config) 799 ldxa [%g0]ASI_JBUS_CONFIG, %o0 800 retl 801 nop 802 SET_SIZE(get_jbus_config) 803 804 ENTRY(set_jbus_config) 805 stxa %o0, [%g0]ASI_JBUS_CONFIG 806 membar #Sync 807 retl 808 nop 809 SET_SIZE(set_jbus_config) 810 811 812 ENTRY(get_mcu_ctl_reg1) 813 ldxa [%g0]ASI_MCU_CTRL, %o0 ! MCU control reg1 is at offset 0 814 retl 815 nop 816 SET_SIZE(get_mcu_ctl_reg1) 817 818 819 ENTRY(set_mcu_ctl_reg1) 820 stxa %o0, [%g0]ASI_MCU_CTRL ! MCU control reg1 is at offset 0 821 membar #Sync 822 retl 823 nop 824 SET_SIZE(set_mcu_ctl_reg1) 825 826 #endif /* lint */ 827 828 829 #if defined(lint) 830 /* 831 * scrubphys - Pass in the aligned physical memory address 832 * that you want to scrub, along with the ecache set size. 833 * 834 * 1) Displacement flush the E$ line corresponding to %addr. 835 * The first ldxa guarantees that the %addr is no longer in 836 * M, O, or E (goes to I or S (if instruction fetch also happens). 837 * 2) "Write" the data using a CAS %addr,%g0,%g0. 838 * The casxa guarantees a transition from I to M or S to M. 839 * 3) Displacement flush the E$ line corresponding to %addr. 840 * The second ldxa pushes the M line out of the ecache, into the 841 * writeback buffers, on the way to memory. 842 * 4) The "membar #Sync" pushes the cache line out of the writeback 843 * buffers onto the bus, on the way to dram finally. 844 * 845 * This is a modified version of the algorithm suggested by Gary Lauterbach. 846 * In theory the CAS %addr,%g0,%g0 is supposed to mark the addr's cache line 847 * as modified, but then we found out that for spitfire, if it misses in the 848 * E$ it will probably install as an M, but if it hits in the E$, then it 849 * will stay E, if the store doesn't happen. So the first displacement flush 850 * should ensure that the CAS will miss in the E$. Arrgh. 851 */ 852 /* ARGSUSED */ 853 void 854 scrubphys(uint64_t paddr, int ecache_set_size) 855 {} 856 857 #else /* lint */ 858 ENTRY(scrubphys) 859 rdpr %pstate, %o4 860 andn %o4, PSTATE_IE | PSTATE_AM, %o5 861 wrpr %o5, %g0, %pstate ! clear IE, AM bits 862 863 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 864 CHK_JP_ERRATA85_ENABLED(%g1, scrubphys_1); 865 JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 866 scrubphys_1: 867 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 868 869 ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3) 870 casxa [%o0]ASI_MEM, %g0, %g0 871 ECACHE_REFLUSH_LINE(%o1, %o2, %o3) 872 873 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 874 CHK_JP_ERRATA85_ENABLED(%g1, scrubphys_2); 875 JP_RESTORE_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 876 scrubphys_2: 877 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 878 879 wrpr %g0, %o4, %pstate ! restore earlier pstate register value 880 881 retl 882 membar #Sync ! move the data out of the load buffer 883 SET_SIZE(scrubphys) 884 885 #endif /* lint */ 886 887 888 #if defined(lint) 889 /* 890 * clearphys - Pass in the physical memory address of the checkblock 891 * that you want to push out, cleared with a recognizable pattern, 892 * from the ecache. 893 * 894 * To ensure that the ecc gets recalculated after the bad data is cleared, 895 * we must write out enough data to fill the w$ line (64 bytes). So we read 896 * in an entire ecache subblock's worth of data, and write it back out. 897 * Then we overwrite the 16 bytes of bad data with the pattern. 898 */ 899 /* ARGSUSED */ 900 void 901 clearphys(uint64_t paddr, int ecache_set_size, int ecache_linesize) 902 { 903 } 904 905 #else /* lint */ 906 ENTRY(clearphys) 907 /* turn off IE, AM bits */ 908 rdpr %pstate, %o4 909 andn %o4, PSTATE_IE | PSTATE_AM, %o5 910 wrpr %o5, %g0, %pstate 911 912 /* turn off NCEEN */ 913 ldxa [%g0]ASI_ESTATE_ERR, %o5 914 andn %o5, EN_REG_NCEEN, %o3 915 stxa %o3, [%g0]ASI_ESTATE_ERR 916 membar #Sync 917 918 /* align address passed with 64 bytes subblock size */ 919 mov CH_ECACHE_SUBBLK_SIZE, %o2 920 andn %o0, (CH_ECACHE_SUBBLK_SIZE - 1), %g1 921 922 /* move the good data into the W$ */ 923 1: 924 subcc %o2, 8, %o2 925 ldxa [%g1 + %o2]ASI_MEM, %g2 926 bge 1b 927 stxa %g2, [%g1 + %o2]ASI_MEM 928 929 /* now overwrite the bad data */ 930 setx 0xbadecc00badecc01, %g1, %g2 931 stxa %g2, [%o0]ASI_MEM 932 mov 8, %g1 933 stxa %g2, [%o0 + %g1]ASI_MEM 934 935 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 936 CHK_JP_ERRATA85_ENABLED(%g1, clearphys_1); 937 JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 938 clearphys_1: 939 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 940 941 ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3) 942 casxa [%o0]ASI_MEM, %g0, %g0 943 ECACHE_REFLUSH_LINE(%o1, %o2, %o3) 944 945 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 946 CHK_JP_ERRATA85_ENABLED(%g1, clearphys_2); 947 JP_RESTORE_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 948 clearphys_2: 949 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 950 951 /* clear the AFSR */ 952 ldxa [%g0]ASI_AFSR, %o1 953 stxa %o1, [%g0]ASI_AFSR 954 membar #Sync 955 956 /* turn NCEEN back on */ 957 stxa %o5, [%g0]ASI_ESTATE_ERR 958 membar #Sync 959 960 /* return and re-enable IE and AM */ 961 retl 962 wrpr %g0, %o4, %pstate 963 SET_SIZE(clearphys) 964 965 #endif /* lint */ 966 967 968 #if defined(lint) 969 /* 970 * Jalapeno Ecache displacement flush the specified line from the E$ 971 * 972 * Register usage: 973 * %o0 - 64 bit physical address for flushing 974 * %o1 - Ecache set size 975 */ 976 /*ARGSUSED*/ 977 void 978 ecache_flush_line(uint64_t flushaddr, int ec_set_size) 979 { 980 } 981 #else /* lint */ 982 ENTRY(ecache_flush_line) 983 984 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 985 CHK_JP_ERRATA85_ENABLED(%g1, ecache_flush_line_1); 986 JP_FORCE_FULL_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 987 ecache_flush_line_1: 988 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 989 990 ECACHE_FLUSH_LINE(%o0, %o1, %o2, %o3) 991 992 #if defined(JALAPENO) && defined(JALAPENO_ERRATA_85) 993 CHK_JP_ERRATA85_ENABLED(%g1, ecache_flush_line_2); 994 JP_RESTORE_SPEED(%o5, %g1, %g2, %g3) /* %o5: saved speed */ 995 ecache_flush_line_2: 996 #endif /* JALAPENO && JALAPENO_ERRATA_85 */ 997 998 retl 999 nop 1000 SET_SIZE(ecache_flush_line) 1001 #endif /* lint */ 1002 1003 1004 /* 1005 * Perform necessary cpu workaround to ensure jbus ordering. 1006 * Called only from Fire systems. 1007 * CPU's internal "invalidate FIFOs" are flushed. 1008 */ 1009 1010 #if defined(lint) 1011 void 1012 jbus_stst_order() 1013 {} 1014 #else /* lint */ 1015 1016 #define VIS_BLOCKSIZE 64 1017 1018 .seg ".data" 1019 .align VIS_BLOCKSIZE 1020 .type sync_buf, #object 1021 sync_buf: 1022 .skip VIS_BLOCKSIZE 1023 .size sync_buf, VIS_BLOCKSIZE 1024 1025 ENTRY(jbus_stst_order) 1026 set sync_buf, %o1 1027 1028 rd %fprs, %o2 ! %o2 = saved fprs 1029 or %o2, FPRS_FEF, %o3 1030 wr %g0, %o3, %fprs ! make sure fp is enabled 1031 stda %d0, [%o1]ASI_BLK_COMMIT_P 1032 wr %o2, 0, %fprs ! restore fprs 1033 1034 retl 1035 membar #Sync 1036 SET_SIZE(jbus_stst_order) 1037 1038 #endif /* lint */ 1039 1040 #if defined(lint) 1041 /* 1042 * This routine will not be called in Jalapeno systems. 1043 */ 1044 void 1045 flush_ipb(void) 1046 { return; } 1047 1048 #else /* lint */ 1049 1050 ENTRY(flush_ipb) 1051 retl 1052 nop 1053 SET_SIZE(flush_ipb) 1054 1055 #endif /* lint */