emulate.c 121 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208120912101211121212131214121512161217121812191220122112221223122412251226122712281229123012311232123312341235123612371238123912401241124212431244124512461247124812491250125112521253125412551256125712581259126012611262126312641265126612671268126912701271127212731274127512761277127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748174917501751175217531754175517561757175817591760176117621763176417651766176717681769177017711772177317741775177617771778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227722782279228022812282228322842285228622872288228922902291229222932294229522962297229822992300230123022303230423052306230723082309231023112312231323142315231623172318231923202321232223232324232523262327232823292330233123322333233423352336233723382339234023412342234323442345234623472348234923502351235223532354235523562357235823592360236123622363236423652366236723682369237023712372237323742375237623772378237923802381238223832384238523862387238823892390239123922393239423952396239723982399240024012402240324042405240624072408240924102411241224132414241524162417241824192420242124222423242424252426242724282429243024312432243324342435243624372438243924402441244224432444244524462447244824492450245124522453245424552456245724582459246024612462246324642465246624672468246924702471247224732474247524762477247824792480248124822483248424852486248724882489249024912492249324942495249624972498249925002501250225032504250525062507250825092510251125122513251425152516251725182519252025212522252325242525252625272528252925302531253225332534253525362537253825392540254125422543254425452546254725482549255025512552255325542555255625572558255925602561256225632564256525662567256825692570257125722573257425752576257725782579258025812582258325842585258625872588258925902591259225932594259525962597259825992600260126022603260426052606260726082609261026112612261326142615261626172618261926202621262226232624262526262627262826292630263126322633263426352636263726382639264026412642264326442645264626472648264926502651265226532654265526562657265826592660266126622663266426652666266726682669267026712672267326742675267626772678267926802681268226832684268526862687268826892690269126922693269426952696269726982699270027012702270327042705270627072708270927102711271227132714271527162717271827192720272127222723272427252726272727282729273027312732273327342735273627372738273927402741274227432744274527462747274827492750275127522753275427552756275727582759276027612762276327642765276627672768276927702771277227732774277527762777277827792780278127822783278427852786278727882789279027912792279327942795279627972798279928002801280228032804280528062807280828092810281128122813281428152816281728182819282028212822282328242825282628272828282928302831283228332834283528362837283828392840284128422843284428452846284728482849285028512852285328542855285628572858285928602861286228632864286528662867286828692870287128722873287428752876287728782879288028812882288328842885288628872888288928902891289228932894289528962897289828992900290129022903290429052906290729082909291029112912291329142915291629172918291929202921292229232924292529262927292829292930293129322933293429352936293729382939294029412942294329442945294629472948294929502951295229532954295529562957295829592960296129622963296429652966296729682969297029712972297329742975297629772978297929802981298229832984298529862987298829892990299129922993299429952996299729982999300030013002300330043005300630073008300930103011301230133014301530163017301830193020302130223023302430253026302730283029303030313032303330343035303630373038303930403041304230433044304530463047304830493050305130523053305430553056305730583059306030613062306330643065306630673068306930703071307230733074307530763077307830793080308130823083308430853086308730883089309030913092309330943095309630973098309931003101310231033104310531063107310831093110311131123113311431153116311731183119312031213122312331243125312631273128312931303131313231333134313531363137313831393140314131423143314431453146314731483149315031513152315331543155315631573158315931603161316231633164316531663167316831693170317131723173317431753176317731783179318031813182318331843185318631873188318931903191319231933194319531963197319831993200320132023203320432053206320732083209321032113212321332143215321632173218321932203221322232233224322532263227322832293230323132323233323432353236323732383239324032413242324332443245324632473248324932503251325232533254325532563257325832593260326132623263326432653266326732683269327032713272327332743275327632773278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377737783779378037813782378337843785378637873788378937903791379237933794379537963797379837993800380138023803380438053806380738083809381038113812381338143815381638173818381938203821382238233824382538263827382838293830383138323833383438353836383738383839384038413842384338443845384638473848384938503851385238533854385538563857385838593860386138623863386438653866386738683869387038713872387338743875387638773878387938803881388238833884388538863887388838893890389138923893389438953896389738983899390039013902390339043905390639073908390939103911391239133914391539163917391839193920392139223923392439253926392739283929393039313932393339343935393639373938393939403941394239433944394539463947394839493950395139523953395439553956395739583959396039613962396339643965396639673968396939703971397239733974397539763977397839793980398139823983398439853986398739883989399039913992399339943995399639973998399940004001400240034004400540064007400840094010401140124013401440154016401740184019402040214022402340244025402640274028402940304031403240334034403540364037403840394040404140424043404440454046404740484049405040514052405340544055405640574058405940604061406240634064406540664067406840694070407140724073407440754076407740784079408040814082408340844085408640874088408940904091409240934094409540964097409840994100410141024103410441054106410741084109411041114112411341144115411641174118411941204121412241234124412541264127412841294130413141324133413441354136413741384139414041414142414341444145414641474148414941504151415241534154415541564157415841594160416141624163416441654166416741684169417041714172417341744175417641774178417941804181418241834184418541864187418841894190419141924193419441954196419741984199420042014202420342044205420642074208420942104211421242134214421542164217421842194220422142224223422442254226422742284229423042314232423342344235423642374238423942404241424242434244424542464247424842494250425142524253425442554256425742584259426042614262426342644265426642674268426942704271427242734274427542764277427842794280428142824283428442854286428742884289429042914292429342944295429642974298429943004301430243034304430543064307430843094310431143124313431443154316431743184319432043214322432343244325432643274328432943304331433243334334433543364337433843394340434143424343434443454346434743484349435043514352435343544355435643574358435943604361436243634364436543664367436843694370437143724373437443754376437743784379438043814382438343844385438643874388438943904391439243934394439543964397439843994400440144024403440444054406440744084409441044114412441344144415441644174418441944204421442244234424442544264427442844294430443144324433443444354436443744384439444044414442444344444445444644474448444944504451445244534454445544564457445844594460446144624463446444654466446744684469447044714472447344744475447644774478447944804481448244834484448544864487448844894490449144924493449444954496449744984499450045014502450345044505450645074508450945104511451245134514451545164517451845194520452145224523452445254526452745284529453045314532453345344535453645374538453945404541454245434544454545464547454845494550455145524553455445554556455745584559456045614562456345644565456645674568456945704571457245734574457545764577457845794580458145824583458445854586458745884589459045914592459345944595459645974598459946004601460246034604460546064607460846094610461146124613461446154616461746184619462046214622462346244625462646274628462946304631463246334634463546364637463846394640464146424643464446454646464746484649465046514652465346544655465646574658465946604661466246634664466546664667466846694670467146724673467446754676467746784679468046814682468346844685468646874688468946904691469246934694469546964697469846994700470147024703470447054706470747084709471047114712471347144715471647174718471947204721472247234724472547264727472847294730473147324733473447354736473747384739474047414742474347444745
  1. /******************************************************************************
  2. * emulate.c
  3. *
  4. * Generic x86 (32-bit and 64-bit) instruction decoder and emulator.
  5. *
  6. * Copyright (c) 2005 Keir Fraser
  7. *
  8. * Linux coding style, mod r/m decoder, segment base fixes, real-mode
  9. * privileged instructions:
  10. *
  11. * Copyright (C) 2006 Qumranet
  12. * Copyright 2010 Red Hat, Inc. and/or its affiliates.
  13. *
  14. * Avi Kivity <avi@qumranet.com>
  15. * Yaniv Kamay <yaniv@qumranet.com>
  16. *
  17. * This work is licensed under the terms of the GNU GPL, version 2. See
  18. * the COPYING file in the top-level directory.
  19. *
  20. * From: xen-unstable 10676:af9809f51f81a3c43f276f00c81a52ef558afda4
  21. */
  22. #include <linux/kvm_host.h>
  23. #include "kvm_cache_regs.h"
  24. #include <linux/module.h>
  25. #include <asm/kvm_emulate.h>
  26. #include "x86.h"
  27. #include "tss.h"
  28. /*
  29. * Operand types
  30. */
  31. #define OpNone 0ull
  32. #define OpImplicit 1ull /* No generic decode */
  33. #define OpReg 2ull /* Register */
  34. #define OpMem 3ull /* Memory */
  35. #define OpAcc 4ull /* Accumulator: AL/AX/EAX/RAX */
  36. #define OpDI 5ull /* ES:DI/EDI/RDI */
  37. #define OpMem64 6ull /* Memory, 64-bit */
  38. #define OpImmUByte 7ull /* Zero-extended 8-bit immediate */
  39. #define OpDX 8ull /* DX register */
  40. #define OpCL 9ull /* CL register (for shifts) */
  41. #define OpImmByte 10ull /* 8-bit sign extended immediate */
  42. #define OpOne 11ull /* Implied 1 */
  43. #define OpImm 12ull /* Sign extended up to 32-bit immediate */
  44. #define OpMem16 13ull /* Memory operand (16-bit). */
  45. #define OpMem32 14ull /* Memory operand (32-bit). */
  46. #define OpImmU 15ull /* Immediate operand, zero extended */
  47. #define OpSI 16ull /* SI/ESI/RSI */
  48. #define OpImmFAddr 17ull /* Immediate far address */
  49. #define OpMemFAddr 18ull /* Far address in memory */
  50. #define OpImmU16 19ull /* Immediate operand, 16 bits, zero extended */
  51. #define OpES 20ull /* ES */
  52. #define OpCS 21ull /* CS */
  53. #define OpSS 22ull /* SS */
  54. #define OpDS 23ull /* DS */
  55. #define OpFS 24ull /* FS */
  56. #define OpGS 25ull /* GS */
  57. #define OpMem8 26ull /* 8-bit zero extended memory operand */
  58. #define OpImm64 27ull /* Sign extended 16/32/64-bit immediate */
  59. #define OpBits 5 /* Width of operand field */
  60. #define OpMask ((1ull << OpBits) - 1)
  61. /*
  62. * Opcode effective-address decode tables.
  63. * Note that we only emulate instructions that have at least one memory
  64. * operand (excluding implicit stack references). We assume that stack
  65. * references and instruction fetches will never occur in special memory
  66. * areas that require emulation. So, for example, 'mov <imm>,<reg>' need
  67. * not be handled.
  68. */
  69. /* Operand sizes: 8-bit operands or specified/overridden size. */
  70. #define ByteOp (1<<0) /* 8-bit operands. */
  71. /* Destination operand type. */
  72. #define DstShift 1
  73. #define ImplicitOps (OpImplicit << DstShift)
  74. #define DstReg (OpReg << DstShift)
  75. #define DstMem (OpMem << DstShift)
  76. #define DstAcc (OpAcc << DstShift)
  77. #define DstDI (OpDI << DstShift)
  78. #define DstMem64 (OpMem64 << DstShift)
  79. #define DstImmUByte (OpImmUByte << DstShift)
  80. #define DstDX (OpDX << DstShift)
  81. #define DstMask (OpMask << DstShift)
  82. /* Source operand type. */
  83. #define SrcShift 6
  84. #define SrcNone (OpNone << SrcShift)
  85. #define SrcReg (OpReg << SrcShift)
  86. #define SrcMem (OpMem << SrcShift)
  87. #define SrcMem16 (OpMem16 << SrcShift)
  88. #define SrcMem32 (OpMem32 << SrcShift)
  89. #define SrcImm (OpImm << SrcShift)
  90. #define SrcImmByte (OpImmByte << SrcShift)
  91. #define SrcOne (OpOne << SrcShift)
  92. #define SrcImmUByte (OpImmUByte << SrcShift)
  93. #define SrcImmU (OpImmU << SrcShift)
  94. #define SrcSI (OpSI << SrcShift)
  95. #define SrcImmFAddr (OpImmFAddr << SrcShift)
  96. #define SrcMemFAddr (OpMemFAddr << SrcShift)
  97. #define SrcAcc (OpAcc << SrcShift)
  98. #define SrcImmU16 (OpImmU16 << SrcShift)
  99. #define SrcImm64 (OpImm64 << SrcShift)
  100. #define SrcDX (OpDX << SrcShift)
  101. #define SrcMem8 (OpMem8 << SrcShift)
  102. #define SrcMask (OpMask << SrcShift)
  103. #define BitOp (1<<11)
  104. #define MemAbs (1<<12) /* Memory operand is absolute displacement */
  105. #define String (1<<13) /* String instruction (rep capable) */
  106. #define Stack (1<<14) /* Stack instruction (push/pop) */
  107. #define GroupMask (7<<15) /* Opcode uses one of the group mechanisms */
  108. #define Group (1<<15) /* Bits 3:5 of modrm byte extend opcode */
  109. #define GroupDual (2<<15) /* Alternate decoding of mod == 3 */
  110. #define Prefix (3<<15) /* Instruction varies with 66/f2/f3 prefix */
  111. #define RMExt (4<<15) /* Opcode extension in ModRM r/m if mod == 3 */
  112. #define Sse (1<<18) /* SSE Vector instruction */
  113. /* Generic ModRM decode. */
  114. #define ModRM (1<<19)
  115. /* Destination is only written; never read. */
  116. #define Mov (1<<20)
  117. /* Misc flags */
  118. #define Prot (1<<21) /* instruction generates #UD if not in prot-mode */
  119. #define VendorSpecific (1<<22) /* Vendor specific instruction */
  120. #define NoAccess (1<<23) /* Don't access memory (lea/invlpg/verr etc) */
  121. #define Op3264 (1<<24) /* Operand is 64b in long mode, 32b otherwise */
  122. #define Undefined (1<<25) /* No Such Instruction */
  123. #define Lock (1<<26) /* lock prefix is allowed for the instruction */
  124. #define Priv (1<<27) /* instruction generates #GP if current CPL != 0 */
  125. #define No64 (1<<28)
  126. #define PageTable (1 << 29) /* instruction used to write page table */
  127. /* Source 2 operand type */
  128. #define Src2Shift (30)
  129. #define Src2None (OpNone << Src2Shift)
  130. #define Src2CL (OpCL << Src2Shift)
  131. #define Src2ImmByte (OpImmByte << Src2Shift)
  132. #define Src2One (OpOne << Src2Shift)
  133. #define Src2Imm (OpImm << Src2Shift)
  134. #define Src2ES (OpES << Src2Shift)
  135. #define Src2CS (OpCS << Src2Shift)
  136. #define Src2SS (OpSS << Src2Shift)
  137. #define Src2DS (OpDS << Src2Shift)
  138. #define Src2FS (OpFS << Src2Shift)
  139. #define Src2GS (OpGS << Src2Shift)
  140. #define Src2Mask (OpMask << Src2Shift)
  141. #define Mmx ((u64)1 << 40) /* MMX Vector instruction */
  142. #define Aligned ((u64)1 << 41) /* Explicitly aligned (e.g. MOVDQA) */
  143. #define Unaligned ((u64)1 << 42) /* Explicitly unaligned (e.g. MOVDQU) */
  144. #define Avx ((u64)1 << 43) /* Advanced Vector Extensions */
  145. #define X2(x...) x, x
  146. #define X3(x...) X2(x), x
  147. #define X4(x...) X2(x), X2(x)
  148. #define X5(x...) X4(x), x
  149. #define X6(x...) X4(x), X2(x)
  150. #define X7(x...) X4(x), X3(x)
  151. #define X8(x...) X4(x), X4(x)
  152. #define X16(x...) X8(x), X8(x)
  153. struct opcode {
  154. u64 flags : 56;
  155. u64 intercept : 8;
  156. union {
  157. int (*execute)(struct x86_emulate_ctxt *ctxt);
  158. const struct opcode *group;
  159. const struct group_dual *gdual;
  160. const struct gprefix *gprefix;
  161. } u;
  162. int (*check_perm)(struct x86_emulate_ctxt *ctxt);
  163. };
  164. struct group_dual {
  165. struct opcode mod012[8];
  166. struct opcode mod3[8];
  167. };
  168. struct gprefix {
  169. struct opcode pfx_no;
  170. struct opcode pfx_66;
  171. struct opcode pfx_f2;
  172. struct opcode pfx_f3;
  173. };
  174. /* EFLAGS bit definitions. */
  175. #define EFLG_ID (1<<21)
  176. #define EFLG_VIP (1<<20)
  177. #define EFLG_VIF (1<<19)
  178. #define EFLG_AC (1<<18)
  179. #define EFLG_VM (1<<17)
  180. #define EFLG_RF (1<<16)
  181. #define EFLG_IOPL (3<<12)
  182. #define EFLG_NT (1<<14)
  183. #define EFLG_OF (1<<11)
  184. #define EFLG_DF (1<<10)
  185. #define EFLG_IF (1<<9)
  186. #define EFLG_TF (1<<8)
  187. #define EFLG_SF (1<<7)
  188. #define EFLG_ZF (1<<6)
  189. #define EFLG_AF (1<<4)
  190. #define EFLG_PF (1<<2)
  191. #define EFLG_CF (1<<0)
  192. #define EFLG_RESERVED_ZEROS_MASK 0xffc0802a
  193. #define EFLG_RESERVED_ONE_MASK 2
  194. static ulong reg_read(struct x86_emulate_ctxt *ctxt, unsigned nr)
  195. {
  196. if (!(ctxt->regs_valid & (1 << nr))) {
  197. ctxt->regs_valid |= 1 << nr;
  198. ctxt->_regs[nr] = ctxt->ops->read_gpr(ctxt, nr);
  199. }
  200. return ctxt->_regs[nr];
  201. }
  202. static ulong *reg_write(struct x86_emulate_ctxt *ctxt, unsigned nr)
  203. {
  204. ctxt->regs_valid |= 1 << nr;
  205. ctxt->regs_dirty |= 1 << nr;
  206. return &ctxt->_regs[nr];
  207. }
  208. static ulong *reg_rmw(struct x86_emulate_ctxt *ctxt, unsigned nr)
  209. {
  210. reg_read(ctxt, nr);
  211. return reg_write(ctxt, nr);
  212. }
  213. static void writeback_registers(struct x86_emulate_ctxt *ctxt)
  214. {
  215. unsigned reg;
  216. for_each_set_bit(reg, (ulong *)&ctxt->regs_dirty, 16)
  217. ctxt->ops->write_gpr(ctxt, reg, ctxt->_regs[reg]);
  218. }
  219. static void invalidate_registers(struct x86_emulate_ctxt *ctxt)
  220. {
  221. ctxt->regs_dirty = 0;
  222. ctxt->regs_valid = 0;
  223. }
  224. /*
  225. * Instruction emulation:
  226. * Most instructions are emulated directly via a fragment of inline assembly
  227. * code. This allows us to save/restore EFLAGS and thus very easily pick up
  228. * any modified flags.
  229. */
  230. #if defined(CONFIG_X86_64)
  231. #define _LO32 "k" /* force 32-bit operand */
  232. #define _STK "%%rsp" /* stack pointer */
  233. #elif defined(__i386__)
  234. #define _LO32 "" /* force 32-bit operand */
  235. #define _STK "%%esp" /* stack pointer */
  236. #endif
  237. /*
  238. * These EFLAGS bits are restored from saved value during emulation, and
  239. * any changes are written back to the saved value after emulation.
  240. */
  241. #define EFLAGS_MASK (EFLG_OF|EFLG_SF|EFLG_ZF|EFLG_AF|EFLG_PF|EFLG_CF)
  242. /* Before executing instruction: restore necessary bits in EFLAGS. */
  243. #define _PRE_EFLAGS(_sav, _msk, _tmp) \
  244. /* EFLAGS = (_sav & _msk) | (EFLAGS & ~_msk); _sav &= ~_msk; */ \
  245. "movl %"_sav",%"_LO32 _tmp"; " \
  246. "push %"_tmp"; " \
  247. "push %"_tmp"; " \
  248. "movl %"_msk",%"_LO32 _tmp"; " \
  249. "andl %"_LO32 _tmp",("_STK"); " \
  250. "pushf; " \
  251. "notl %"_LO32 _tmp"; " \
  252. "andl %"_LO32 _tmp",("_STK"); " \
  253. "andl %"_LO32 _tmp","__stringify(BITS_PER_LONG/4)"("_STK"); " \
  254. "pop %"_tmp"; " \
  255. "orl %"_LO32 _tmp",("_STK"); " \
  256. "popf; " \
  257. "pop %"_sav"; "
  258. /* After executing instruction: write-back necessary bits in EFLAGS. */
  259. #define _POST_EFLAGS(_sav, _msk, _tmp) \
  260. /* _sav |= EFLAGS & _msk; */ \
  261. "pushf; " \
  262. "pop %"_tmp"; " \
  263. "andl %"_msk",%"_LO32 _tmp"; " \
  264. "orl %"_LO32 _tmp",%"_sav"; "
  265. #ifdef CONFIG_X86_64
  266. #define ON64(x) x
  267. #else
  268. #define ON64(x)
  269. #endif
  270. #define ____emulate_2op(ctxt, _op, _x, _y, _suffix, _dsttype) \
  271. do { \
  272. __asm__ __volatile__ ( \
  273. _PRE_EFLAGS("0", "4", "2") \
  274. _op _suffix " %"_x"3,%1; " \
  275. _POST_EFLAGS("0", "4", "2") \
  276. : "=m" ((ctxt)->eflags), \
  277. "+q" (*(_dsttype*)&(ctxt)->dst.val), \
  278. "=&r" (_tmp) \
  279. : _y ((ctxt)->src.val), "i" (EFLAGS_MASK)); \
  280. } while (0)
  281. /* Raw emulation: instruction has two explicit operands. */
  282. #define __emulate_2op_nobyte(ctxt,_op,_wx,_wy,_lx,_ly,_qx,_qy) \
  283. do { \
  284. unsigned long _tmp; \
  285. \
  286. switch ((ctxt)->dst.bytes) { \
  287. case 2: \
  288. ____emulate_2op(ctxt,_op,_wx,_wy,"w",u16); \
  289. break; \
  290. case 4: \
  291. ____emulate_2op(ctxt,_op,_lx,_ly,"l",u32); \
  292. break; \
  293. case 8: \
  294. ON64(____emulate_2op(ctxt,_op,_qx,_qy,"q",u64)); \
  295. break; \
  296. } \
  297. } while (0)
  298. #define __emulate_2op(ctxt,_op,_bx,_by,_wx,_wy,_lx,_ly,_qx,_qy) \
  299. do { \
  300. unsigned long _tmp; \
  301. switch ((ctxt)->dst.bytes) { \
  302. case 1: \
  303. ____emulate_2op(ctxt,_op,_bx,_by,"b",u8); \
  304. break; \
  305. default: \
  306. __emulate_2op_nobyte(ctxt, _op, \
  307. _wx, _wy, _lx, _ly, _qx, _qy); \
  308. break; \
  309. } \
  310. } while (0)
  311. /* Source operand is byte-sized and may be restricted to just %cl. */
  312. #define emulate_2op_SrcB(ctxt, _op) \
  313. __emulate_2op(ctxt, _op, "b", "c", "b", "c", "b", "c", "b", "c")
  314. /* Source operand is byte, word, long or quad sized. */
  315. #define emulate_2op_SrcV(ctxt, _op) \
  316. __emulate_2op(ctxt, _op, "b", "q", "w", "r", _LO32, "r", "", "r")
  317. /* Source operand is word, long or quad sized. */
  318. #define emulate_2op_SrcV_nobyte(ctxt, _op) \
  319. __emulate_2op_nobyte(ctxt, _op, "w", "r", _LO32, "r", "", "r")
  320. /* Instruction has three operands and one operand is stored in ECX register */
  321. #define __emulate_2op_cl(ctxt, _op, _suffix, _type) \
  322. do { \
  323. unsigned long _tmp; \
  324. _type _clv = (ctxt)->src2.val; \
  325. _type _srcv = (ctxt)->src.val; \
  326. _type _dstv = (ctxt)->dst.val; \
  327. \
  328. __asm__ __volatile__ ( \
  329. _PRE_EFLAGS("0", "5", "2") \
  330. _op _suffix " %4,%1 \n" \
  331. _POST_EFLAGS("0", "5", "2") \
  332. : "=m" ((ctxt)->eflags), "+r" (_dstv), "=&r" (_tmp) \
  333. : "c" (_clv) , "r" (_srcv), "i" (EFLAGS_MASK) \
  334. ); \
  335. \
  336. (ctxt)->src2.val = (unsigned long) _clv; \
  337. (ctxt)->src2.val = (unsigned long) _srcv; \
  338. (ctxt)->dst.val = (unsigned long) _dstv; \
  339. } while (0)
  340. #define emulate_2op_cl(ctxt, _op) \
  341. do { \
  342. switch ((ctxt)->dst.bytes) { \
  343. case 2: \
  344. __emulate_2op_cl(ctxt, _op, "w", u16); \
  345. break; \
  346. case 4: \
  347. __emulate_2op_cl(ctxt, _op, "l", u32); \
  348. break; \
  349. case 8: \
  350. ON64(__emulate_2op_cl(ctxt, _op, "q", ulong)); \
  351. break; \
  352. } \
  353. } while (0)
  354. #define __emulate_1op(ctxt, _op, _suffix) \
  355. do { \
  356. unsigned long _tmp; \
  357. \
  358. __asm__ __volatile__ ( \
  359. _PRE_EFLAGS("0", "3", "2") \
  360. _op _suffix " %1; " \
  361. _POST_EFLAGS("0", "3", "2") \
  362. : "=m" ((ctxt)->eflags), "+m" ((ctxt)->dst.val), \
  363. "=&r" (_tmp) \
  364. : "i" (EFLAGS_MASK)); \
  365. } while (0)
  366. /* Instruction has only one explicit operand (no source operand). */
  367. #define emulate_1op(ctxt, _op) \
  368. do { \
  369. switch ((ctxt)->dst.bytes) { \
  370. case 1: __emulate_1op(ctxt, _op, "b"); break; \
  371. case 2: __emulate_1op(ctxt, _op, "w"); break; \
  372. case 4: __emulate_1op(ctxt, _op, "l"); break; \
  373. case 8: ON64(__emulate_1op(ctxt, _op, "q")); break; \
  374. } \
  375. } while (0)
  376. #define __emulate_1op_rax_rdx(ctxt, _op, _suffix, _ex) \
  377. do { \
  378. unsigned long _tmp; \
  379. ulong *rax = reg_rmw((ctxt), VCPU_REGS_RAX); \
  380. ulong *rdx = reg_rmw((ctxt), VCPU_REGS_RDX); \
  381. \
  382. __asm__ __volatile__ ( \
  383. _PRE_EFLAGS("0", "5", "1") \
  384. "1: \n\t" \
  385. _op _suffix " %6; " \
  386. "2: \n\t" \
  387. _POST_EFLAGS("0", "5", "1") \
  388. ".pushsection .fixup,\"ax\" \n\t" \
  389. "3: movb $1, %4 \n\t" \
  390. "jmp 2b \n\t" \
  391. ".popsection \n\t" \
  392. _ASM_EXTABLE(1b, 3b) \
  393. : "=m" ((ctxt)->eflags), "=&r" (_tmp), \
  394. "+a" (*rax), "+d" (*rdx), "+qm"(_ex) \
  395. : "i" (EFLAGS_MASK), "m" ((ctxt)->src.val)); \
  396. } while (0)
  397. /* instruction has only one source operand, destination is implicit (e.g. mul, div, imul, idiv) */
  398. #define emulate_1op_rax_rdx(ctxt, _op, _ex) \
  399. do { \
  400. switch((ctxt)->src.bytes) { \
  401. case 1: \
  402. __emulate_1op_rax_rdx(ctxt, _op, "b", _ex); \
  403. break; \
  404. case 2: \
  405. __emulate_1op_rax_rdx(ctxt, _op, "w", _ex); \
  406. break; \
  407. case 4: \
  408. __emulate_1op_rax_rdx(ctxt, _op, "l", _ex); \
  409. break; \
  410. case 8: ON64( \
  411. __emulate_1op_rax_rdx(ctxt, _op, "q", _ex)); \
  412. break; \
  413. } \
  414. } while (0)
  415. static int emulator_check_intercept(struct x86_emulate_ctxt *ctxt,
  416. enum x86_intercept intercept,
  417. enum x86_intercept_stage stage)
  418. {
  419. struct x86_instruction_info info = {
  420. .intercept = intercept,
  421. .rep_prefix = ctxt->rep_prefix,
  422. .modrm_mod = ctxt->modrm_mod,
  423. .modrm_reg = ctxt->modrm_reg,
  424. .modrm_rm = ctxt->modrm_rm,
  425. .src_val = ctxt->src.val64,
  426. .src_bytes = ctxt->src.bytes,
  427. .dst_bytes = ctxt->dst.bytes,
  428. .ad_bytes = ctxt->ad_bytes,
  429. .next_rip = ctxt->eip,
  430. };
  431. return ctxt->ops->intercept(ctxt, &info, stage);
  432. }
  433. static void assign_masked(ulong *dest, ulong src, ulong mask)
  434. {
  435. *dest = (*dest & ~mask) | (src & mask);
  436. }
  437. static inline unsigned long ad_mask(struct x86_emulate_ctxt *ctxt)
  438. {
  439. return (1UL << (ctxt->ad_bytes << 3)) - 1;
  440. }
  441. static ulong stack_mask(struct x86_emulate_ctxt *ctxt)
  442. {
  443. u16 sel;
  444. struct desc_struct ss;
  445. if (ctxt->mode == X86EMUL_MODE_PROT64)
  446. return ~0UL;
  447. ctxt->ops->get_segment(ctxt, &sel, &ss, NULL, VCPU_SREG_SS);
  448. return ~0U >> ((ss.d ^ 1) * 16); /* d=0: 0xffff; d=1: 0xffffffff */
  449. }
  450. static int stack_size(struct x86_emulate_ctxt *ctxt)
  451. {
  452. return (__fls(stack_mask(ctxt)) + 1) >> 3;
  453. }
  454. /* Access/update address held in a register, based on addressing mode. */
  455. static inline unsigned long
  456. address_mask(struct x86_emulate_ctxt *ctxt, unsigned long reg)
  457. {
  458. if (ctxt->ad_bytes == sizeof(unsigned long))
  459. return reg;
  460. else
  461. return reg & ad_mask(ctxt);
  462. }
  463. static inline unsigned long
  464. register_address(struct x86_emulate_ctxt *ctxt, unsigned long reg)
  465. {
  466. return address_mask(ctxt, reg);
  467. }
  468. static void masked_increment(ulong *reg, ulong mask, int inc)
  469. {
  470. assign_masked(reg, *reg + inc, mask);
  471. }
  472. static inline void
  473. register_address_increment(struct x86_emulate_ctxt *ctxt, unsigned long *reg, int inc)
  474. {
  475. ulong mask;
  476. if (ctxt->ad_bytes == sizeof(unsigned long))
  477. mask = ~0UL;
  478. else
  479. mask = ad_mask(ctxt);
  480. masked_increment(reg, mask, inc);
  481. }
  482. static void rsp_increment(struct x86_emulate_ctxt *ctxt, int inc)
  483. {
  484. masked_increment(reg_rmw(ctxt, VCPU_REGS_RSP), stack_mask(ctxt), inc);
  485. }
  486. static inline void jmp_rel(struct x86_emulate_ctxt *ctxt, int rel)
  487. {
  488. register_address_increment(ctxt, &ctxt->_eip, rel);
  489. }
  490. static u32 desc_limit_scaled(struct desc_struct *desc)
  491. {
  492. u32 limit = get_desc_limit(desc);
  493. return desc->g ? (limit << 12) | 0xfff : limit;
  494. }
  495. static void set_seg_override(struct x86_emulate_ctxt *ctxt, int seg)
  496. {
  497. ctxt->has_seg_override = true;
  498. ctxt->seg_override = seg;
  499. }
  500. static unsigned long seg_base(struct x86_emulate_ctxt *ctxt, int seg)
  501. {
  502. if (ctxt->mode == X86EMUL_MODE_PROT64 && seg < VCPU_SREG_FS)
  503. return 0;
  504. return ctxt->ops->get_cached_segment_base(ctxt, seg);
  505. }
  506. static unsigned seg_override(struct x86_emulate_ctxt *ctxt)
  507. {
  508. if (!ctxt->has_seg_override)
  509. return 0;
  510. return ctxt->seg_override;
  511. }
  512. static int emulate_exception(struct x86_emulate_ctxt *ctxt, int vec,
  513. u32 error, bool valid)
  514. {
  515. ctxt->exception.vector = vec;
  516. ctxt->exception.error_code = error;
  517. ctxt->exception.error_code_valid = valid;
  518. return X86EMUL_PROPAGATE_FAULT;
  519. }
  520. static int emulate_db(struct x86_emulate_ctxt *ctxt)
  521. {
  522. return emulate_exception(ctxt, DB_VECTOR, 0, false);
  523. }
  524. static int emulate_gp(struct x86_emulate_ctxt *ctxt, int err)
  525. {
  526. return emulate_exception(ctxt, GP_VECTOR, err, true);
  527. }
  528. static int emulate_ss(struct x86_emulate_ctxt *ctxt, int err)
  529. {
  530. return emulate_exception(ctxt, SS_VECTOR, err, true);
  531. }
  532. static int emulate_ud(struct x86_emulate_ctxt *ctxt)
  533. {
  534. return emulate_exception(ctxt, UD_VECTOR, 0, false);
  535. }
  536. static int emulate_ts(struct x86_emulate_ctxt *ctxt, int err)
  537. {
  538. return emulate_exception(ctxt, TS_VECTOR, err, true);
  539. }
  540. static int emulate_de(struct x86_emulate_ctxt *ctxt)
  541. {
  542. return emulate_exception(ctxt, DE_VECTOR, 0, false);
  543. }
  544. static int emulate_nm(struct x86_emulate_ctxt *ctxt)
  545. {
  546. return emulate_exception(ctxt, NM_VECTOR, 0, false);
  547. }
  548. static u16 get_segment_selector(struct x86_emulate_ctxt *ctxt, unsigned seg)
  549. {
  550. u16 selector;
  551. struct desc_struct desc;
  552. ctxt->ops->get_segment(ctxt, &selector, &desc, NULL, seg);
  553. return selector;
  554. }
  555. static void set_segment_selector(struct x86_emulate_ctxt *ctxt, u16 selector,
  556. unsigned seg)
  557. {
  558. u16 dummy;
  559. u32 base3;
  560. struct desc_struct desc;
  561. ctxt->ops->get_segment(ctxt, &dummy, &desc, &base3, seg);
  562. ctxt->ops->set_segment(ctxt, selector, &desc, base3, seg);
  563. }
  564. /*
  565. * x86 defines three classes of vector instructions: explicitly
  566. * aligned, explicitly unaligned, and the rest, which change behaviour
  567. * depending on whether they're AVX encoded or not.
  568. *
  569. * Also included is CMPXCHG16B which is not a vector instruction, yet it is
  570. * subject to the same check.
  571. */
  572. static bool insn_aligned(struct x86_emulate_ctxt *ctxt, unsigned size)
  573. {
  574. if (likely(size < 16))
  575. return false;
  576. if (ctxt->d & Aligned)
  577. return true;
  578. else if (ctxt->d & Unaligned)
  579. return false;
  580. else if (ctxt->d & Avx)
  581. return false;
  582. else
  583. return true;
  584. }
  585. static int __linearize(struct x86_emulate_ctxt *ctxt,
  586. struct segmented_address addr,
  587. unsigned size, bool write, bool fetch,
  588. ulong *linear)
  589. {
  590. struct desc_struct desc;
  591. bool usable;
  592. ulong la;
  593. u32 lim;
  594. u16 sel;
  595. unsigned cpl, rpl;
  596. la = seg_base(ctxt, addr.seg) + addr.ea;
  597. switch (ctxt->mode) {
  598. case X86EMUL_MODE_PROT64:
  599. if (((signed long)la << 16) >> 16 != la)
  600. return emulate_gp(ctxt, 0);
  601. break;
  602. default:
  603. usable = ctxt->ops->get_segment(ctxt, &sel, &desc, NULL,
  604. addr.seg);
  605. if (!usable)
  606. goto bad;
  607. /* code segment in protected mode or read-only data segment */
  608. if ((((ctxt->mode != X86EMUL_MODE_REAL) && (desc.type & 8))
  609. || !(desc.type & 2)) && write)
  610. goto bad;
  611. /* unreadable code segment */
  612. if (!fetch && (desc.type & 8) && !(desc.type & 2))
  613. goto bad;
  614. lim = desc_limit_scaled(&desc);
  615. if ((desc.type & 8) || !(desc.type & 4)) {
  616. /* expand-up segment */
  617. if (addr.ea > lim || (u32)(addr.ea + size - 1) > lim)
  618. goto bad;
  619. } else {
  620. /* expand-down segment */
  621. if (addr.ea <= lim || (u32)(addr.ea + size - 1) <= lim)
  622. goto bad;
  623. lim = desc.d ? 0xffffffff : 0xffff;
  624. if (addr.ea > lim || (u32)(addr.ea + size - 1) > lim)
  625. goto bad;
  626. }
  627. cpl = ctxt->ops->cpl(ctxt);
  628. if (ctxt->mode == X86EMUL_MODE_REAL)
  629. rpl = 0;
  630. else
  631. rpl = sel & 3;
  632. cpl = max(cpl, rpl);
  633. if (!(desc.type & 8)) {
  634. /* data segment */
  635. if (cpl > desc.dpl)
  636. goto bad;
  637. } else if ((desc.type & 8) && !(desc.type & 4)) {
  638. /* nonconforming code segment */
  639. if (cpl != desc.dpl)
  640. goto bad;
  641. } else if ((desc.type & 8) && (desc.type & 4)) {
  642. /* conforming code segment */
  643. if (cpl < desc.dpl)
  644. goto bad;
  645. }
  646. break;
  647. }
  648. if (fetch ? ctxt->mode != X86EMUL_MODE_PROT64 : ctxt->ad_bytes != 8)
  649. la &= (u32)-1;
  650. if (insn_aligned(ctxt, size) && ((la & (size - 1)) != 0))
  651. return emulate_gp(ctxt, 0);
  652. *linear = la;
  653. return X86EMUL_CONTINUE;
  654. bad:
  655. if (addr.seg == VCPU_SREG_SS)
  656. return emulate_ss(ctxt, sel);
  657. else
  658. return emulate_gp(ctxt, sel);
  659. }
  660. static int linearize(struct x86_emulate_ctxt *ctxt,
  661. struct segmented_address addr,
  662. unsigned size, bool write,
  663. ulong *linear)
  664. {
  665. return __linearize(ctxt, addr, size, write, false, linear);
  666. }
  667. static int segmented_read_std(struct x86_emulate_ctxt *ctxt,
  668. struct segmented_address addr,
  669. void *data,
  670. unsigned size)
  671. {
  672. int rc;
  673. ulong linear;
  674. rc = linearize(ctxt, addr, size, false, &linear);
  675. if (rc != X86EMUL_CONTINUE)
  676. return rc;
  677. return ctxt->ops->read_std(ctxt, linear, data, size, &ctxt->exception);
  678. }
  679. /*
  680. * Fetch the next byte of the instruction being emulated which is pointed to
  681. * by ctxt->_eip, then increment ctxt->_eip.
  682. *
  683. * Also prefetch the remaining bytes of the instruction without crossing page
  684. * boundary if they are not in fetch_cache yet.
  685. */
  686. static int do_insn_fetch_byte(struct x86_emulate_ctxt *ctxt, u8 *dest)
  687. {
  688. struct fetch_cache *fc = &ctxt->fetch;
  689. int rc;
  690. int size, cur_size;
  691. if (ctxt->_eip == fc->end) {
  692. unsigned long linear;
  693. struct segmented_address addr = { .seg = VCPU_SREG_CS,
  694. .ea = ctxt->_eip };
  695. cur_size = fc->end - fc->start;
  696. size = min(15UL - cur_size,
  697. PAGE_SIZE - offset_in_page(ctxt->_eip));
  698. rc = __linearize(ctxt, addr, size, false, true, &linear);
  699. if (unlikely(rc != X86EMUL_CONTINUE))
  700. return rc;
  701. rc = ctxt->ops->fetch(ctxt, linear, fc->data + cur_size,
  702. size, &ctxt->exception);
  703. if (unlikely(rc != X86EMUL_CONTINUE))
  704. return rc;
  705. fc->end += size;
  706. }
  707. *dest = fc->data[ctxt->_eip - fc->start];
  708. ctxt->_eip++;
  709. return X86EMUL_CONTINUE;
  710. }
  711. static int do_insn_fetch(struct x86_emulate_ctxt *ctxt,
  712. void *dest, unsigned size)
  713. {
  714. int rc;
  715. /* x86 instructions are limited to 15 bytes. */
  716. if (unlikely(ctxt->_eip + size - ctxt->eip > 15))
  717. return X86EMUL_UNHANDLEABLE;
  718. while (size--) {
  719. rc = do_insn_fetch_byte(ctxt, dest++);
  720. if (rc != X86EMUL_CONTINUE)
  721. return rc;
  722. }
  723. return X86EMUL_CONTINUE;
  724. }
  725. /* Fetch next part of the instruction being emulated. */
  726. #define insn_fetch(_type, _ctxt) \
  727. ({ unsigned long _x; \
  728. rc = do_insn_fetch(_ctxt, &_x, sizeof(_type)); \
  729. if (rc != X86EMUL_CONTINUE) \
  730. goto done; \
  731. (_type)_x; \
  732. })
  733. #define insn_fetch_arr(_arr, _size, _ctxt) \
  734. ({ rc = do_insn_fetch(_ctxt, _arr, (_size)); \
  735. if (rc != X86EMUL_CONTINUE) \
  736. goto done; \
  737. })
  738. /*
  739. * Given the 'reg' portion of a ModRM byte, and a register block, return a
  740. * pointer into the block that addresses the relevant register.
  741. * @highbyte_regs specifies whether to decode AH,CH,DH,BH.
  742. */
  743. static void *decode_register(struct x86_emulate_ctxt *ctxt, u8 modrm_reg,
  744. int highbyte_regs)
  745. {
  746. void *p;
  747. if (highbyte_regs && modrm_reg >= 4 && modrm_reg < 8)
  748. p = (unsigned char *)reg_rmw(ctxt, modrm_reg & 3) + 1;
  749. else
  750. p = reg_rmw(ctxt, modrm_reg);
  751. return p;
  752. }
  753. static int read_descriptor(struct x86_emulate_ctxt *ctxt,
  754. struct segmented_address addr,
  755. u16 *size, unsigned long *address, int op_bytes)
  756. {
  757. int rc;
  758. if (op_bytes == 2)
  759. op_bytes = 3;
  760. *address = 0;
  761. rc = segmented_read_std(ctxt, addr, size, 2);
  762. if (rc != X86EMUL_CONTINUE)
  763. return rc;
  764. addr.ea += 2;
  765. rc = segmented_read_std(ctxt, addr, address, op_bytes);
  766. return rc;
  767. }
  768. static int test_cc(unsigned int condition, unsigned int flags)
  769. {
  770. int rc = 0;
  771. switch ((condition & 15) >> 1) {
  772. case 0: /* o */
  773. rc |= (flags & EFLG_OF);
  774. break;
  775. case 1: /* b/c/nae */
  776. rc |= (flags & EFLG_CF);
  777. break;
  778. case 2: /* z/e */
  779. rc |= (flags & EFLG_ZF);
  780. break;
  781. case 3: /* be/na */
  782. rc |= (flags & (EFLG_CF|EFLG_ZF));
  783. break;
  784. case 4: /* s */
  785. rc |= (flags & EFLG_SF);
  786. break;
  787. case 5: /* p/pe */
  788. rc |= (flags & EFLG_PF);
  789. break;
  790. case 7: /* le/ng */
  791. rc |= (flags & EFLG_ZF);
  792. /* fall through */
  793. case 6: /* l/nge */
  794. rc |= (!(flags & EFLG_SF) != !(flags & EFLG_OF));
  795. break;
  796. }
  797. /* Odd condition identifiers (lsb == 1) have inverted sense. */
  798. return (!!rc ^ (condition & 1));
  799. }
  800. static void fetch_register_operand(struct operand *op)
  801. {
  802. switch (op->bytes) {
  803. case 1:
  804. op->val = *(u8 *)op->addr.reg;
  805. break;
  806. case 2:
  807. op->val = *(u16 *)op->addr.reg;
  808. break;
  809. case 4:
  810. op->val = *(u32 *)op->addr.reg;
  811. break;
  812. case 8:
  813. op->val = *(u64 *)op->addr.reg;
  814. break;
  815. }
  816. }
  817. static void read_sse_reg(struct x86_emulate_ctxt *ctxt, sse128_t *data, int reg)
  818. {
  819. ctxt->ops->get_fpu(ctxt);
  820. switch (reg) {
  821. case 0: asm("movdqa %%xmm0, %0" : "=m"(*data)); break;
  822. case 1: asm("movdqa %%xmm1, %0" : "=m"(*data)); break;
  823. case 2: asm("movdqa %%xmm2, %0" : "=m"(*data)); break;
  824. case 3: asm("movdqa %%xmm3, %0" : "=m"(*data)); break;
  825. case 4: asm("movdqa %%xmm4, %0" : "=m"(*data)); break;
  826. case 5: asm("movdqa %%xmm5, %0" : "=m"(*data)); break;
  827. case 6: asm("movdqa %%xmm6, %0" : "=m"(*data)); break;
  828. case 7: asm("movdqa %%xmm7, %0" : "=m"(*data)); break;
  829. #ifdef CONFIG_X86_64
  830. case 8: asm("movdqa %%xmm8, %0" : "=m"(*data)); break;
  831. case 9: asm("movdqa %%xmm9, %0" : "=m"(*data)); break;
  832. case 10: asm("movdqa %%xmm10, %0" : "=m"(*data)); break;
  833. case 11: asm("movdqa %%xmm11, %0" : "=m"(*data)); break;
  834. case 12: asm("movdqa %%xmm12, %0" : "=m"(*data)); break;
  835. case 13: asm("movdqa %%xmm13, %0" : "=m"(*data)); break;
  836. case 14: asm("movdqa %%xmm14, %0" : "=m"(*data)); break;
  837. case 15: asm("movdqa %%xmm15, %0" : "=m"(*data)); break;
  838. #endif
  839. default: BUG();
  840. }
  841. ctxt->ops->put_fpu(ctxt);
  842. }
  843. static void write_sse_reg(struct x86_emulate_ctxt *ctxt, sse128_t *data,
  844. int reg)
  845. {
  846. ctxt->ops->get_fpu(ctxt);
  847. switch (reg) {
  848. case 0: asm("movdqa %0, %%xmm0" : : "m"(*data)); break;
  849. case 1: asm("movdqa %0, %%xmm1" : : "m"(*data)); break;
  850. case 2: asm("movdqa %0, %%xmm2" : : "m"(*data)); break;
  851. case 3: asm("movdqa %0, %%xmm3" : : "m"(*data)); break;
  852. case 4: asm("movdqa %0, %%xmm4" : : "m"(*data)); break;
  853. case 5: asm("movdqa %0, %%xmm5" : : "m"(*data)); break;
  854. case 6: asm("movdqa %0, %%xmm6" : : "m"(*data)); break;
  855. case 7: asm("movdqa %0, %%xmm7" : : "m"(*data)); break;
  856. #ifdef CONFIG_X86_64
  857. case 8: asm("movdqa %0, %%xmm8" : : "m"(*data)); break;
  858. case 9: asm("movdqa %0, %%xmm9" : : "m"(*data)); break;
  859. case 10: asm("movdqa %0, %%xmm10" : : "m"(*data)); break;
  860. case 11: asm("movdqa %0, %%xmm11" : : "m"(*data)); break;
  861. case 12: asm("movdqa %0, %%xmm12" : : "m"(*data)); break;
  862. case 13: asm("movdqa %0, %%xmm13" : : "m"(*data)); break;
  863. case 14: asm("movdqa %0, %%xmm14" : : "m"(*data)); break;
  864. case 15: asm("movdqa %0, %%xmm15" : : "m"(*data)); break;
  865. #endif
  866. default: BUG();
  867. }
  868. ctxt->ops->put_fpu(ctxt);
  869. }
  870. static void read_mmx_reg(struct x86_emulate_ctxt *ctxt, u64 *data, int reg)
  871. {
  872. ctxt->ops->get_fpu(ctxt);
  873. switch (reg) {
  874. case 0: asm("movq %%mm0, %0" : "=m"(*data)); break;
  875. case 1: asm("movq %%mm1, %0" : "=m"(*data)); break;
  876. case 2: asm("movq %%mm2, %0" : "=m"(*data)); break;
  877. case 3: asm("movq %%mm3, %0" : "=m"(*data)); break;
  878. case 4: asm("movq %%mm4, %0" : "=m"(*data)); break;
  879. case 5: asm("movq %%mm5, %0" : "=m"(*data)); break;
  880. case 6: asm("movq %%mm6, %0" : "=m"(*data)); break;
  881. case 7: asm("movq %%mm7, %0" : "=m"(*data)); break;
  882. default: BUG();
  883. }
  884. ctxt->ops->put_fpu(ctxt);
  885. }
  886. static void write_mmx_reg(struct x86_emulate_ctxt *ctxt, u64 *data, int reg)
  887. {
  888. ctxt->ops->get_fpu(ctxt);
  889. switch (reg) {
  890. case 0: asm("movq %0, %%mm0" : : "m"(*data)); break;
  891. case 1: asm("movq %0, %%mm1" : : "m"(*data)); break;
  892. case 2: asm("movq %0, %%mm2" : : "m"(*data)); break;
  893. case 3: asm("movq %0, %%mm3" : : "m"(*data)); break;
  894. case 4: asm("movq %0, %%mm4" : : "m"(*data)); break;
  895. case 5: asm("movq %0, %%mm5" : : "m"(*data)); break;
  896. case 6: asm("movq %0, %%mm6" : : "m"(*data)); break;
  897. case 7: asm("movq %0, %%mm7" : : "m"(*data)); break;
  898. default: BUG();
  899. }
  900. ctxt->ops->put_fpu(ctxt);
  901. }
  902. static void decode_register_operand(struct x86_emulate_ctxt *ctxt,
  903. struct operand *op)
  904. {
  905. unsigned reg = ctxt->modrm_reg;
  906. int highbyte_regs = ctxt->rex_prefix == 0;
  907. if (!(ctxt->d & ModRM))
  908. reg = (ctxt->b & 7) | ((ctxt->rex_prefix & 1) << 3);
  909. if (ctxt->d & Sse) {
  910. op->type = OP_XMM;
  911. op->bytes = 16;
  912. op->addr.xmm = reg;
  913. read_sse_reg(ctxt, &op->vec_val, reg);
  914. return;
  915. }
  916. if (ctxt->d & Mmx) {
  917. reg &= 7;
  918. op->type = OP_MM;
  919. op->bytes = 8;
  920. op->addr.mm = reg;
  921. return;
  922. }
  923. op->type = OP_REG;
  924. if (ctxt->d & ByteOp) {
  925. op->addr.reg = decode_register(ctxt, reg, highbyte_regs);
  926. op->bytes = 1;
  927. } else {
  928. op->addr.reg = decode_register(ctxt, reg, 0);
  929. op->bytes = ctxt->op_bytes;
  930. }
  931. fetch_register_operand(op);
  932. op->orig_val = op->val;
  933. }
  934. static void adjust_modrm_seg(struct x86_emulate_ctxt *ctxt, int base_reg)
  935. {
  936. if (base_reg == VCPU_REGS_RSP || base_reg == VCPU_REGS_RBP)
  937. ctxt->modrm_seg = VCPU_SREG_SS;
  938. }
  939. static int decode_modrm(struct x86_emulate_ctxt *ctxt,
  940. struct operand *op)
  941. {
  942. u8 sib;
  943. int index_reg = 0, base_reg = 0, scale;
  944. int rc = X86EMUL_CONTINUE;
  945. ulong modrm_ea = 0;
  946. if (ctxt->rex_prefix) {
  947. ctxt->modrm_reg = (ctxt->rex_prefix & 4) << 1; /* REX.R */
  948. index_reg = (ctxt->rex_prefix & 2) << 2; /* REX.X */
  949. ctxt->modrm_rm = base_reg = (ctxt->rex_prefix & 1) << 3; /* REG.B */
  950. }
  951. ctxt->modrm_mod |= (ctxt->modrm & 0xc0) >> 6;
  952. ctxt->modrm_reg |= (ctxt->modrm & 0x38) >> 3;
  953. ctxt->modrm_rm |= (ctxt->modrm & 0x07);
  954. ctxt->modrm_seg = VCPU_SREG_DS;
  955. if (ctxt->modrm_mod == 3) {
  956. op->type = OP_REG;
  957. op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  958. op->addr.reg = decode_register(ctxt, ctxt->modrm_rm, ctxt->d & ByteOp);
  959. if (ctxt->d & Sse) {
  960. op->type = OP_XMM;
  961. op->bytes = 16;
  962. op->addr.xmm = ctxt->modrm_rm;
  963. read_sse_reg(ctxt, &op->vec_val, ctxt->modrm_rm);
  964. return rc;
  965. }
  966. if (ctxt->d & Mmx) {
  967. op->type = OP_MM;
  968. op->bytes = 8;
  969. op->addr.xmm = ctxt->modrm_rm & 7;
  970. return rc;
  971. }
  972. fetch_register_operand(op);
  973. return rc;
  974. }
  975. op->type = OP_MEM;
  976. if (ctxt->ad_bytes == 2) {
  977. unsigned bx = reg_read(ctxt, VCPU_REGS_RBX);
  978. unsigned bp = reg_read(ctxt, VCPU_REGS_RBP);
  979. unsigned si = reg_read(ctxt, VCPU_REGS_RSI);
  980. unsigned di = reg_read(ctxt, VCPU_REGS_RDI);
  981. /* 16-bit ModR/M decode. */
  982. switch (ctxt->modrm_mod) {
  983. case 0:
  984. if (ctxt->modrm_rm == 6)
  985. modrm_ea += insn_fetch(u16, ctxt);
  986. break;
  987. case 1:
  988. modrm_ea += insn_fetch(s8, ctxt);
  989. break;
  990. case 2:
  991. modrm_ea += insn_fetch(u16, ctxt);
  992. break;
  993. }
  994. switch (ctxt->modrm_rm) {
  995. case 0:
  996. modrm_ea += bx + si;
  997. break;
  998. case 1:
  999. modrm_ea += bx + di;
  1000. break;
  1001. case 2:
  1002. modrm_ea += bp + si;
  1003. break;
  1004. case 3:
  1005. modrm_ea += bp + di;
  1006. break;
  1007. case 4:
  1008. modrm_ea += si;
  1009. break;
  1010. case 5:
  1011. modrm_ea += di;
  1012. break;
  1013. case 6:
  1014. if (ctxt->modrm_mod != 0)
  1015. modrm_ea += bp;
  1016. break;
  1017. case 7:
  1018. modrm_ea += bx;
  1019. break;
  1020. }
  1021. if (ctxt->modrm_rm == 2 || ctxt->modrm_rm == 3 ||
  1022. (ctxt->modrm_rm == 6 && ctxt->modrm_mod != 0))
  1023. ctxt->modrm_seg = VCPU_SREG_SS;
  1024. modrm_ea = (u16)modrm_ea;
  1025. } else {
  1026. /* 32/64-bit ModR/M decode. */
  1027. if ((ctxt->modrm_rm & 7) == 4) {
  1028. sib = insn_fetch(u8, ctxt);
  1029. index_reg |= (sib >> 3) & 7;
  1030. base_reg |= sib & 7;
  1031. scale = sib >> 6;
  1032. if ((base_reg & 7) == 5 && ctxt->modrm_mod == 0)
  1033. modrm_ea += insn_fetch(s32, ctxt);
  1034. else {
  1035. modrm_ea += reg_read(ctxt, base_reg);
  1036. adjust_modrm_seg(ctxt, base_reg);
  1037. }
  1038. if (index_reg != 4)
  1039. modrm_ea += reg_read(ctxt, index_reg) << scale;
  1040. } else if ((ctxt->modrm_rm & 7) == 5 && ctxt->modrm_mod == 0) {
  1041. if (ctxt->mode == X86EMUL_MODE_PROT64)
  1042. ctxt->rip_relative = 1;
  1043. } else {
  1044. base_reg = ctxt->modrm_rm;
  1045. modrm_ea += reg_read(ctxt, base_reg);
  1046. adjust_modrm_seg(ctxt, base_reg);
  1047. }
  1048. switch (ctxt->modrm_mod) {
  1049. case 0:
  1050. if (ctxt->modrm_rm == 5)
  1051. modrm_ea += insn_fetch(s32, ctxt);
  1052. break;
  1053. case 1:
  1054. modrm_ea += insn_fetch(s8, ctxt);
  1055. break;
  1056. case 2:
  1057. modrm_ea += insn_fetch(s32, ctxt);
  1058. break;
  1059. }
  1060. }
  1061. op->addr.mem.ea = modrm_ea;
  1062. done:
  1063. return rc;
  1064. }
  1065. static int decode_abs(struct x86_emulate_ctxt *ctxt,
  1066. struct operand *op)
  1067. {
  1068. int rc = X86EMUL_CONTINUE;
  1069. op->type = OP_MEM;
  1070. switch (ctxt->ad_bytes) {
  1071. case 2:
  1072. op->addr.mem.ea = insn_fetch(u16, ctxt);
  1073. break;
  1074. case 4:
  1075. op->addr.mem.ea = insn_fetch(u32, ctxt);
  1076. break;
  1077. case 8:
  1078. op->addr.mem.ea = insn_fetch(u64, ctxt);
  1079. break;
  1080. }
  1081. done:
  1082. return rc;
  1083. }
  1084. static void fetch_bit_operand(struct x86_emulate_ctxt *ctxt)
  1085. {
  1086. long sv = 0, mask;
  1087. if (ctxt->dst.type == OP_MEM && ctxt->src.type == OP_REG) {
  1088. mask = ~(ctxt->dst.bytes * 8 - 1);
  1089. if (ctxt->src.bytes == 2)
  1090. sv = (s16)ctxt->src.val & (s16)mask;
  1091. else if (ctxt->src.bytes == 4)
  1092. sv = (s32)ctxt->src.val & (s32)mask;
  1093. ctxt->dst.addr.mem.ea += (sv >> 3);
  1094. }
  1095. /* only subword offset */
  1096. ctxt->src.val &= (ctxt->dst.bytes << 3) - 1;
  1097. }
  1098. static int read_emulated(struct x86_emulate_ctxt *ctxt,
  1099. unsigned long addr, void *dest, unsigned size)
  1100. {
  1101. int rc;
  1102. struct read_cache *mc = &ctxt->mem_read;
  1103. if (mc->pos < mc->end)
  1104. goto read_cached;
  1105. WARN_ON((mc->end + size) >= sizeof(mc->data));
  1106. rc = ctxt->ops->read_emulated(ctxt, addr, mc->data + mc->end, size,
  1107. &ctxt->exception);
  1108. if (rc != X86EMUL_CONTINUE)
  1109. return rc;
  1110. mc->end += size;
  1111. read_cached:
  1112. memcpy(dest, mc->data + mc->pos, size);
  1113. mc->pos += size;
  1114. return X86EMUL_CONTINUE;
  1115. }
  1116. static int segmented_read(struct x86_emulate_ctxt *ctxt,
  1117. struct segmented_address addr,
  1118. void *data,
  1119. unsigned size)
  1120. {
  1121. int rc;
  1122. ulong linear;
  1123. rc = linearize(ctxt, addr, size, false, &linear);
  1124. if (rc != X86EMUL_CONTINUE)
  1125. return rc;
  1126. return read_emulated(ctxt, linear, data, size);
  1127. }
  1128. static int segmented_write(struct x86_emulate_ctxt *ctxt,
  1129. struct segmented_address addr,
  1130. const void *data,
  1131. unsigned size)
  1132. {
  1133. int rc;
  1134. ulong linear;
  1135. rc = linearize(ctxt, addr, size, true, &linear);
  1136. if (rc != X86EMUL_CONTINUE)
  1137. return rc;
  1138. return ctxt->ops->write_emulated(ctxt, linear, data, size,
  1139. &ctxt->exception);
  1140. }
  1141. static int segmented_cmpxchg(struct x86_emulate_ctxt *ctxt,
  1142. struct segmented_address addr,
  1143. const void *orig_data, const void *data,
  1144. unsigned size)
  1145. {
  1146. int rc;
  1147. ulong linear;
  1148. rc = linearize(ctxt, addr, size, true, &linear);
  1149. if (rc != X86EMUL_CONTINUE)
  1150. return rc;
  1151. return ctxt->ops->cmpxchg_emulated(ctxt, linear, orig_data, data,
  1152. size, &ctxt->exception);
  1153. }
  1154. static int pio_in_emulated(struct x86_emulate_ctxt *ctxt,
  1155. unsigned int size, unsigned short port,
  1156. void *dest)
  1157. {
  1158. struct read_cache *rc = &ctxt->io_read;
  1159. if (rc->pos == rc->end) { /* refill pio read ahead */
  1160. unsigned int in_page, n;
  1161. unsigned int count = ctxt->rep_prefix ?
  1162. address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) : 1;
  1163. in_page = (ctxt->eflags & EFLG_DF) ?
  1164. offset_in_page(reg_read(ctxt, VCPU_REGS_RDI)) :
  1165. PAGE_SIZE - offset_in_page(reg_read(ctxt, VCPU_REGS_RDI));
  1166. n = min(min(in_page, (unsigned int)sizeof(rc->data)) / size,
  1167. count);
  1168. if (n == 0)
  1169. n = 1;
  1170. rc->pos = rc->end = 0;
  1171. if (!ctxt->ops->pio_in_emulated(ctxt, size, port, rc->data, n))
  1172. return 0;
  1173. rc->end = n * size;
  1174. }
  1175. if (ctxt->rep_prefix && !(ctxt->eflags & EFLG_DF)) {
  1176. ctxt->dst.data = rc->data + rc->pos;
  1177. ctxt->dst.type = OP_MEM_STR;
  1178. ctxt->dst.count = (rc->end - rc->pos) / size;
  1179. rc->pos = rc->end;
  1180. } else {
  1181. memcpy(dest, rc->data + rc->pos, size);
  1182. rc->pos += size;
  1183. }
  1184. return 1;
  1185. }
  1186. static int read_interrupt_descriptor(struct x86_emulate_ctxt *ctxt,
  1187. u16 index, struct desc_struct *desc)
  1188. {
  1189. struct desc_ptr dt;
  1190. ulong addr;
  1191. ctxt->ops->get_idt(ctxt, &dt);
  1192. if (dt.size < index * 8 + 7)
  1193. return emulate_gp(ctxt, index << 3 | 0x2);
  1194. addr = dt.address + index * 8;
  1195. return ctxt->ops->read_std(ctxt, addr, desc, sizeof *desc,
  1196. &ctxt->exception);
  1197. }
  1198. static void get_descriptor_table_ptr(struct x86_emulate_ctxt *ctxt,
  1199. u16 selector, struct desc_ptr *dt)
  1200. {
  1201. const struct x86_emulate_ops *ops = ctxt->ops;
  1202. if (selector & 1 << 2) {
  1203. struct desc_struct desc;
  1204. u16 sel;
  1205. memset (dt, 0, sizeof *dt);
  1206. if (!ops->get_segment(ctxt, &sel, &desc, NULL, VCPU_SREG_LDTR))
  1207. return;
  1208. dt->size = desc_limit_scaled(&desc); /* what if limit > 65535? */
  1209. dt->address = get_desc_base(&desc);
  1210. } else
  1211. ops->get_gdt(ctxt, dt);
  1212. }
  1213. /* allowed just for 8 bytes segments */
  1214. static int read_segment_descriptor(struct x86_emulate_ctxt *ctxt,
  1215. u16 selector, struct desc_struct *desc,
  1216. ulong *desc_addr_p)
  1217. {
  1218. struct desc_ptr dt;
  1219. u16 index = selector >> 3;
  1220. ulong addr;
  1221. get_descriptor_table_ptr(ctxt, selector, &dt);
  1222. if (dt.size < index * 8 + 7)
  1223. return emulate_gp(ctxt, selector & 0xfffc);
  1224. *desc_addr_p = addr = dt.address + index * 8;
  1225. return ctxt->ops->read_std(ctxt, addr, desc, sizeof *desc,
  1226. &ctxt->exception);
  1227. }
  1228. /* allowed just for 8 bytes segments */
  1229. static int write_segment_descriptor(struct x86_emulate_ctxt *ctxt,
  1230. u16 selector, struct desc_struct *desc)
  1231. {
  1232. struct desc_ptr dt;
  1233. u16 index = selector >> 3;
  1234. ulong addr;
  1235. get_descriptor_table_ptr(ctxt, selector, &dt);
  1236. if (dt.size < index * 8 + 7)
  1237. return emulate_gp(ctxt, selector & 0xfffc);
  1238. addr = dt.address + index * 8;
  1239. return ctxt->ops->write_std(ctxt, addr, desc, sizeof *desc,
  1240. &ctxt->exception);
  1241. }
  1242. /* Does not support long mode */
  1243. static int load_segment_descriptor(struct x86_emulate_ctxt *ctxt,
  1244. u16 selector, int seg)
  1245. {
  1246. struct desc_struct seg_desc, old_desc;
  1247. u8 dpl, rpl, cpl;
  1248. unsigned err_vec = GP_VECTOR;
  1249. u32 err_code = 0;
  1250. bool null_selector = !(selector & ~0x3); /* 0000-0003 are null */
  1251. ulong desc_addr;
  1252. int ret;
  1253. u16 dummy;
  1254. memset(&seg_desc, 0, sizeof seg_desc);
  1255. if ((seg <= VCPU_SREG_GS && ctxt->mode == X86EMUL_MODE_VM86)
  1256. || ctxt->mode == X86EMUL_MODE_REAL) {
  1257. /* set real mode segment descriptor */
  1258. ctxt->ops->get_segment(ctxt, &dummy, &seg_desc, NULL, seg);
  1259. set_desc_base(&seg_desc, selector << 4);
  1260. goto load;
  1261. }
  1262. rpl = selector & 3;
  1263. cpl = ctxt->ops->cpl(ctxt);
  1264. /* NULL selector is not valid for TR, CS and SS (except for long mode) */
  1265. if ((seg == VCPU_SREG_CS
  1266. || (seg == VCPU_SREG_SS
  1267. && (ctxt->mode != X86EMUL_MODE_PROT64 || rpl != cpl))
  1268. || seg == VCPU_SREG_TR)
  1269. && null_selector)
  1270. goto exception;
  1271. /* TR should be in GDT only */
  1272. if (seg == VCPU_SREG_TR && (selector & (1 << 2)))
  1273. goto exception;
  1274. if (null_selector) /* for NULL selector skip all following checks */
  1275. goto load;
  1276. ret = read_segment_descriptor(ctxt, selector, &seg_desc, &desc_addr);
  1277. if (ret != X86EMUL_CONTINUE)
  1278. return ret;
  1279. err_code = selector & 0xfffc;
  1280. err_vec = GP_VECTOR;
  1281. /* can't load system descriptor into segment selector */
  1282. if (seg <= VCPU_SREG_GS && !seg_desc.s)
  1283. goto exception;
  1284. if (!seg_desc.p) {
  1285. err_vec = (seg == VCPU_SREG_SS) ? SS_VECTOR : NP_VECTOR;
  1286. goto exception;
  1287. }
  1288. dpl = seg_desc.dpl;
  1289. switch (seg) {
  1290. case VCPU_SREG_SS:
  1291. /*
  1292. * segment is not a writable data segment or segment
  1293. * selector's RPL != CPL or segment selector's RPL != CPL
  1294. */
  1295. if (rpl != cpl || (seg_desc.type & 0xa) != 0x2 || dpl != cpl)
  1296. goto exception;
  1297. break;
  1298. case VCPU_SREG_CS:
  1299. if (!(seg_desc.type & 8))
  1300. goto exception;
  1301. if (seg_desc.type & 4) {
  1302. /* conforming */
  1303. if (dpl > cpl)
  1304. goto exception;
  1305. } else {
  1306. /* nonconforming */
  1307. if (rpl > cpl || dpl != cpl)
  1308. goto exception;
  1309. }
  1310. /* CS(RPL) <- CPL */
  1311. selector = (selector & 0xfffc) | cpl;
  1312. break;
  1313. case VCPU_SREG_TR:
  1314. if (seg_desc.s || (seg_desc.type != 1 && seg_desc.type != 9))
  1315. goto exception;
  1316. old_desc = seg_desc;
  1317. seg_desc.type |= 2; /* busy */
  1318. ret = ctxt->ops->cmpxchg_emulated(ctxt, desc_addr, &old_desc, &seg_desc,
  1319. sizeof(seg_desc), &ctxt->exception);
  1320. if (ret != X86EMUL_CONTINUE)
  1321. return ret;
  1322. break;
  1323. case VCPU_SREG_LDTR:
  1324. if (seg_desc.s || seg_desc.type != 2)
  1325. goto exception;
  1326. break;
  1327. default: /* DS, ES, FS, or GS */
  1328. /*
  1329. * segment is not a data or readable code segment or
  1330. * ((segment is a data or nonconforming code segment)
  1331. * and (both RPL and CPL > DPL))
  1332. */
  1333. if ((seg_desc.type & 0xa) == 0x8 ||
  1334. (((seg_desc.type & 0xc) != 0xc) &&
  1335. (rpl > dpl && cpl > dpl)))
  1336. goto exception;
  1337. break;
  1338. }
  1339. if (seg_desc.s) {
  1340. /* mark segment as accessed */
  1341. seg_desc.type |= 1;
  1342. ret = write_segment_descriptor(ctxt, selector, &seg_desc);
  1343. if (ret != X86EMUL_CONTINUE)
  1344. return ret;
  1345. }
  1346. load:
  1347. ctxt->ops->set_segment(ctxt, selector, &seg_desc, 0, seg);
  1348. return X86EMUL_CONTINUE;
  1349. exception:
  1350. emulate_exception(ctxt, err_vec, err_code, true);
  1351. return X86EMUL_PROPAGATE_FAULT;
  1352. }
  1353. static void write_register_operand(struct operand *op)
  1354. {
  1355. /* The 4-byte case *is* correct: in 64-bit mode we zero-extend. */
  1356. switch (op->bytes) {
  1357. case 1:
  1358. *(u8 *)op->addr.reg = (u8)op->val;
  1359. break;
  1360. case 2:
  1361. *(u16 *)op->addr.reg = (u16)op->val;
  1362. break;
  1363. case 4:
  1364. *op->addr.reg = (u32)op->val;
  1365. break; /* 64b: zero-extend */
  1366. case 8:
  1367. *op->addr.reg = op->val;
  1368. break;
  1369. }
  1370. }
  1371. static int writeback(struct x86_emulate_ctxt *ctxt)
  1372. {
  1373. int rc;
  1374. switch (ctxt->dst.type) {
  1375. case OP_REG:
  1376. write_register_operand(&ctxt->dst);
  1377. break;
  1378. case OP_MEM:
  1379. if (ctxt->lock_prefix)
  1380. rc = segmented_cmpxchg(ctxt,
  1381. ctxt->dst.addr.mem,
  1382. &ctxt->dst.orig_val,
  1383. &ctxt->dst.val,
  1384. ctxt->dst.bytes);
  1385. else
  1386. rc = segmented_write(ctxt,
  1387. ctxt->dst.addr.mem,
  1388. &ctxt->dst.val,
  1389. ctxt->dst.bytes);
  1390. if (rc != X86EMUL_CONTINUE)
  1391. return rc;
  1392. break;
  1393. case OP_MEM_STR:
  1394. rc = segmented_write(ctxt,
  1395. ctxt->dst.addr.mem,
  1396. ctxt->dst.data,
  1397. ctxt->dst.bytes * ctxt->dst.count);
  1398. if (rc != X86EMUL_CONTINUE)
  1399. return rc;
  1400. break;
  1401. case OP_XMM:
  1402. write_sse_reg(ctxt, &ctxt->dst.vec_val, ctxt->dst.addr.xmm);
  1403. break;
  1404. case OP_MM:
  1405. write_mmx_reg(ctxt, &ctxt->dst.mm_val, ctxt->dst.addr.mm);
  1406. break;
  1407. case OP_NONE:
  1408. /* no writeback */
  1409. break;
  1410. default:
  1411. break;
  1412. }
  1413. return X86EMUL_CONTINUE;
  1414. }
  1415. static int push(struct x86_emulate_ctxt *ctxt, void *data, int bytes)
  1416. {
  1417. struct segmented_address addr;
  1418. rsp_increment(ctxt, -bytes);
  1419. addr.ea = reg_read(ctxt, VCPU_REGS_RSP) & stack_mask(ctxt);
  1420. addr.seg = VCPU_SREG_SS;
  1421. return segmented_write(ctxt, addr, data, bytes);
  1422. }
  1423. static int em_push(struct x86_emulate_ctxt *ctxt)
  1424. {
  1425. /* Disable writeback. */
  1426. ctxt->dst.type = OP_NONE;
  1427. return push(ctxt, &ctxt->src.val, ctxt->op_bytes);
  1428. }
  1429. static int emulate_pop(struct x86_emulate_ctxt *ctxt,
  1430. void *dest, int len)
  1431. {
  1432. int rc;
  1433. struct segmented_address addr;
  1434. addr.ea = reg_read(ctxt, VCPU_REGS_RSP) & stack_mask(ctxt);
  1435. addr.seg = VCPU_SREG_SS;
  1436. rc = segmented_read(ctxt, addr, dest, len);
  1437. if (rc != X86EMUL_CONTINUE)
  1438. return rc;
  1439. rsp_increment(ctxt, len);
  1440. return rc;
  1441. }
  1442. static int em_pop(struct x86_emulate_ctxt *ctxt)
  1443. {
  1444. return emulate_pop(ctxt, &ctxt->dst.val, ctxt->op_bytes);
  1445. }
  1446. static int emulate_popf(struct x86_emulate_ctxt *ctxt,
  1447. void *dest, int len)
  1448. {
  1449. int rc;
  1450. unsigned long val, change_mask;
  1451. int iopl = (ctxt->eflags & X86_EFLAGS_IOPL) >> IOPL_SHIFT;
  1452. int cpl = ctxt->ops->cpl(ctxt);
  1453. rc = emulate_pop(ctxt, &val, len);
  1454. if (rc != X86EMUL_CONTINUE)
  1455. return rc;
  1456. change_mask = EFLG_CF | EFLG_PF | EFLG_AF | EFLG_ZF | EFLG_SF | EFLG_OF
  1457. | EFLG_TF | EFLG_DF | EFLG_NT | EFLG_RF | EFLG_AC | EFLG_ID;
  1458. switch(ctxt->mode) {
  1459. case X86EMUL_MODE_PROT64:
  1460. case X86EMUL_MODE_PROT32:
  1461. case X86EMUL_MODE_PROT16:
  1462. if (cpl == 0)
  1463. change_mask |= EFLG_IOPL;
  1464. if (cpl <= iopl)
  1465. change_mask |= EFLG_IF;
  1466. break;
  1467. case X86EMUL_MODE_VM86:
  1468. if (iopl < 3)
  1469. return emulate_gp(ctxt, 0);
  1470. change_mask |= EFLG_IF;
  1471. break;
  1472. default: /* real mode */
  1473. change_mask |= (EFLG_IOPL | EFLG_IF);
  1474. break;
  1475. }
  1476. *(unsigned long *)dest =
  1477. (ctxt->eflags & ~change_mask) | (val & change_mask);
  1478. return rc;
  1479. }
  1480. static int em_popf(struct x86_emulate_ctxt *ctxt)
  1481. {
  1482. ctxt->dst.type = OP_REG;
  1483. ctxt->dst.addr.reg = &ctxt->eflags;
  1484. ctxt->dst.bytes = ctxt->op_bytes;
  1485. return emulate_popf(ctxt, &ctxt->dst.val, ctxt->op_bytes);
  1486. }
  1487. static int em_enter(struct x86_emulate_ctxt *ctxt)
  1488. {
  1489. int rc;
  1490. unsigned frame_size = ctxt->src.val;
  1491. unsigned nesting_level = ctxt->src2.val & 31;
  1492. ulong rbp;
  1493. if (nesting_level)
  1494. return X86EMUL_UNHANDLEABLE;
  1495. rbp = reg_read(ctxt, VCPU_REGS_RBP);
  1496. rc = push(ctxt, &rbp, stack_size(ctxt));
  1497. if (rc != X86EMUL_CONTINUE)
  1498. return rc;
  1499. assign_masked(reg_rmw(ctxt, VCPU_REGS_RBP), reg_read(ctxt, VCPU_REGS_RSP),
  1500. stack_mask(ctxt));
  1501. assign_masked(reg_rmw(ctxt, VCPU_REGS_RSP),
  1502. reg_read(ctxt, VCPU_REGS_RSP) - frame_size,
  1503. stack_mask(ctxt));
  1504. return X86EMUL_CONTINUE;
  1505. }
  1506. static int em_leave(struct x86_emulate_ctxt *ctxt)
  1507. {
  1508. assign_masked(reg_rmw(ctxt, VCPU_REGS_RSP), reg_read(ctxt, VCPU_REGS_RBP),
  1509. stack_mask(ctxt));
  1510. return emulate_pop(ctxt, reg_rmw(ctxt, VCPU_REGS_RBP), ctxt->op_bytes);
  1511. }
  1512. static int em_push_sreg(struct x86_emulate_ctxt *ctxt)
  1513. {
  1514. int seg = ctxt->src2.val;
  1515. ctxt->src.val = get_segment_selector(ctxt, seg);
  1516. return em_push(ctxt);
  1517. }
  1518. static int em_pop_sreg(struct x86_emulate_ctxt *ctxt)
  1519. {
  1520. int seg = ctxt->src2.val;
  1521. unsigned long selector;
  1522. int rc;
  1523. rc = emulate_pop(ctxt, &selector, ctxt->op_bytes);
  1524. if (rc != X86EMUL_CONTINUE)
  1525. return rc;
  1526. rc = load_segment_descriptor(ctxt, (u16)selector, seg);
  1527. return rc;
  1528. }
  1529. static int em_pusha(struct x86_emulate_ctxt *ctxt)
  1530. {
  1531. unsigned long old_esp = reg_read(ctxt, VCPU_REGS_RSP);
  1532. int rc = X86EMUL_CONTINUE;
  1533. int reg = VCPU_REGS_RAX;
  1534. while (reg <= VCPU_REGS_RDI) {
  1535. (reg == VCPU_REGS_RSP) ?
  1536. (ctxt->src.val = old_esp) : (ctxt->src.val = reg_read(ctxt, reg));
  1537. rc = em_push(ctxt);
  1538. if (rc != X86EMUL_CONTINUE)
  1539. return rc;
  1540. ++reg;
  1541. }
  1542. return rc;
  1543. }
  1544. static int em_pushf(struct x86_emulate_ctxt *ctxt)
  1545. {
  1546. ctxt->src.val = (unsigned long)ctxt->eflags;
  1547. return em_push(ctxt);
  1548. }
  1549. static int em_popa(struct x86_emulate_ctxt *ctxt)
  1550. {
  1551. int rc = X86EMUL_CONTINUE;
  1552. int reg = VCPU_REGS_RDI;
  1553. while (reg >= VCPU_REGS_RAX) {
  1554. if (reg == VCPU_REGS_RSP) {
  1555. rsp_increment(ctxt, ctxt->op_bytes);
  1556. --reg;
  1557. }
  1558. rc = emulate_pop(ctxt, reg_rmw(ctxt, reg), ctxt->op_bytes);
  1559. if (rc != X86EMUL_CONTINUE)
  1560. break;
  1561. --reg;
  1562. }
  1563. return rc;
  1564. }
  1565. static int __emulate_int_real(struct x86_emulate_ctxt *ctxt, int irq)
  1566. {
  1567. const struct x86_emulate_ops *ops = ctxt->ops;
  1568. int rc;
  1569. struct desc_ptr dt;
  1570. gva_t cs_addr;
  1571. gva_t eip_addr;
  1572. u16 cs, eip;
  1573. /* TODO: Add limit checks */
  1574. ctxt->src.val = ctxt->eflags;
  1575. rc = em_push(ctxt);
  1576. if (rc != X86EMUL_CONTINUE)
  1577. return rc;
  1578. ctxt->eflags &= ~(EFLG_IF | EFLG_TF | EFLG_AC);
  1579. ctxt->src.val = get_segment_selector(ctxt, VCPU_SREG_CS);
  1580. rc = em_push(ctxt);
  1581. if (rc != X86EMUL_CONTINUE)
  1582. return rc;
  1583. ctxt->src.val = ctxt->_eip;
  1584. rc = em_push(ctxt);
  1585. if (rc != X86EMUL_CONTINUE)
  1586. return rc;
  1587. ops->get_idt(ctxt, &dt);
  1588. eip_addr = dt.address + (irq << 2);
  1589. cs_addr = dt.address + (irq << 2) + 2;
  1590. rc = ops->read_std(ctxt, cs_addr, &cs, 2, &ctxt->exception);
  1591. if (rc != X86EMUL_CONTINUE)
  1592. return rc;
  1593. rc = ops->read_std(ctxt, eip_addr, &eip, 2, &ctxt->exception);
  1594. if (rc != X86EMUL_CONTINUE)
  1595. return rc;
  1596. rc = load_segment_descriptor(ctxt, cs, VCPU_SREG_CS);
  1597. if (rc != X86EMUL_CONTINUE)
  1598. return rc;
  1599. ctxt->_eip = eip;
  1600. return rc;
  1601. }
  1602. int emulate_int_real(struct x86_emulate_ctxt *ctxt, int irq)
  1603. {
  1604. int rc;
  1605. invalidate_registers(ctxt);
  1606. rc = __emulate_int_real(ctxt, irq);
  1607. if (rc == X86EMUL_CONTINUE)
  1608. writeback_registers(ctxt);
  1609. return rc;
  1610. }
  1611. static int emulate_int(struct x86_emulate_ctxt *ctxt, int irq)
  1612. {
  1613. switch(ctxt->mode) {
  1614. case X86EMUL_MODE_REAL:
  1615. return __emulate_int_real(ctxt, irq);
  1616. case X86EMUL_MODE_VM86:
  1617. case X86EMUL_MODE_PROT16:
  1618. case X86EMUL_MODE_PROT32:
  1619. case X86EMUL_MODE_PROT64:
  1620. default:
  1621. /* Protected mode interrupts unimplemented yet */
  1622. return X86EMUL_UNHANDLEABLE;
  1623. }
  1624. }
  1625. static int emulate_iret_real(struct x86_emulate_ctxt *ctxt)
  1626. {
  1627. int rc = X86EMUL_CONTINUE;
  1628. unsigned long temp_eip = 0;
  1629. unsigned long temp_eflags = 0;
  1630. unsigned long cs = 0;
  1631. unsigned long mask = EFLG_CF | EFLG_PF | EFLG_AF | EFLG_ZF | EFLG_SF | EFLG_TF |
  1632. EFLG_IF | EFLG_DF | EFLG_OF | EFLG_IOPL | EFLG_NT | EFLG_RF |
  1633. EFLG_AC | EFLG_ID | (1 << 1); /* Last one is the reserved bit */
  1634. unsigned long vm86_mask = EFLG_VM | EFLG_VIF | EFLG_VIP;
  1635. /* TODO: Add stack limit check */
  1636. rc = emulate_pop(ctxt, &temp_eip, ctxt->op_bytes);
  1637. if (rc != X86EMUL_CONTINUE)
  1638. return rc;
  1639. if (temp_eip & ~0xffff)
  1640. return emulate_gp(ctxt, 0);
  1641. rc = emulate_pop(ctxt, &cs, ctxt->op_bytes);
  1642. if (rc != X86EMUL_CONTINUE)
  1643. return rc;
  1644. rc = emulate_pop(ctxt, &temp_eflags, ctxt->op_bytes);
  1645. if (rc != X86EMUL_CONTINUE)
  1646. return rc;
  1647. rc = load_segment_descriptor(ctxt, (u16)cs, VCPU_SREG_CS);
  1648. if (rc != X86EMUL_CONTINUE)
  1649. return rc;
  1650. ctxt->_eip = temp_eip;
  1651. if (ctxt->op_bytes == 4)
  1652. ctxt->eflags = ((temp_eflags & mask) | (ctxt->eflags & vm86_mask));
  1653. else if (ctxt->op_bytes == 2) {
  1654. ctxt->eflags &= ~0xffff;
  1655. ctxt->eflags |= temp_eflags;
  1656. }
  1657. ctxt->eflags &= ~EFLG_RESERVED_ZEROS_MASK; /* Clear reserved zeros */
  1658. ctxt->eflags |= EFLG_RESERVED_ONE_MASK;
  1659. return rc;
  1660. }
  1661. static int em_iret(struct x86_emulate_ctxt *ctxt)
  1662. {
  1663. switch(ctxt->mode) {
  1664. case X86EMUL_MODE_REAL:
  1665. return emulate_iret_real(ctxt);
  1666. case X86EMUL_MODE_VM86:
  1667. case X86EMUL_MODE_PROT16:
  1668. case X86EMUL_MODE_PROT32:
  1669. case X86EMUL_MODE_PROT64:
  1670. default:
  1671. /* iret from protected mode unimplemented yet */
  1672. return X86EMUL_UNHANDLEABLE;
  1673. }
  1674. }
  1675. static int em_jmp_far(struct x86_emulate_ctxt *ctxt)
  1676. {
  1677. int rc;
  1678. unsigned short sel;
  1679. memcpy(&sel, ctxt->src.valptr + ctxt->op_bytes, 2);
  1680. rc = load_segment_descriptor(ctxt, sel, VCPU_SREG_CS);
  1681. if (rc != X86EMUL_CONTINUE)
  1682. return rc;
  1683. ctxt->_eip = 0;
  1684. memcpy(&ctxt->_eip, ctxt->src.valptr, ctxt->op_bytes);
  1685. return X86EMUL_CONTINUE;
  1686. }
  1687. static int em_grp2(struct x86_emulate_ctxt *ctxt)
  1688. {
  1689. switch (ctxt->modrm_reg) {
  1690. case 0: /* rol */
  1691. emulate_2op_SrcB(ctxt, "rol");
  1692. break;
  1693. case 1: /* ror */
  1694. emulate_2op_SrcB(ctxt, "ror");
  1695. break;
  1696. case 2: /* rcl */
  1697. emulate_2op_SrcB(ctxt, "rcl");
  1698. break;
  1699. case 3: /* rcr */
  1700. emulate_2op_SrcB(ctxt, "rcr");
  1701. break;
  1702. case 4: /* sal/shl */
  1703. case 6: /* sal/shl */
  1704. emulate_2op_SrcB(ctxt, "sal");
  1705. break;
  1706. case 5: /* shr */
  1707. emulate_2op_SrcB(ctxt, "shr");
  1708. break;
  1709. case 7: /* sar */
  1710. emulate_2op_SrcB(ctxt, "sar");
  1711. break;
  1712. }
  1713. return X86EMUL_CONTINUE;
  1714. }
  1715. static int em_not(struct x86_emulate_ctxt *ctxt)
  1716. {
  1717. ctxt->dst.val = ~ctxt->dst.val;
  1718. return X86EMUL_CONTINUE;
  1719. }
  1720. static int em_neg(struct x86_emulate_ctxt *ctxt)
  1721. {
  1722. emulate_1op(ctxt, "neg");
  1723. return X86EMUL_CONTINUE;
  1724. }
  1725. static int em_mul_ex(struct x86_emulate_ctxt *ctxt)
  1726. {
  1727. u8 ex = 0;
  1728. emulate_1op_rax_rdx(ctxt, "mul", ex);
  1729. return X86EMUL_CONTINUE;
  1730. }
  1731. static int em_imul_ex(struct x86_emulate_ctxt *ctxt)
  1732. {
  1733. u8 ex = 0;
  1734. emulate_1op_rax_rdx(ctxt, "imul", ex);
  1735. return X86EMUL_CONTINUE;
  1736. }
  1737. static int em_div_ex(struct x86_emulate_ctxt *ctxt)
  1738. {
  1739. u8 de = 0;
  1740. emulate_1op_rax_rdx(ctxt, "div", de);
  1741. if (de)
  1742. return emulate_de(ctxt);
  1743. return X86EMUL_CONTINUE;
  1744. }
  1745. static int em_idiv_ex(struct x86_emulate_ctxt *ctxt)
  1746. {
  1747. u8 de = 0;
  1748. emulate_1op_rax_rdx(ctxt, "idiv", de);
  1749. if (de)
  1750. return emulate_de(ctxt);
  1751. return X86EMUL_CONTINUE;
  1752. }
  1753. static int em_grp45(struct x86_emulate_ctxt *ctxt)
  1754. {
  1755. int rc = X86EMUL_CONTINUE;
  1756. switch (ctxt->modrm_reg) {
  1757. case 0: /* inc */
  1758. emulate_1op(ctxt, "inc");
  1759. break;
  1760. case 1: /* dec */
  1761. emulate_1op(ctxt, "dec");
  1762. break;
  1763. case 2: /* call near abs */ {
  1764. long int old_eip;
  1765. old_eip = ctxt->_eip;
  1766. ctxt->_eip = ctxt->src.val;
  1767. ctxt->src.val = old_eip;
  1768. rc = em_push(ctxt);
  1769. break;
  1770. }
  1771. case 4: /* jmp abs */
  1772. ctxt->_eip = ctxt->src.val;
  1773. break;
  1774. case 5: /* jmp far */
  1775. rc = em_jmp_far(ctxt);
  1776. break;
  1777. case 6: /* push */
  1778. rc = em_push(ctxt);
  1779. break;
  1780. }
  1781. return rc;
  1782. }
  1783. static int em_cmpxchg8b(struct x86_emulate_ctxt *ctxt)
  1784. {
  1785. u64 old = ctxt->dst.orig_val64;
  1786. if (((u32) (old >> 0) != (u32) reg_read(ctxt, VCPU_REGS_RAX)) ||
  1787. ((u32) (old >> 32) != (u32) reg_read(ctxt, VCPU_REGS_RDX))) {
  1788. *reg_write(ctxt, VCPU_REGS_RAX) = (u32) (old >> 0);
  1789. *reg_write(ctxt, VCPU_REGS_RDX) = (u32) (old >> 32);
  1790. ctxt->eflags &= ~EFLG_ZF;
  1791. } else {
  1792. ctxt->dst.val64 = ((u64)reg_read(ctxt, VCPU_REGS_RCX) << 32) |
  1793. (u32) reg_read(ctxt, VCPU_REGS_RBX);
  1794. ctxt->eflags |= EFLG_ZF;
  1795. }
  1796. return X86EMUL_CONTINUE;
  1797. }
  1798. static int em_ret(struct x86_emulate_ctxt *ctxt)
  1799. {
  1800. ctxt->dst.type = OP_REG;
  1801. ctxt->dst.addr.reg = &ctxt->_eip;
  1802. ctxt->dst.bytes = ctxt->op_bytes;
  1803. return em_pop(ctxt);
  1804. }
  1805. static int em_ret_far(struct x86_emulate_ctxt *ctxt)
  1806. {
  1807. int rc;
  1808. unsigned long cs;
  1809. rc = emulate_pop(ctxt, &ctxt->_eip, ctxt->op_bytes);
  1810. if (rc != X86EMUL_CONTINUE)
  1811. return rc;
  1812. if (ctxt->op_bytes == 4)
  1813. ctxt->_eip = (u32)ctxt->_eip;
  1814. rc = emulate_pop(ctxt, &cs, ctxt->op_bytes);
  1815. if (rc != X86EMUL_CONTINUE)
  1816. return rc;
  1817. rc = load_segment_descriptor(ctxt, (u16)cs, VCPU_SREG_CS);
  1818. return rc;
  1819. }
  1820. static int em_cmpxchg(struct x86_emulate_ctxt *ctxt)
  1821. {
  1822. /* Save real source value, then compare EAX against destination. */
  1823. ctxt->src.orig_val = ctxt->src.val;
  1824. ctxt->src.val = reg_read(ctxt, VCPU_REGS_RAX);
  1825. emulate_2op_SrcV(ctxt, "cmp");
  1826. if (ctxt->eflags & EFLG_ZF) {
  1827. /* Success: write back to memory. */
  1828. ctxt->dst.val = ctxt->src.orig_val;
  1829. } else {
  1830. /* Failure: write the value we saw to EAX. */
  1831. ctxt->dst.type = OP_REG;
  1832. ctxt->dst.addr.reg = reg_rmw(ctxt, VCPU_REGS_RAX);
  1833. }
  1834. return X86EMUL_CONTINUE;
  1835. }
  1836. static int em_lseg(struct x86_emulate_ctxt *ctxt)
  1837. {
  1838. int seg = ctxt->src2.val;
  1839. unsigned short sel;
  1840. int rc;
  1841. memcpy(&sel, ctxt->src.valptr + ctxt->op_bytes, 2);
  1842. rc = load_segment_descriptor(ctxt, sel, seg);
  1843. if (rc != X86EMUL_CONTINUE)
  1844. return rc;
  1845. ctxt->dst.val = ctxt->src.val;
  1846. return rc;
  1847. }
  1848. static void
  1849. setup_syscalls_segments(struct x86_emulate_ctxt *ctxt,
  1850. struct desc_struct *cs, struct desc_struct *ss)
  1851. {
  1852. cs->l = 0; /* will be adjusted later */
  1853. set_desc_base(cs, 0); /* flat segment */
  1854. cs->g = 1; /* 4kb granularity */
  1855. set_desc_limit(cs, 0xfffff); /* 4GB limit */
  1856. cs->type = 0x0b; /* Read, Execute, Accessed */
  1857. cs->s = 1;
  1858. cs->dpl = 0; /* will be adjusted later */
  1859. cs->p = 1;
  1860. cs->d = 1;
  1861. cs->avl = 0;
  1862. set_desc_base(ss, 0); /* flat segment */
  1863. set_desc_limit(ss, 0xfffff); /* 4GB limit */
  1864. ss->g = 1; /* 4kb granularity */
  1865. ss->s = 1;
  1866. ss->type = 0x03; /* Read/Write, Accessed */
  1867. ss->d = 1; /* 32bit stack segment */
  1868. ss->dpl = 0;
  1869. ss->p = 1;
  1870. ss->l = 0;
  1871. ss->avl = 0;
  1872. }
  1873. static bool vendor_intel(struct x86_emulate_ctxt *ctxt)
  1874. {
  1875. u32 eax, ebx, ecx, edx;
  1876. eax = ecx = 0;
  1877. ctxt->ops->get_cpuid(ctxt, &eax, &ebx, &ecx, &edx);
  1878. return ebx == X86EMUL_CPUID_VENDOR_GenuineIntel_ebx
  1879. && ecx == X86EMUL_CPUID_VENDOR_GenuineIntel_ecx
  1880. && edx == X86EMUL_CPUID_VENDOR_GenuineIntel_edx;
  1881. }
  1882. static bool em_syscall_is_enabled(struct x86_emulate_ctxt *ctxt)
  1883. {
  1884. const struct x86_emulate_ops *ops = ctxt->ops;
  1885. u32 eax, ebx, ecx, edx;
  1886. /*
  1887. * syscall should always be enabled in longmode - so only become
  1888. * vendor specific (cpuid) if other modes are active...
  1889. */
  1890. if (ctxt->mode == X86EMUL_MODE_PROT64)
  1891. return true;
  1892. eax = 0x00000000;
  1893. ecx = 0x00000000;
  1894. ops->get_cpuid(ctxt, &eax, &ebx, &ecx, &edx);
  1895. /*
  1896. * Intel ("GenuineIntel")
  1897. * remark: Intel CPUs only support "syscall" in 64bit
  1898. * longmode. Also an 64bit guest with a
  1899. * 32bit compat-app running will #UD !! While this
  1900. * behaviour can be fixed (by emulating) into AMD
  1901. * response - CPUs of AMD can't behave like Intel.
  1902. */
  1903. if (ebx == X86EMUL_CPUID_VENDOR_GenuineIntel_ebx &&
  1904. ecx == X86EMUL_CPUID_VENDOR_GenuineIntel_ecx &&
  1905. edx == X86EMUL_CPUID_VENDOR_GenuineIntel_edx)
  1906. return false;
  1907. /* AMD ("AuthenticAMD") */
  1908. if (ebx == X86EMUL_CPUID_VENDOR_AuthenticAMD_ebx &&
  1909. ecx == X86EMUL_CPUID_VENDOR_AuthenticAMD_ecx &&
  1910. edx == X86EMUL_CPUID_VENDOR_AuthenticAMD_edx)
  1911. return true;
  1912. /* AMD ("AMDisbetter!") */
  1913. if (ebx == X86EMUL_CPUID_VENDOR_AMDisbetterI_ebx &&
  1914. ecx == X86EMUL_CPUID_VENDOR_AMDisbetterI_ecx &&
  1915. edx == X86EMUL_CPUID_VENDOR_AMDisbetterI_edx)
  1916. return true;
  1917. /* default: (not Intel, not AMD), apply Intel's stricter rules... */
  1918. return false;
  1919. }
  1920. static int em_syscall(struct x86_emulate_ctxt *ctxt)
  1921. {
  1922. const struct x86_emulate_ops *ops = ctxt->ops;
  1923. struct desc_struct cs, ss;
  1924. u64 msr_data;
  1925. u16 cs_sel, ss_sel;
  1926. u64 efer = 0;
  1927. /* syscall is not available in real mode */
  1928. if (ctxt->mode == X86EMUL_MODE_REAL ||
  1929. ctxt->mode == X86EMUL_MODE_VM86)
  1930. return emulate_ud(ctxt);
  1931. if (!(em_syscall_is_enabled(ctxt)))
  1932. return emulate_ud(ctxt);
  1933. ops->get_msr(ctxt, MSR_EFER, &efer);
  1934. setup_syscalls_segments(ctxt, &cs, &ss);
  1935. if (!(efer & EFER_SCE))
  1936. return emulate_ud(ctxt);
  1937. ops->get_msr(ctxt, MSR_STAR, &msr_data);
  1938. msr_data >>= 32;
  1939. cs_sel = (u16)(msr_data & 0xfffc);
  1940. ss_sel = (u16)(msr_data + 8);
  1941. if (efer & EFER_LMA) {
  1942. cs.d = 0;
  1943. cs.l = 1;
  1944. }
  1945. ops->set_segment(ctxt, cs_sel, &cs, 0, VCPU_SREG_CS);
  1946. ops->set_segment(ctxt, ss_sel, &ss, 0, VCPU_SREG_SS);
  1947. *reg_write(ctxt, VCPU_REGS_RCX) = ctxt->_eip;
  1948. if (efer & EFER_LMA) {
  1949. #ifdef CONFIG_X86_64
  1950. *reg_write(ctxt, VCPU_REGS_R11) = ctxt->eflags & ~EFLG_RF;
  1951. ops->get_msr(ctxt,
  1952. ctxt->mode == X86EMUL_MODE_PROT64 ?
  1953. MSR_LSTAR : MSR_CSTAR, &msr_data);
  1954. ctxt->_eip = msr_data;
  1955. ops->get_msr(ctxt, MSR_SYSCALL_MASK, &msr_data);
  1956. ctxt->eflags &= ~(msr_data | EFLG_RF);
  1957. #endif
  1958. } else {
  1959. /* legacy mode */
  1960. ops->get_msr(ctxt, MSR_STAR, &msr_data);
  1961. ctxt->_eip = (u32)msr_data;
  1962. ctxt->eflags &= ~(EFLG_VM | EFLG_IF | EFLG_RF);
  1963. }
  1964. return X86EMUL_CONTINUE;
  1965. }
  1966. static int em_sysenter(struct x86_emulate_ctxt *ctxt)
  1967. {
  1968. const struct x86_emulate_ops *ops = ctxt->ops;
  1969. struct desc_struct cs, ss;
  1970. u64 msr_data;
  1971. u16 cs_sel, ss_sel;
  1972. u64 efer = 0;
  1973. ops->get_msr(ctxt, MSR_EFER, &efer);
  1974. /* inject #GP if in real mode */
  1975. if (ctxt->mode == X86EMUL_MODE_REAL)
  1976. return emulate_gp(ctxt, 0);
  1977. /*
  1978. * Not recognized on AMD in compat mode (but is recognized in legacy
  1979. * mode).
  1980. */
  1981. if ((ctxt->mode == X86EMUL_MODE_PROT32) && (efer & EFER_LMA)
  1982. && !vendor_intel(ctxt))
  1983. return emulate_ud(ctxt);
  1984. /* XXX sysenter/sysexit have not been tested in 64bit mode.
  1985. * Therefore, we inject an #UD.
  1986. */
  1987. if (ctxt->mode == X86EMUL_MODE_PROT64)
  1988. return emulate_ud(ctxt);
  1989. setup_syscalls_segments(ctxt, &cs, &ss);
  1990. ops->get_msr(ctxt, MSR_IA32_SYSENTER_CS, &msr_data);
  1991. switch (ctxt->mode) {
  1992. case X86EMUL_MODE_PROT32:
  1993. if ((msr_data & 0xfffc) == 0x0)
  1994. return emulate_gp(ctxt, 0);
  1995. break;
  1996. case X86EMUL_MODE_PROT64:
  1997. if (msr_data == 0x0)
  1998. return emulate_gp(ctxt, 0);
  1999. break;
  2000. default:
  2001. break;
  2002. }
  2003. ctxt->eflags &= ~(EFLG_VM | EFLG_IF | EFLG_RF);
  2004. cs_sel = (u16)msr_data;
  2005. cs_sel &= ~SELECTOR_RPL_MASK;
  2006. ss_sel = cs_sel + 8;
  2007. ss_sel &= ~SELECTOR_RPL_MASK;
  2008. if (ctxt->mode == X86EMUL_MODE_PROT64 || (efer & EFER_LMA)) {
  2009. cs.d = 0;
  2010. cs.l = 1;
  2011. }
  2012. ops->set_segment(ctxt, cs_sel, &cs, 0, VCPU_SREG_CS);
  2013. ops->set_segment(ctxt, ss_sel, &ss, 0, VCPU_SREG_SS);
  2014. ops->get_msr(ctxt, MSR_IA32_SYSENTER_EIP, &msr_data);
  2015. ctxt->_eip = msr_data;
  2016. ops->get_msr(ctxt, MSR_IA32_SYSENTER_ESP, &msr_data);
  2017. *reg_write(ctxt, VCPU_REGS_RSP) = msr_data;
  2018. return X86EMUL_CONTINUE;
  2019. }
  2020. static int em_sysexit(struct x86_emulate_ctxt *ctxt)
  2021. {
  2022. const struct x86_emulate_ops *ops = ctxt->ops;
  2023. struct desc_struct cs, ss;
  2024. u64 msr_data;
  2025. int usermode;
  2026. u16 cs_sel = 0, ss_sel = 0;
  2027. /* inject #GP if in real mode or Virtual 8086 mode */
  2028. if (ctxt->mode == X86EMUL_MODE_REAL ||
  2029. ctxt->mode == X86EMUL_MODE_VM86)
  2030. return emulate_gp(ctxt, 0);
  2031. setup_syscalls_segments(ctxt, &cs, &ss);
  2032. if ((ctxt->rex_prefix & 0x8) != 0x0)
  2033. usermode = X86EMUL_MODE_PROT64;
  2034. else
  2035. usermode = X86EMUL_MODE_PROT32;
  2036. cs.dpl = 3;
  2037. ss.dpl = 3;
  2038. ops->get_msr(ctxt, MSR_IA32_SYSENTER_CS, &msr_data);
  2039. switch (usermode) {
  2040. case X86EMUL_MODE_PROT32:
  2041. cs_sel = (u16)(msr_data + 16);
  2042. if ((msr_data & 0xfffc) == 0x0)
  2043. return emulate_gp(ctxt, 0);
  2044. ss_sel = (u16)(msr_data + 24);
  2045. break;
  2046. case X86EMUL_MODE_PROT64:
  2047. cs_sel = (u16)(msr_data + 32);
  2048. if (msr_data == 0x0)
  2049. return emulate_gp(ctxt, 0);
  2050. ss_sel = cs_sel + 8;
  2051. cs.d = 0;
  2052. cs.l = 1;
  2053. break;
  2054. }
  2055. cs_sel |= SELECTOR_RPL_MASK;
  2056. ss_sel |= SELECTOR_RPL_MASK;
  2057. ops->set_segment(ctxt, cs_sel, &cs, 0, VCPU_SREG_CS);
  2058. ops->set_segment(ctxt, ss_sel, &ss, 0, VCPU_SREG_SS);
  2059. ctxt->_eip = reg_read(ctxt, VCPU_REGS_RDX);
  2060. *reg_write(ctxt, VCPU_REGS_RSP) = reg_read(ctxt, VCPU_REGS_RCX);
  2061. return X86EMUL_CONTINUE;
  2062. }
  2063. static bool emulator_bad_iopl(struct x86_emulate_ctxt *ctxt)
  2064. {
  2065. int iopl;
  2066. if (ctxt->mode == X86EMUL_MODE_REAL)
  2067. return false;
  2068. if (ctxt->mode == X86EMUL_MODE_VM86)
  2069. return true;
  2070. iopl = (ctxt->eflags & X86_EFLAGS_IOPL) >> IOPL_SHIFT;
  2071. return ctxt->ops->cpl(ctxt) > iopl;
  2072. }
  2073. static bool emulator_io_port_access_allowed(struct x86_emulate_ctxt *ctxt,
  2074. u16 port, u16 len)
  2075. {
  2076. const struct x86_emulate_ops *ops = ctxt->ops;
  2077. struct desc_struct tr_seg;
  2078. u32 base3;
  2079. int r;
  2080. u16 tr, io_bitmap_ptr, perm, bit_idx = port & 0x7;
  2081. unsigned mask = (1 << len) - 1;
  2082. unsigned long base;
  2083. ops->get_segment(ctxt, &tr, &tr_seg, &base3, VCPU_SREG_TR);
  2084. if (!tr_seg.p)
  2085. return false;
  2086. if (desc_limit_scaled(&tr_seg) < 103)
  2087. return false;
  2088. base = get_desc_base(&tr_seg);
  2089. #ifdef CONFIG_X86_64
  2090. base |= ((u64)base3) << 32;
  2091. #endif
  2092. r = ops->read_std(ctxt, base + 102, &io_bitmap_ptr, 2, NULL);
  2093. if (r != X86EMUL_CONTINUE)
  2094. return false;
  2095. if (io_bitmap_ptr + port/8 > desc_limit_scaled(&tr_seg))
  2096. return false;
  2097. r = ops->read_std(ctxt, base + io_bitmap_ptr + port/8, &perm, 2, NULL);
  2098. if (r != X86EMUL_CONTINUE)
  2099. return false;
  2100. if ((perm >> bit_idx) & mask)
  2101. return false;
  2102. return true;
  2103. }
  2104. static bool emulator_io_permited(struct x86_emulate_ctxt *ctxt,
  2105. u16 port, u16 len)
  2106. {
  2107. if (ctxt->perm_ok)
  2108. return true;
  2109. if (emulator_bad_iopl(ctxt))
  2110. if (!emulator_io_port_access_allowed(ctxt, port, len))
  2111. return false;
  2112. ctxt->perm_ok = true;
  2113. return true;
  2114. }
  2115. static void save_state_to_tss16(struct x86_emulate_ctxt *ctxt,
  2116. struct tss_segment_16 *tss)
  2117. {
  2118. tss->ip = ctxt->_eip;
  2119. tss->flag = ctxt->eflags;
  2120. tss->ax = reg_read(ctxt, VCPU_REGS_RAX);
  2121. tss->cx = reg_read(ctxt, VCPU_REGS_RCX);
  2122. tss->dx = reg_read(ctxt, VCPU_REGS_RDX);
  2123. tss->bx = reg_read(ctxt, VCPU_REGS_RBX);
  2124. tss->sp = reg_read(ctxt, VCPU_REGS_RSP);
  2125. tss->bp = reg_read(ctxt, VCPU_REGS_RBP);
  2126. tss->si = reg_read(ctxt, VCPU_REGS_RSI);
  2127. tss->di = reg_read(ctxt, VCPU_REGS_RDI);
  2128. tss->es = get_segment_selector(ctxt, VCPU_SREG_ES);
  2129. tss->cs = get_segment_selector(ctxt, VCPU_SREG_CS);
  2130. tss->ss = get_segment_selector(ctxt, VCPU_SREG_SS);
  2131. tss->ds = get_segment_selector(ctxt, VCPU_SREG_DS);
  2132. tss->ldt = get_segment_selector(ctxt, VCPU_SREG_LDTR);
  2133. }
  2134. static int load_state_from_tss16(struct x86_emulate_ctxt *ctxt,
  2135. struct tss_segment_16 *tss)
  2136. {
  2137. int ret;
  2138. ctxt->_eip = tss->ip;
  2139. ctxt->eflags = tss->flag | 2;
  2140. *reg_write(ctxt, VCPU_REGS_RAX) = tss->ax;
  2141. *reg_write(ctxt, VCPU_REGS_RCX) = tss->cx;
  2142. *reg_write(ctxt, VCPU_REGS_RDX) = tss->dx;
  2143. *reg_write(ctxt, VCPU_REGS_RBX) = tss->bx;
  2144. *reg_write(ctxt, VCPU_REGS_RSP) = tss->sp;
  2145. *reg_write(ctxt, VCPU_REGS_RBP) = tss->bp;
  2146. *reg_write(ctxt, VCPU_REGS_RSI) = tss->si;
  2147. *reg_write(ctxt, VCPU_REGS_RDI) = tss->di;
  2148. /*
  2149. * SDM says that segment selectors are loaded before segment
  2150. * descriptors
  2151. */
  2152. set_segment_selector(ctxt, tss->ldt, VCPU_SREG_LDTR);
  2153. set_segment_selector(ctxt, tss->es, VCPU_SREG_ES);
  2154. set_segment_selector(ctxt, tss->cs, VCPU_SREG_CS);
  2155. set_segment_selector(ctxt, tss->ss, VCPU_SREG_SS);
  2156. set_segment_selector(ctxt, tss->ds, VCPU_SREG_DS);
  2157. /*
  2158. * Now load segment descriptors. If fault happens at this stage
  2159. * it is handled in a context of new task
  2160. */
  2161. ret = load_segment_descriptor(ctxt, tss->ldt, VCPU_SREG_LDTR);
  2162. if (ret != X86EMUL_CONTINUE)
  2163. return ret;
  2164. ret = load_segment_descriptor(ctxt, tss->es, VCPU_SREG_ES);
  2165. if (ret != X86EMUL_CONTINUE)
  2166. return ret;
  2167. ret = load_segment_descriptor(ctxt, tss->cs, VCPU_SREG_CS);
  2168. if (ret != X86EMUL_CONTINUE)
  2169. return ret;
  2170. ret = load_segment_descriptor(ctxt, tss->ss, VCPU_SREG_SS);
  2171. if (ret != X86EMUL_CONTINUE)
  2172. return ret;
  2173. ret = load_segment_descriptor(ctxt, tss->ds, VCPU_SREG_DS);
  2174. if (ret != X86EMUL_CONTINUE)
  2175. return ret;
  2176. return X86EMUL_CONTINUE;
  2177. }
  2178. static int task_switch_16(struct x86_emulate_ctxt *ctxt,
  2179. u16 tss_selector, u16 old_tss_sel,
  2180. ulong old_tss_base, struct desc_struct *new_desc)
  2181. {
  2182. const struct x86_emulate_ops *ops = ctxt->ops;
  2183. struct tss_segment_16 tss_seg;
  2184. int ret;
  2185. u32 new_tss_base = get_desc_base(new_desc);
  2186. ret = ops->read_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
  2187. &ctxt->exception);
  2188. if (ret != X86EMUL_CONTINUE)
  2189. /* FIXME: need to provide precise fault address */
  2190. return ret;
  2191. save_state_to_tss16(ctxt, &tss_seg);
  2192. ret = ops->write_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
  2193. &ctxt->exception);
  2194. if (ret != X86EMUL_CONTINUE)
  2195. /* FIXME: need to provide precise fault address */
  2196. return ret;
  2197. ret = ops->read_std(ctxt, new_tss_base, &tss_seg, sizeof tss_seg,
  2198. &ctxt->exception);
  2199. if (ret != X86EMUL_CONTINUE)
  2200. /* FIXME: need to provide precise fault address */
  2201. return ret;
  2202. if (old_tss_sel != 0xffff) {
  2203. tss_seg.prev_task_link = old_tss_sel;
  2204. ret = ops->write_std(ctxt, new_tss_base,
  2205. &tss_seg.prev_task_link,
  2206. sizeof tss_seg.prev_task_link,
  2207. &ctxt->exception);
  2208. if (ret != X86EMUL_CONTINUE)
  2209. /* FIXME: need to provide precise fault address */
  2210. return ret;
  2211. }
  2212. return load_state_from_tss16(ctxt, &tss_seg);
  2213. }
  2214. static void save_state_to_tss32(struct x86_emulate_ctxt *ctxt,
  2215. struct tss_segment_32 *tss)
  2216. {
  2217. tss->cr3 = ctxt->ops->get_cr(ctxt, 3);
  2218. tss->eip = ctxt->_eip;
  2219. tss->eflags = ctxt->eflags;
  2220. tss->eax = reg_read(ctxt, VCPU_REGS_RAX);
  2221. tss->ecx = reg_read(ctxt, VCPU_REGS_RCX);
  2222. tss->edx = reg_read(ctxt, VCPU_REGS_RDX);
  2223. tss->ebx = reg_read(ctxt, VCPU_REGS_RBX);
  2224. tss->esp = reg_read(ctxt, VCPU_REGS_RSP);
  2225. tss->ebp = reg_read(ctxt, VCPU_REGS_RBP);
  2226. tss->esi = reg_read(ctxt, VCPU_REGS_RSI);
  2227. tss->edi = reg_read(ctxt, VCPU_REGS_RDI);
  2228. tss->es = get_segment_selector(ctxt, VCPU_SREG_ES);
  2229. tss->cs = get_segment_selector(ctxt, VCPU_SREG_CS);
  2230. tss->ss = get_segment_selector(ctxt, VCPU_SREG_SS);
  2231. tss->ds = get_segment_selector(ctxt, VCPU_SREG_DS);
  2232. tss->fs = get_segment_selector(ctxt, VCPU_SREG_FS);
  2233. tss->gs = get_segment_selector(ctxt, VCPU_SREG_GS);
  2234. tss->ldt_selector = get_segment_selector(ctxt, VCPU_SREG_LDTR);
  2235. }
  2236. static int load_state_from_tss32(struct x86_emulate_ctxt *ctxt,
  2237. struct tss_segment_32 *tss)
  2238. {
  2239. int ret;
  2240. if (ctxt->ops->set_cr(ctxt, 3, tss->cr3))
  2241. return emulate_gp(ctxt, 0);
  2242. ctxt->_eip = tss->eip;
  2243. ctxt->eflags = tss->eflags | 2;
  2244. /* General purpose registers */
  2245. *reg_write(ctxt, VCPU_REGS_RAX) = tss->eax;
  2246. *reg_write(ctxt, VCPU_REGS_RCX) = tss->ecx;
  2247. *reg_write(ctxt, VCPU_REGS_RDX) = tss->edx;
  2248. *reg_write(ctxt, VCPU_REGS_RBX) = tss->ebx;
  2249. *reg_write(ctxt, VCPU_REGS_RSP) = tss->esp;
  2250. *reg_write(ctxt, VCPU_REGS_RBP) = tss->ebp;
  2251. *reg_write(ctxt, VCPU_REGS_RSI) = tss->esi;
  2252. *reg_write(ctxt, VCPU_REGS_RDI) = tss->edi;
  2253. /*
  2254. * SDM says that segment selectors are loaded before segment
  2255. * descriptors
  2256. */
  2257. set_segment_selector(ctxt, tss->ldt_selector, VCPU_SREG_LDTR);
  2258. set_segment_selector(ctxt, tss->es, VCPU_SREG_ES);
  2259. set_segment_selector(ctxt, tss->cs, VCPU_SREG_CS);
  2260. set_segment_selector(ctxt, tss->ss, VCPU_SREG_SS);
  2261. set_segment_selector(ctxt, tss->ds, VCPU_SREG_DS);
  2262. set_segment_selector(ctxt, tss->fs, VCPU_SREG_FS);
  2263. set_segment_selector(ctxt, tss->gs, VCPU_SREG_GS);
  2264. /*
  2265. * If we're switching between Protected Mode and VM86, we need to make
  2266. * sure to update the mode before loading the segment descriptors so
  2267. * that the selectors are interpreted correctly.
  2268. *
  2269. * Need to get rflags to the vcpu struct immediately because it
  2270. * influences the CPL which is checked at least when loading the segment
  2271. * descriptors and when pushing an error code to the new kernel stack.
  2272. *
  2273. * TODO Introduce a separate ctxt->ops->set_cpl callback
  2274. */
  2275. if (ctxt->eflags & X86_EFLAGS_VM)
  2276. ctxt->mode = X86EMUL_MODE_VM86;
  2277. else
  2278. ctxt->mode = X86EMUL_MODE_PROT32;
  2279. ctxt->ops->set_rflags(ctxt, ctxt->eflags);
  2280. /*
  2281. * Now load segment descriptors. If fault happenes at this stage
  2282. * it is handled in a context of new task
  2283. */
  2284. ret = load_segment_descriptor(ctxt, tss->ldt_selector, VCPU_SREG_LDTR);
  2285. if (ret != X86EMUL_CONTINUE)
  2286. return ret;
  2287. ret = load_segment_descriptor(ctxt, tss->es, VCPU_SREG_ES);
  2288. if (ret != X86EMUL_CONTINUE)
  2289. return ret;
  2290. ret = load_segment_descriptor(ctxt, tss->cs, VCPU_SREG_CS);
  2291. if (ret != X86EMUL_CONTINUE)
  2292. return ret;
  2293. ret = load_segment_descriptor(ctxt, tss->ss, VCPU_SREG_SS);
  2294. if (ret != X86EMUL_CONTINUE)
  2295. return ret;
  2296. ret = load_segment_descriptor(ctxt, tss->ds, VCPU_SREG_DS);
  2297. if (ret != X86EMUL_CONTINUE)
  2298. return ret;
  2299. ret = load_segment_descriptor(ctxt, tss->fs, VCPU_SREG_FS);
  2300. if (ret != X86EMUL_CONTINUE)
  2301. return ret;
  2302. ret = load_segment_descriptor(ctxt, tss->gs, VCPU_SREG_GS);
  2303. if (ret != X86EMUL_CONTINUE)
  2304. return ret;
  2305. return X86EMUL_CONTINUE;
  2306. }
  2307. static int task_switch_32(struct x86_emulate_ctxt *ctxt,
  2308. u16 tss_selector, u16 old_tss_sel,
  2309. ulong old_tss_base, struct desc_struct *new_desc)
  2310. {
  2311. const struct x86_emulate_ops *ops = ctxt->ops;
  2312. struct tss_segment_32 tss_seg;
  2313. int ret;
  2314. u32 new_tss_base = get_desc_base(new_desc);
  2315. ret = ops->read_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
  2316. &ctxt->exception);
  2317. if (ret != X86EMUL_CONTINUE)
  2318. /* FIXME: need to provide precise fault address */
  2319. return ret;
  2320. save_state_to_tss32(ctxt, &tss_seg);
  2321. ret = ops->write_std(ctxt, old_tss_base, &tss_seg, sizeof tss_seg,
  2322. &ctxt->exception);
  2323. if (ret != X86EMUL_CONTINUE)
  2324. /* FIXME: need to provide precise fault address */
  2325. return ret;
  2326. ret = ops->read_std(ctxt, new_tss_base, &tss_seg, sizeof tss_seg,
  2327. &ctxt->exception);
  2328. if (ret != X86EMUL_CONTINUE)
  2329. /* FIXME: need to provide precise fault address */
  2330. return ret;
  2331. if (old_tss_sel != 0xffff) {
  2332. tss_seg.prev_task_link = old_tss_sel;
  2333. ret = ops->write_std(ctxt, new_tss_base,
  2334. &tss_seg.prev_task_link,
  2335. sizeof tss_seg.prev_task_link,
  2336. &ctxt->exception);
  2337. if (ret != X86EMUL_CONTINUE)
  2338. /* FIXME: need to provide precise fault address */
  2339. return ret;
  2340. }
  2341. return load_state_from_tss32(ctxt, &tss_seg);
  2342. }
  2343. static int emulator_do_task_switch(struct x86_emulate_ctxt *ctxt,
  2344. u16 tss_selector, int idt_index, int reason,
  2345. bool has_error_code, u32 error_code)
  2346. {
  2347. const struct x86_emulate_ops *ops = ctxt->ops;
  2348. struct desc_struct curr_tss_desc, next_tss_desc;
  2349. int ret;
  2350. u16 old_tss_sel = get_segment_selector(ctxt, VCPU_SREG_TR);
  2351. ulong old_tss_base =
  2352. ops->get_cached_segment_base(ctxt, VCPU_SREG_TR);
  2353. u32 desc_limit;
  2354. ulong desc_addr;
  2355. /* FIXME: old_tss_base == ~0 ? */
  2356. ret = read_segment_descriptor(ctxt, tss_selector, &next_tss_desc, &desc_addr);
  2357. if (ret != X86EMUL_CONTINUE)
  2358. return ret;
  2359. ret = read_segment_descriptor(ctxt, old_tss_sel, &curr_tss_desc, &desc_addr);
  2360. if (ret != X86EMUL_CONTINUE)
  2361. return ret;
  2362. /* FIXME: check that next_tss_desc is tss */
  2363. /*
  2364. * Check privileges. The three cases are task switch caused by...
  2365. *
  2366. * 1. jmp/call/int to task gate: Check against DPL of the task gate
  2367. * 2. Exception/IRQ/iret: No check is performed
  2368. * 3. jmp/call to TSS: Check against DPL of the TSS
  2369. */
  2370. if (reason == TASK_SWITCH_GATE) {
  2371. if (idt_index != -1) {
  2372. /* Software interrupts */
  2373. struct desc_struct task_gate_desc;
  2374. int dpl;
  2375. ret = read_interrupt_descriptor(ctxt, idt_index,
  2376. &task_gate_desc);
  2377. if (ret != X86EMUL_CONTINUE)
  2378. return ret;
  2379. dpl = task_gate_desc.dpl;
  2380. if ((tss_selector & 3) > dpl || ops->cpl(ctxt) > dpl)
  2381. return emulate_gp(ctxt, (idt_index << 3) | 0x2);
  2382. }
  2383. } else if (reason != TASK_SWITCH_IRET) {
  2384. int dpl = next_tss_desc.dpl;
  2385. if ((tss_selector & 3) > dpl || ops->cpl(ctxt) > dpl)
  2386. return emulate_gp(ctxt, tss_selector);
  2387. }
  2388. desc_limit = desc_limit_scaled(&next_tss_desc);
  2389. if (!next_tss_desc.p ||
  2390. ((desc_limit < 0x67 && (next_tss_desc.type & 8)) ||
  2391. desc_limit < 0x2b)) {
  2392. emulate_ts(ctxt, tss_selector & 0xfffc);
  2393. return X86EMUL_PROPAGATE_FAULT;
  2394. }
  2395. if (reason == TASK_SWITCH_IRET || reason == TASK_SWITCH_JMP) {
  2396. curr_tss_desc.type &= ~(1 << 1); /* clear busy flag */
  2397. write_segment_descriptor(ctxt, old_tss_sel, &curr_tss_desc);
  2398. }
  2399. if (reason == TASK_SWITCH_IRET)
  2400. ctxt->eflags = ctxt->eflags & ~X86_EFLAGS_NT;
  2401. /* set back link to prev task only if NT bit is set in eflags
  2402. note that old_tss_sel is not used after this point */
  2403. if (reason != TASK_SWITCH_CALL && reason != TASK_SWITCH_GATE)
  2404. old_tss_sel = 0xffff;
  2405. if (next_tss_desc.type & 8)
  2406. ret = task_switch_32(ctxt, tss_selector, old_tss_sel,
  2407. old_tss_base, &next_tss_desc);
  2408. else
  2409. ret = task_switch_16(ctxt, tss_selector, old_tss_sel,
  2410. old_tss_base, &next_tss_desc);
  2411. if (ret != X86EMUL_CONTINUE)
  2412. return ret;
  2413. if (reason == TASK_SWITCH_CALL || reason == TASK_SWITCH_GATE)
  2414. ctxt->eflags = ctxt->eflags | X86_EFLAGS_NT;
  2415. if (reason != TASK_SWITCH_IRET) {
  2416. next_tss_desc.type |= (1 << 1); /* set busy flag */
  2417. write_segment_descriptor(ctxt, tss_selector, &next_tss_desc);
  2418. }
  2419. ops->set_cr(ctxt, 0, ops->get_cr(ctxt, 0) | X86_CR0_TS);
  2420. ops->set_segment(ctxt, tss_selector, &next_tss_desc, 0, VCPU_SREG_TR);
  2421. if (has_error_code) {
  2422. ctxt->op_bytes = ctxt->ad_bytes = (next_tss_desc.type & 8) ? 4 : 2;
  2423. ctxt->lock_prefix = 0;
  2424. ctxt->src.val = (unsigned long) error_code;
  2425. ret = em_push(ctxt);
  2426. }
  2427. return ret;
  2428. }
  2429. int emulator_task_switch(struct x86_emulate_ctxt *ctxt,
  2430. u16 tss_selector, int idt_index, int reason,
  2431. bool has_error_code, u32 error_code)
  2432. {
  2433. int rc;
  2434. invalidate_registers(ctxt);
  2435. ctxt->_eip = ctxt->eip;
  2436. ctxt->dst.type = OP_NONE;
  2437. rc = emulator_do_task_switch(ctxt, tss_selector, idt_index, reason,
  2438. has_error_code, error_code);
  2439. if (rc == X86EMUL_CONTINUE) {
  2440. ctxt->eip = ctxt->_eip;
  2441. writeback_registers(ctxt);
  2442. }
  2443. return (rc == X86EMUL_UNHANDLEABLE) ? EMULATION_FAILED : EMULATION_OK;
  2444. }
  2445. static void string_addr_inc(struct x86_emulate_ctxt *ctxt, int reg,
  2446. struct operand *op)
  2447. {
  2448. int df = (ctxt->eflags & EFLG_DF) ? -op->count : op->count;
  2449. register_address_increment(ctxt, reg_rmw(ctxt, reg), df * op->bytes);
  2450. op->addr.mem.ea = register_address(ctxt, reg_read(ctxt, reg));
  2451. }
  2452. static int em_das(struct x86_emulate_ctxt *ctxt)
  2453. {
  2454. u8 al, old_al;
  2455. bool af, cf, old_cf;
  2456. cf = ctxt->eflags & X86_EFLAGS_CF;
  2457. al = ctxt->dst.val;
  2458. old_al = al;
  2459. old_cf = cf;
  2460. cf = false;
  2461. af = ctxt->eflags & X86_EFLAGS_AF;
  2462. if ((al & 0x0f) > 9 || af) {
  2463. al -= 6;
  2464. cf = old_cf | (al >= 250);
  2465. af = true;
  2466. } else {
  2467. af = false;
  2468. }
  2469. if (old_al > 0x99 || old_cf) {
  2470. al -= 0x60;
  2471. cf = true;
  2472. }
  2473. ctxt->dst.val = al;
  2474. /* Set PF, ZF, SF */
  2475. ctxt->src.type = OP_IMM;
  2476. ctxt->src.val = 0;
  2477. ctxt->src.bytes = 1;
  2478. emulate_2op_SrcV(ctxt, "or");
  2479. ctxt->eflags &= ~(X86_EFLAGS_AF | X86_EFLAGS_CF);
  2480. if (cf)
  2481. ctxt->eflags |= X86_EFLAGS_CF;
  2482. if (af)
  2483. ctxt->eflags |= X86_EFLAGS_AF;
  2484. return X86EMUL_CONTINUE;
  2485. }
  2486. static int em_aad(struct x86_emulate_ctxt *ctxt)
  2487. {
  2488. u8 al = ctxt->dst.val & 0xff;
  2489. u8 ah = (ctxt->dst.val >> 8) & 0xff;
  2490. al = (al + (ah * ctxt->src.val)) & 0xff;
  2491. ctxt->dst.val = (ctxt->dst.val & 0xffff0000) | al;
  2492. ctxt->eflags &= ~(X86_EFLAGS_PF | X86_EFLAGS_SF | X86_EFLAGS_ZF);
  2493. if (!al)
  2494. ctxt->eflags |= X86_EFLAGS_ZF;
  2495. if (!(al & 1))
  2496. ctxt->eflags |= X86_EFLAGS_PF;
  2497. if (al & 0x80)
  2498. ctxt->eflags |= X86_EFLAGS_SF;
  2499. return X86EMUL_CONTINUE;
  2500. }
  2501. static int em_call(struct x86_emulate_ctxt *ctxt)
  2502. {
  2503. long rel = ctxt->src.val;
  2504. ctxt->src.val = (unsigned long)ctxt->_eip;
  2505. jmp_rel(ctxt, rel);
  2506. return em_push(ctxt);
  2507. }
  2508. static int em_call_far(struct x86_emulate_ctxt *ctxt)
  2509. {
  2510. u16 sel, old_cs;
  2511. ulong old_eip;
  2512. int rc;
  2513. old_cs = get_segment_selector(ctxt, VCPU_SREG_CS);
  2514. old_eip = ctxt->_eip;
  2515. memcpy(&sel, ctxt->src.valptr + ctxt->op_bytes, 2);
  2516. if (load_segment_descriptor(ctxt, sel, VCPU_SREG_CS))
  2517. return X86EMUL_CONTINUE;
  2518. ctxt->_eip = 0;
  2519. memcpy(&ctxt->_eip, ctxt->src.valptr, ctxt->op_bytes);
  2520. ctxt->src.val = old_cs;
  2521. rc = em_push(ctxt);
  2522. if (rc != X86EMUL_CONTINUE)
  2523. return rc;
  2524. ctxt->src.val = old_eip;
  2525. return em_push(ctxt);
  2526. }
  2527. static int em_ret_near_imm(struct x86_emulate_ctxt *ctxt)
  2528. {
  2529. int rc;
  2530. ctxt->dst.type = OP_REG;
  2531. ctxt->dst.addr.reg = &ctxt->_eip;
  2532. ctxt->dst.bytes = ctxt->op_bytes;
  2533. rc = emulate_pop(ctxt, &ctxt->dst.val, ctxt->op_bytes);
  2534. if (rc != X86EMUL_CONTINUE)
  2535. return rc;
  2536. rsp_increment(ctxt, ctxt->src.val);
  2537. return X86EMUL_CONTINUE;
  2538. }
  2539. static int em_add(struct x86_emulate_ctxt *ctxt)
  2540. {
  2541. emulate_2op_SrcV(ctxt, "add");
  2542. return X86EMUL_CONTINUE;
  2543. }
  2544. static int em_or(struct x86_emulate_ctxt *ctxt)
  2545. {
  2546. emulate_2op_SrcV(ctxt, "or");
  2547. return X86EMUL_CONTINUE;
  2548. }
  2549. static int em_adc(struct x86_emulate_ctxt *ctxt)
  2550. {
  2551. emulate_2op_SrcV(ctxt, "adc");
  2552. return X86EMUL_CONTINUE;
  2553. }
  2554. static int em_sbb(struct x86_emulate_ctxt *ctxt)
  2555. {
  2556. emulate_2op_SrcV(ctxt, "sbb");
  2557. return X86EMUL_CONTINUE;
  2558. }
  2559. static int em_and(struct x86_emulate_ctxt *ctxt)
  2560. {
  2561. emulate_2op_SrcV(ctxt, "and");
  2562. return X86EMUL_CONTINUE;
  2563. }
  2564. static int em_sub(struct x86_emulate_ctxt *ctxt)
  2565. {
  2566. emulate_2op_SrcV(ctxt, "sub");
  2567. return X86EMUL_CONTINUE;
  2568. }
  2569. static int em_xor(struct x86_emulate_ctxt *ctxt)
  2570. {
  2571. emulate_2op_SrcV(ctxt, "xor");
  2572. return X86EMUL_CONTINUE;
  2573. }
  2574. static int em_cmp(struct x86_emulate_ctxt *ctxt)
  2575. {
  2576. emulate_2op_SrcV(ctxt, "cmp");
  2577. /* Disable writeback. */
  2578. ctxt->dst.type = OP_NONE;
  2579. return X86EMUL_CONTINUE;
  2580. }
  2581. static int em_test(struct x86_emulate_ctxt *ctxt)
  2582. {
  2583. emulate_2op_SrcV(ctxt, "test");
  2584. /* Disable writeback. */
  2585. ctxt->dst.type = OP_NONE;
  2586. return X86EMUL_CONTINUE;
  2587. }
  2588. static int em_xchg(struct x86_emulate_ctxt *ctxt)
  2589. {
  2590. /* Write back the register source. */
  2591. ctxt->src.val = ctxt->dst.val;
  2592. write_register_operand(&ctxt->src);
  2593. /* Write back the memory destination with implicit LOCK prefix. */
  2594. ctxt->dst.val = ctxt->src.orig_val;
  2595. ctxt->lock_prefix = 1;
  2596. return X86EMUL_CONTINUE;
  2597. }
  2598. static int em_imul(struct x86_emulate_ctxt *ctxt)
  2599. {
  2600. emulate_2op_SrcV_nobyte(ctxt, "imul");
  2601. return X86EMUL_CONTINUE;
  2602. }
  2603. static int em_imul_3op(struct x86_emulate_ctxt *ctxt)
  2604. {
  2605. ctxt->dst.val = ctxt->src2.val;
  2606. return em_imul(ctxt);
  2607. }
  2608. static int em_cwd(struct x86_emulate_ctxt *ctxt)
  2609. {
  2610. ctxt->dst.type = OP_REG;
  2611. ctxt->dst.bytes = ctxt->src.bytes;
  2612. ctxt->dst.addr.reg = reg_rmw(ctxt, VCPU_REGS_RDX);
  2613. ctxt->dst.val = ~((ctxt->src.val >> (ctxt->src.bytes * 8 - 1)) - 1);
  2614. return X86EMUL_CONTINUE;
  2615. }
  2616. static int em_rdtsc(struct x86_emulate_ctxt *ctxt)
  2617. {
  2618. u64 tsc = 0;
  2619. ctxt->ops->get_msr(ctxt, MSR_IA32_TSC, &tsc);
  2620. *reg_write(ctxt, VCPU_REGS_RAX) = (u32)tsc;
  2621. *reg_write(ctxt, VCPU_REGS_RDX) = tsc >> 32;
  2622. return X86EMUL_CONTINUE;
  2623. }
  2624. static int em_rdpmc(struct x86_emulate_ctxt *ctxt)
  2625. {
  2626. u64 pmc;
  2627. if (ctxt->ops->read_pmc(ctxt, reg_read(ctxt, VCPU_REGS_RCX), &pmc))
  2628. return emulate_gp(ctxt, 0);
  2629. *reg_write(ctxt, VCPU_REGS_RAX) = (u32)pmc;
  2630. *reg_write(ctxt, VCPU_REGS_RDX) = pmc >> 32;
  2631. return X86EMUL_CONTINUE;
  2632. }
  2633. static int em_mov(struct x86_emulate_ctxt *ctxt)
  2634. {
  2635. memcpy(ctxt->dst.valptr, ctxt->src.valptr, ctxt->op_bytes);
  2636. return X86EMUL_CONTINUE;
  2637. }
  2638. static int em_cr_write(struct x86_emulate_ctxt *ctxt)
  2639. {
  2640. if (ctxt->ops->set_cr(ctxt, ctxt->modrm_reg, ctxt->src.val))
  2641. return emulate_gp(ctxt, 0);
  2642. /* Disable writeback. */
  2643. ctxt->dst.type = OP_NONE;
  2644. return X86EMUL_CONTINUE;
  2645. }
  2646. static int em_dr_write(struct x86_emulate_ctxt *ctxt)
  2647. {
  2648. unsigned long val;
  2649. if (ctxt->mode == X86EMUL_MODE_PROT64)
  2650. val = ctxt->src.val & ~0ULL;
  2651. else
  2652. val = ctxt->src.val & ~0U;
  2653. /* #UD condition is already handled. */
  2654. if (ctxt->ops->set_dr(ctxt, ctxt->modrm_reg, val) < 0)
  2655. return emulate_gp(ctxt, 0);
  2656. /* Disable writeback. */
  2657. ctxt->dst.type = OP_NONE;
  2658. return X86EMUL_CONTINUE;
  2659. }
  2660. static int em_wrmsr(struct x86_emulate_ctxt *ctxt)
  2661. {
  2662. u64 msr_data;
  2663. msr_data = (u32)reg_read(ctxt, VCPU_REGS_RAX)
  2664. | ((u64)reg_read(ctxt, VCPU_REGS_RDX) << 32);
  2665. if (ctxt->ops->set_msr(ctxt, reg_read(ctxt, VCPU_REGS_RCX), msr_data))
  2666. return emulate_gp(ctxt, 0);
  2667. return X86EMUL_CONTINUE;
  2668. }
  2669. static int em_rdmsr(struct x86_emulate_ctxt *ctxt)
  2670. {
  2671. u64 msr_data;
  2672. if (ctxt->ops->get_msr(ctxt, reg_read(ctxt, VCPU_REGS_RCX), &msr_data))
  2673. return emulate_gp(ctxt, 0);
  2674. *reg_write(ctxt, VCPU_REGS_RAX) = (u32)msr_data;
  2675. *reg_write(ctxt, VCPU_REGS_RDX) = msr_data >> 32;
  2676. return X86EMUL_CONTINUE;
  2677. }
  2678. static int em_mov_rm_sreg(struct x86_emulate_ctxt *ctxt)
  2679. {
  2680. if (ctxt->modrm_reg > VCPU_SREG_GS)
  2681. return emulate_ud(ctxt);
  2682. ctxt->dst.val = get_segment_selector(ctxt, ctxt->modrm_reg);
  2683. return X86EMUL_CONTINUE;
  2684. }
  2685. static int em_mov_sreg_rm(struct x86_emulate_ctxt *ctxt)
  2686. {
  2687. u16 sel = ctxt->src.val;
  2688. if (ctxt->modrm_reg == VCPU_SREG_CS || ctxt->modrm_reg > VCPU_SREG_GS)
  2689. return emulate_ud(ctxt);
  2690. if (ctxt->modrm_reg == VCPU_SREG_SS)
  2691. ctxt->interruptibility = KVM_X86_SHADOW_INT_MOV_SS;
  2692. /* Disable writeback. */
  2693. ctxt->dst.type = OP_NONE;
  2694. return load_segment_descriptor(ctxt, sel, ctxt->modrm_reg);
  2695. }
  2696. static int em_lldt(struct x86_emulate_ctxt *ctxt)
  2697. {
  2698. u16 sel = ctxt->src.val;
  2699. /* Disable writeback. */
  2700. ctxt->dst.type = OP_NONE;
  2701. return load_segment_descriptor(ctxt, sel, VCPU_SREG_LDTR);
  2702. }
  2703. static int em_ltr(struct x86_emulate_ctxt *ctxt)
  2704. {
  2705. u16 sel = ctxt->src.val;
  2706. /* Disable writeback. */
  2707. ctxt->dst.type = OP_NONE;
  2708. return load_segment_descriptor(ctxt, sel, VCPU_SREG_TR);
  2709. }
  2710. static int em_invlpg(struct x86_emulate_ctxt *ctxt)
  2711. {
  2712. int rc;
  2713. ulong linear;
  2714. rc = linearize(ctxt, ctxt->src.addr.mem, 1, false, &linear);
  2715. if (rc == X86EMUL_CONTINUE)
  2716. ctxt->ops->invlpg(ctxt, linear);
  2717. /* Disable writeback. */
  2718. ctxt->dst.type = OP_NONE;
  2719. return X86EMUL_CONTINUE;
  2720. }
  2721. static int em_clts(struct x86_emulate_ctxt *ctxt)
  2722. {
  2723. ulong cr0;
  2724. cr0 = ctxt->ops->get_cr(ctxt, 0);
  2725. cr0 &= ~X86_CR0_TS;
  2726. ctxt->ops->set_cr(ctxt, 0, cr0);
  2727. return X86EMUL_CONTINUE;
  2728. }
  2729. static int em_vmcall(struct x86_emulate_ctxt *ctxt)
  2730. {
  2731. int rc;
  2732. if (ctxt->modrm_mod != 3 || ctxt->modrm_rm != 1)
  2733. return X86EMUL_UNHANDLEABLE;
  2734. rc = ctxt->ops->fix_hypercall(ctxt);
  2735. if (rc != X86EMUL_CONTINUE)
  2736. return rc;
  2737. /* Let the processor re-execute the fixed hypercall */
  2738. ctxt->_eip = ctxt->eip;
  2739. /* Disable writeback. */
  2740. ctxt->dst.type = OP_NONE;
  2741. return X86EMUL_CONTINUE;
  2742. }
  2743. static int emulate_store_desc_ptr(struct x86_emulate_ctxt *ctxt,
  2744. void (*get)(struct x86_emulate_ctxt *ctxt,
  2745. struct desc_ptr *ptr))
  2746. {
  2747. struct desc_ptr desc_ptr;
  2748. if (ctxt->mode == X86EMUL_MODE_PROT64)
  2749. ctxt->op_bytes = 8;
  2750. get(ctxt, &desc_ptr);
  2751. if (ctxt->op_bytes == 2) {
  2752. ctxt->op_bytes = 4;
  2753. desc_ptr.address &= 0x00ffffff;
  2754. }
  2755. /* Disable writeback. */
  2756. ctxt->dst.type = OP_NONE;
  2757. return segmented_write(ctxt, ctxt->dst.addr.mem,
  2758. &desc_ptr, 2 + ctxt->op_bytes);
  2759. }
  2760. static int em_sgdt(struct x86_emulate_ctxt *ctxt)
  2761. {
  2762. return emulate_store_desc_ptr(ctxt, ctxt->ops->get_gdt);
  2763. }
  2764. static int em_sidt(struct x86_emulate_ctxt *ctxt)
  2765. {
  2766. return emulate_store_desc_ptr(ctxt, ctxt->ops->get_idt);
  2767. }
  2768. static int em_lgdt(struct x86_emulate_ctxt *ctxt)
  2769. {
  2770. struct desc_ptr desc_ptr;
  2771. int rc;
  2772. if (ctxt->mode == X86EMUL_MODE_PROT64)
  2773. ctxt->op_bytes = 8;
  2774. rc = read_descriptor(ctxt, ctxt->src.addr.mem,
  2775. &desc_ptr.size, &desc_ptr.address,
  2776. ctxt->op_bytes);
  2777. if (rc != X86EMUL_CONTINUE)
  2778. return rc;
  2779. ctxt->ops->set_gdt(ctxt, &desc_ptr);
  2780. /* Disable writeback. */
  2781. ctxt->dst.type = OP_NONE;
  2782. return X86EMUL_CONTINUE;
  2783. }
  2784. static int em_vmmcall(struct x86_emulate_ctxt *ctxt)
  2785. {
  2786. int rc;
  2787. rc = ctxt->ops->fix_hypercall(ctxt);
  2788. /* Disable writeback. */
  2789. ctxt->dst.type = OP_NONE;
  2790. return rc;
  2791. }
  2792. static int em_lidt(struct x86_emulate_ctxt *ctxt)
  2793. {
  2794. struct desc_ptr desc_ptr;
  2795. int rc;
  2796. if (ctxt->mode == X86EMUL_MODE_PROT64)
  2797. ctxt->op_bytes = 8;
  2798. rc = read_descriptor(ctxt, ctxt->src.addr.mem,
  2799. &desc_ptr.size, &desc_ptr.address,
  2800. ctxt->op_bytes);
  2801. if (rc != X86EMUL_CONTINUE)
  2802. return rc;
  2803. ctxt->ops->set_idt(ctxt, &desc_ptr);
  2804. /* Disable writeback. */
  2805. ctxt->dst.type = OP_NONE;
  2806. return X86EMUL_CONTINUE;
  2807. }
  2808. static int em_smsw(struct x86_emulate_ctxt *ctxt)
  2809. {
  2810. ctxt->dst.bytes = 2;
  2811. ctxt->dst.val = ctxt->ops->get_cr(ctxt, 0);
  2812. return X86EMUL_CONTINUE;
  2813. }
  2814. static int em_lmsw(struct x86_emulate_ctxt *ctxt)
  2815. {
  2816. ctxt->ops->set_cr(ctxt, 0, (ctxt->ops->get_cr(ctxt, 0) & ~0x0eul)
  2817. | (ctxt->src.val & 0x0f));
  2818. ctxt->dst.type = OP_NONE;
  2819. return X86EMUL_CONTINUE;
  2820. }
  2821. static int em_loop(struct x86_emulate_ctxt *ctxt)
  2822. {
  2823. register_address_increment(ctxt, reg_rmw(ctxt, VCPU_REGS_RCX), -1);
  2824. if ((address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) != 0) &&
  2825. (ctxt->b == 0xe2 || test_cc(ctxt->b ^ 0x5, ctxt->eflags)))
  2826. jmp_rel(ctxt, ctxt->src.val);
  2827. return X86EMUL_CONTINUE;
  2828. }
  2829. static int em_jcxz(struct x86_emulate_ctxt *ctxt)
  2830. {
  2831. if (address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) == 0)
  2832. jmp_rel(ctxt, ctxt->src.val);
  2833. return X86EMUL_CONTINUE;
  2834. }
  2835. static int em_in(struct x86_emulate_ctxt *ctxt)
  2836. {
  2837. if (!pio_in_emulated(ctxt, ctxt->dst.bytes, ctxt->src.val,
  2838. &ctxt->dst.val))
  2839. return X86EMUL_IO_NEEDED;
  2840. return X86EMUL_CONTINUE;
  2841. }
  2842. static int em_out(struct x86_emulate_ctxt *ctxt)
  2843. {
  2844. ctxt->ops->pio_out_emulated(ctxt, ctxt->src.bytes, ctxt->dst.val,
  2845. &ctxt->src.val, 1);
  2846. /* Disable writeback. */
  2847. ctxt->dst.type = OP_NONE;
  2848. return X86EMUL_CONTINUE;
  2849. }
  2850. static int em_cli(struct x86_emulate_ctxt *ctxt)
  2851. {
  2852. if (emulator_bad_iopl(ctxt))
  2853. return emulate_gp(ctxt, 0);
  2854. ctxt->eflags &= ~X86_EFLAGS_IF;
  2855. return X86EMUL_CONTINUE;
  2856. }
  2857. static int em_sti(struct x86_emulate_ctxt *ctxt)
  2858. {
  2859. if (emulator_bad_iopl(ctxt))
  2860. return emulate_gp(ctxt, 0);
  2861. ctxt->interruptibility = KVM_X86_SHADOW_INT_STI;
  2862. ctxt->eflags |= X86_EFLAGS_IF;
  2863. return X86EMUL_CONTINUE;
  2864. }
  2865. static int em_bt(struct x86_emulate_ctxt *ctxt)
  2866. {
  2867. /* Disable writeback. */
  2868. ctxt->dst.type = OP_NONE;
  2869. /* only subword offset */
  2870. ctxt->src.val &= (ctxt->dst.bytes << 3) - 1;
  2871. emulate_2op_SrcV_nobyte(ctxt, "bt");
  2872. return X86EMUL_CONTINUE;
  2873. }
  2874. static int em_bts(struct x86_emulate_ctxt *ctxt)
  2875. {
  2876. emulate_2op_SrcV_nobyte(ctxt, "bts");
  2877. return X86EMUL_CONTINUE;
  2878. }
  2879. static int em_btr(struct x86_emulate_ctxt *ctxt)
  2880. {
  2881. emulate_2op_SrcV_nobyte(ctxt, "btr");
  2882. return X86EMUL_CONTINUE;
  2883. }
  2884. static int em_btc(struct x86_emulate_ctxt *ctxt)
  2885. {
  2886. emulate_2op_SrcV_nobyte(ctxt, "btc");
  2887. return X86EMUL_CONTINUE;
  2888. }
  2889. static int em_bsf(struct x86_emulate_ctxt *ctxt)
  2890. {
  2891. emulate_2op_SrcV_nobyte(ctxt, "bsf");
  2892. return X86EMUL_CONTINUE;
  2893. }
  2894. static int em_bsr(struct x86_emulate_ctxt *ctxt)
  2895. {
  2896. emulate_2op_SrcV_nobyte(ctxt, "bsr");
  2897. return X86EMUL_CONTINUE;
  2898. }
  2899. static int em_cpuid(struct x86_emulate_ctxt *ctxt)
  2900. {
  2901. u32 eax, ebx, ecx, edx;
  2902. eax = reg_read(ctxt, VCPU_REGS_RAX);
  2903. ecx = reg_read(ctxt, VCPU_REGS_RCX);
  2904. ctxt->ops->get_cpuid(ctxt, &eax, &ebx, &ecx, &edx);
  2905. *reg_write(ctxt, VCPU_REGS_RAX) = eax;
  2906. *reg_write(ctxt, VCPU_REGS_RBX) = ebx;
  2907. *reg_write(ctxt, VCPU_REGS_RCX) = ecx;
  2908. *reg_write(ctxt, VCPU_REGS_RDX) = edx;
  2909. return X86EMUL_CONTINUE;
  2910. }
  2911. static int em_lahf(struct x86_emulate_ctxt *ctxt)
  2912. {
  2913. *reg_rmw(ctxt, VCPU_REGS_RAX) &= ~0xff00UL;
  2914. *reg_rmw(ctxt, VCPU_REGS_RAX) |= (ctxt->eflags & 0xff) << 8;
  2915. return X86EMUL_CONTINUE;
  2916. }
  2917. static int em_bswap(struct x86_emulate_ctxt *ctxt)
  2918. {
  2919. switch (ctxt->op_bytes) {
  2920. #ifdef CONFIG_X86_64
  2921. case 8:
  2922. asm("bswap %0" : "+r"(ctxt->dst.val));
  2923. break;
  2924. #endif
  2925. default:
  2926. asm("bswap %0" : "+r"(*(u32 *)&ctxt->dst.val));
  2927. break;
  2928. }
  2929. return X86EMUL_CONTINUE;
  2930. }
  2931. static bool valid_cr(int nr)
  2932. {
  2933. switch (nr) {
  2934. case 0:
  2935. case 2 ... 4:
  2936. case 8:
  2937. return true;
  2938. default:
  2939. return false;
  2940. }
  2941. }
  2942. static int check_cr_read(struct x86_emulate_ctxt *ctxt)
  2943. {
  2944. if (!valid_cr(ctxt->modrm_reg))
  2945. return emulate_ud(ctxt);
  2946. return X86EMUL_CONTINUE;
  2947. }
  2948. static int check_cr_write(struct x86_emulate_ctxt *ctxt)
  2949. {
  2950. u64 new_val = ctxt->src.val64;
  2951. int cr = ctxt->modrm_reg;
  2952. u64 efer = 0;
  2953. static u64 cr_reserved_bits[] = {
  2954. 0xffffffff00000000ULL,
  2955. 0, 0, 0, /* CR3 checked later */
  2956. CR4_RESERVED_BITS,
  2957. 0, 0, 0,
  2958. CR8_RESERVED_BITS,
  2959. };
  2960. if (!valid_cr(cr))
  2961. return emulate_ud(ctxt);
  2962. if (new_val & cr_reserved_bits[cr])
  2963. return emulate_gp(ctxt, 0);
  2964. switch (cr) {
  2965. case 0: {
  2966. u64 cr4;
  2967. if (((new_val & X86_CR0_PG) && !(new_val & X86_CR0_PE)) ||
  2968. ((new_val & X86_CR0_NW) && !(new_val & X86_CR0_CD)))
  2969. return emulate_gp(ctxt, 0);
  2970. cr4 = ctxt->ops->get_cr(ctxt, 4);
  2971. ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);
  2972. if ((new_val & X86_CR0_PG) && (efer & EFER_LME) &&
  2973. !(cr4 & X86_CR4_PAE))
  2974. return emulate_gp(ctxt, 0);
  2975. break;
  2976. }
  2977. case 3: {
  2978. u64 rsvd = 0;
  2979. ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);
  2980. if (efer & EFER_LMA)
  2981. rsvd = CR3_L_MODE_RESERVED_BITS;
  2982. else if (ctxt->ops->get_cr(ctxt, 4) & X86_CR4_PAE)
  2983. rsvd = CR3_PAE_RESERVED_BITS;
  2984. else if (ctxt->ops->get_cr(ctxt, 0) & X86_CR0_PG)
  2985. rsvd = CR3_NONPAE_RESERVED_BITS;
  2986. if (new_val & rsvd)
  2987. return emulate_gp(ctxt, 0);
  2988. break;
  2989. }
  2990. case 4: {
  2991. ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);
  2992. if ((efer & EFER_LMA) && !(new_val & X86_CR4_PAE))
  2993. return emulate_gp(ctxt, 0);
  2994. break;
  2995. }
  2996. }
  2997. return X86EMUL_CONTINUE;
  2998. }
  2999. static int check_dr7_gd(struct x86_emulate_ctxt *ctxt)
  3000. {
  3001. unsigned long dr7;
  3002. ctxt->ops->get_dr(ctxt, 7, &dr7);
  3003. /* Check if DR7.Global_Enable is set */
  3004. return dr7 & (1 << 13);
  3005. }
  3006. static int check_dr_read(struct x86_emulate_ctxt *ctxt)
  3007. {
  3008. int dr = ctxt->modrm_reg;
  3009. u64 cr4;
  3010. if (dr > 7)
  3011. return emulate_ud(ctxt);
  3012. cr4 = ctxt->ops->get_cr(ctxt, 4);
  3013. if ((cr4 & X86_CR4_DE) && (dr == 4 || dr == 5))
  3014. return emulate_ud(ctxt);
  3015. if (check_dr7_gd(ctxt))
  3016. return emulate_db(ctxt);
  3017. return X86EMUL_CONTINUE;
  3018. }
  3019. static int check_dr_write(struct x86_emulate_ctxt *ctxt)
  3020. {
  3021. u64 new_val = ctxt->src.val64;
  3022. int dr = ctxt->modrm_reg;
  3023. if ((dr == 6 || dr == 7) && (new_val & 0xffffffff00000000ULL))
  3024. return emulate_gp(ctxt, 0);
  3025. return check_dr_read(ctxt);
  3026. }
  3027. static int check_svme(struct x86_emulate_ctxt *ctxt)
  3028. {
  3029. u64 efer;
  3030. ctxt->ops->get_msr(ctxt, MSR_EFER, &efer);
  3031. if (!(efer & EFER_SVME))
  3032. return emulate_ud(ctxt);
  3033. return X86EMUL_CONTINUE;
  3034. }
  3035. static int check_svme_pa(struct x86_emulate_ctxt *ctxt)
  3036. {
  3037. u64 rax = reg_read(ctxt, VCPU_REGS_RAX);
  3038. /* Valid physical address? */
  3039. if (rax & 0xffff000000000000ULL)
  3040. return emulate_gp(ctxt, 0);
  3041. return check_svme(ctxt);
  3042. }
  3043. static int check_rdtsc(struct x86_emulate_ctxt *ctxt)
  3044. {
  3045. u64 cr4 = ctxt->ops->get_cr(ctxt, 4);
  3046. if (cr4 & X86_CR4_TSD && ctxt->ops->cpl(ctxt))
  3047. return emulate_ud(ctxt);
  3048. return X86EMUL_CONTINUE;
  3049. }
  3050. static int check_rdpmc(struct x86_emulate_ctxt *ctxt)
  3051. {
  3052. u64 cr4 = ctxt->ops->get_cr(ctxt, 4);
  3053. u64 rcx = reg_read(ctxt, VCPU_REGS_RCX);
  3054. if ((!(cr4 & X86_CR4_PCE) && ctxt->ops->cpl(ctxt)) ||
  3055. (rcx > 3))
  3056. return emulate_gp(ctxt, 0);
  3057. return X86EMUL_CONTINUE;
  3058. }
  3059. static int check_perm_in(struct x86_emulate_ctxt *ctxt)
  3060. {
  3061. ctxt->dst.bytes = min(ctxt->dst.bytes, 4u);
  3062. if (!emulator_io_permited(ctxt, ctxt->src.val, ctxt->dst.bytes))
  3063. return emulate_gp(ctxt, 0);
  3064. return X86EMUL_CONTINUE;
  3065. }
  3066. static int check_perm_out(struct x86_emulate_ctxt *ctxt)
  3067. {
  3068. ctxt->src.bytes = min(ctxt->src.bytes, 4u);
  3069. if (!emulator_io_permited(ctxt, ctxt->dst.val, ctxt->src.bytes))
  3070. return emulate_gp(ctxt, 0);
  3071. return X86EMUL_CONTINUE;
  3072. }
  3073. #define D(_y) { .flags = (_y) }
  3074. #define DI(_y, _i) { .flags = (_y), .intercept = x86_intercept_##_i }
  3075. #define DIP(_y, _i, _p) { .flags = (_y), .intercept = x86_intercept_##_i, \
  3076. .check_perm = (_p) }
  3077. #define N D(0)
  3078. #define EXT(_f, _e) { .flags = ((_f) | RMExt), .u.group = (_e) }
  3079. #define G(_f, _g) { .flags = ((_f) | Group | ModRM), .u.group = (_g) }
  3080. #define GD(_f, _g) { .flags = ((_f) | GroupDual | ModRM), .u.gdual = (_g) }
  3081. #define I(_f, _e) { .flags = (_f), .u.execute = (_e) }
  3082. #define II(_f, _e, _i) \
  3083. { .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i }
  3084. #define IIP(_f, _e, _i, _p) \
  3085. { .flags = (_f), .u.execute = (_e), .intercept = x86_intercept_##_i, \
  3086. .check_perm = (_p) }
  3087. #define GP(_f, _g) { .flags = ((_f) | Prefix), .u.gprefix = (_g) }
  3088. #define D2bv(_f) D((_f) | ByteOp), D(_f)
  3089. #define D2bvIP(_f, _i, _p) DIP((_f) | ByteOp, _i, _p), DIP(_f, _i, _p)
  3090. #define I2bv(_f, _e) I((_f) | ByteOp, _e), I(_f, _e)
  3091. #define I2bvIP(_f, _e, _i, _p) \
  3092. IIP((_f) | ByteOp, _e, _i, _p), IIP(_f, _e, _i, _p)
  3093. #define I6ALU(_f, _e) I2bv((_f) | DstMem | SrcReg | ModRM, _e), \
  3094. I2bv(((_f) | DstReg | SrcMem | ModRM) & ~Lock, _e), \
  3095. I2bv(((_f) & ~Lock) | DstAcc | SrcImm, _e)
  3096. static const struct opcode group7_rm1[] = {
  3097. DI(SrcNone | Priv, monitor),
  3098. DI(SrcNone | Priv, mwait),
  3099. N, N, N, N, N, N,
  3100. };
  3101. static const struct opcode group7_rm3[] = {
  3102. DIP(SrcNone | Prot | Priv, vmrun, check_svme_pa),
  3103. II(SrcNone | Prot | VendorSpecific, em_vmmcall, vmmcall),
  3104. DIP(SrcNone | Prot | Priv, vmload, check_svme_pa),
  3105. DIP(SrcNone | Prot | Priv, vmsave, check_svme_pa),
  3106. DIP(SrcNone | Prot | Priv, stgi, check_svme),
  3107. DIP(SrcNone | Prot | Priv, clgi, check_svme),
  3108. DIP(SrcNone | Prot | Priv, skinit, check_svme),
  3109. DIP(SrcNone | Prot | Priv, invlpga, check_svme),
  3110. };
  3111. static const struct opcode group7_rm7[] = {
  3112. N,
  3113. DIP(SrcNone, rdtscp, check_rdtsc),
  3114. N, N, N, N, N, N,
  3115. };
  3116. static const struct opcode group1[] = {
  3117. I(Lock, em_add),
  3118. I(Lock | PageTable, em_or),
  3119. I(Lock, em_adc),
  3120. I(Lock, em_sbb),
  3121. I(Lock | PageTable, em_and),
  3122. I(Lock, em_sub),
  3123. I(Lock, em_xor),
  3124. I(0, em_cmp),
  3125. };
  3126. static const struct opcode group1A[] = {
  3127. I(DstMem | SrcNone | Mov | Stack, em_pop), N, N, N, N, N, N, N,
  3128. };
  3129. static const struct opcode group3[] = {
  3130. I(DstMem | SrcImm, em_test),
  3131. I(DstMem | SrcImm, em_test),
  3132. I(DstMem | SrcNone | Lock, em_not),
  3133. I(DstMem | SrcNone | Lock, em_neg),
  3134. I(SrcMem, em_mul_ex),
  3135. I(SrcMem, em_imul_ex),
  3136. I(SrcMem, em_div_ex),
  3137. I(SrcMem, em_idiv_ex),
  3138. };
  3139. static const struct opcode group4[] = {
  3140. I(ByteOp | DstMem | SrcNone | Lock, em_grp45),
  3141. I(ByteOp | DstMem | SrcNone | Lock, em_grp45),
  3142. N, N, N, N, N, N,
  3143. };
  3144. static const struct opcode group5[] = {
  3145. I(DstMem | SrcNone | Lock, em_grp45),
  3146. I(DstMem | SrcNone | Lock, em_grp45),
  3147. I(SrcMem | Stack, em_grp45),
  3148. I(SrcMemFAddr | ImplicitOps | Stack, em_call_far),
  3149. I(SrcMem | Stack, em_grp45),
  3150. I(SrcMemFAddr | ImplicitOps, em_grp45),
  3151. I(SrcMem | Stack, em_grp45), N,
  3152. };
  3153. static const struct opcode group6[] = {
  3154. DI(Prot, sldt),
  3155. DI(Prot, str),
  3156. II(Prot | Priv | SrcMem16, em_lldt, lldt),
  3157. II(Prot | Priv | SrcMem16, em_ltr, ltr),
  3158. N, N, N, N,
  3159. };
  3160. static const struct group_dual group7 = { {
  3161. II(Mov | DstMem | Priv, em_sgdt, sgdt),
  3162. II(Mov | DstMem | Priv, em_sidt, sidt),
  3163. II(SrcMem | Priv, em_lgdt, lgdt),
  3164. II(SrcMem | Priv, em_lidt, lidt),
  3165. II(SrcNone | DstMem | Mov, em_smsw, smsw), N,
  3166. II(SrcMem16 | Mov | Priv, em_lmsw, lmsw),
  3167. II(SrcMem | ByteOp | Priv | NoAccess, em_invlpg, invlpg),
  3168. }, {
  3169. I(SrcNone | Priv | VendorSpecific, em_vmcall),
  3170. EXT(0, group7_rm1),
  3171. N, EXT(0, group7_rm3),
  3172. II(SrcNone | DstMem | Mov, em_smsw, smsw), N,
  3173. II(SrcMem16 | Mov | Priv, em_lmsw, lmsw),
  3174. EXT(0, group7_rm7),
  3175. } };
  3176. static const struct opcode group8[] = {
  3177. N, N, N, N,
  3178. I(DstMem | SrcImmByte, em_bt),
  3179. I(DstMem | SrcImmByte | Lock | PageTable, em_bts),
  3180. I(DstMem | SrcImmByte | Lock, em_btr),
  3181. I(DstMem | SrcImmByte | Lock | PageTable, em_btc),
  3182. };
  3183. static const struct group_dual group9 = { {
  3184. N, I(DstMem64 | Lock | PageTable, em_cmpxchg8b), N, N, N, N, N, N,
  3185. }, {
  3186. N, N, N, N, N, N, N, N,
  3187. } };
  3188. static const struct opcode group11[] = {
  3189. I(DstMem | SrcImm | Mov | PageTable, em_mov),
  3190. X7(D(Undefined)),
  3191. };
  3192. static const struct gprefix pfx_0f_6f_0f_7f = {
  3193. I(Mmx, em_mov), I(Sse | Aligned, em_mov), N, I(Sse | Unaligned, em_mov),
  3194. };
  3195. static const struct gprefix pfx_vmovntpx = {
  3196. I(0, em_mov), N, N, N,
  3197. };
  3198. static const struct opcode opcode_table[256] = {
  3199. /* 0x00 - 0x07 */
  3200. I6ALU(Lock, em_add),
  3201. I(ImplicitOps | Stack | No64 | Src2ES, em_push_sreg),
  3202. I(ImplicitOps | Stack | No64 | Src2ES, em_pop_sreg),
  3203. /* 0x08 - 0x0F */
  3204. I6ALU(Lock | PageTable, em_or),
  3205. I(ImplicitOps | Stack | No64 | Src2CS, em_push_sreg),
  3206. N,
  3207. /* 0x10 - 0x17 */
  3208. I6ALU(Lock, em_adc),
  3209. I(ImplicitOps | Stack | No64 | Src2SS, em_push_sreg),
  3210. I(ImplicitOps | Stack | No64 | Src2SS, em_pop_sreg),
  3211. /* 0x18 - 0x1F */
  3212. I6ALU(Lock, em_sbb),
  3213. I(ImplicitOps | Stack | No64 | Src2DS, em_push_sreg),
  3214. I(ImplicitOps | Stack | No64 | Src2DS, em_pop_sreg),
  3215. /* 0x20 - 0x27 */
  3216. I6ALU(Lock | PageTable, em_and), N, N,
  3217. /* 0x28 - 0x2F */
  3218. I6ALU(Lock, em_sub), N, I(ByteOp | DstAcc | No64, em_das),
  3219. /* 0x30 - 0x37 */
  3220. I6ALU(Lock, em_xor), N, N,
  3221. /* 0x38 - 0x3F */
  3222. I6ALU(0, em_cmp), N, N,
  3223. /* 0x40 - 0x4F */
  3224. X16(D(DstReg)),
  3225. /* 0x50 - 0x57 */
  3226. X8(I(SrcReg | Stack, em_push)),
  3227. /* 0x58 - 0x5F */
  3228. X8(I(DstReg | Stack, em_pop)),
  3229. /* 0x60 - 0x67 */
  3230. I(ImplicitOps | Stack | No64, em_pusha),
  3231. I(ImplicitOps | Stack | No64, em_popa),
  3232. N, D(DstReg | SrcMem32 | ModRM | Mov) /* movsxd (x86/64) */ ,
  3233. N, N, N, N,
  3234. /* 0x68 - 0x6F */
  3235. I(SrcImm | Mov | Stack, em_push),
  3236. I(DstReg | SrcMem | ModRM | Src2Imm, em_imul_3op),
  3237. I(SrcImmByte | Mov | Stack, em_push),
  3238. I(DstReg | SrcMem | ModRM | Src2ImmByte, em_imul_3op),
  3239. I2bvIP(DstDI | SrcDX | Mov | String | Unaligned, em_in, ins, check_perm_in), /* insb, insw/insd */
  3240. I2bvIP(SrcSI | DstDX | String, em_out, outs, check_perm_out), /* outsb, outsw/outsd */
  3241. /* 0x70 - 0x7F */
  3242. X16(D(SrcImmByte)),
  3243. /* 0x80 - 0x87 */
  3244. G(ByteOp | DstMem | SrcImm, group1),
  3245. G(DstMem | SrcImm, group1),
  3246. G(ByteOp | DstMem | SrcImm | No64, group1),
  3247. G(DstMem | SrcImmByte, group1),
  3248. I2bv(DstMem | SrcReg | ModRM, em_test),
  3249. I2bv(DstMem | SrcReg | ModRM | Lock | PageTable, em_xchg),
  3250. /* 0x88 - 0x8F */
  3251. I2bv(DstMem | SrcReg | ModRM | Mov | PageTable, em_mov),
  3252. I2bv(DstReg | SrcMem | ModRM | Mov, em_mov),
  3253. I(DstMem | SrcNone | ModRM | Mov | PageTable, em_mov_rm_sreg),
  3254. D(ModRM | SrcMem | NoAccess | DstReg),
  3255. I(ImplicitOps | SrcMem16 | ModRM, em_mov_sreg_rm),
  3256. G(0, group1A),
  3257. /* 0x90 - 0x97 */
  3258. DI(SrcAcc | DstReg, pause), X7(D(SrcAcc | DstReg)),
  3259. /* 0x98 - 0x9F */
  3260. D(DstAcc | SrcNone), I(ImplicitOps | SrcAcc, em_cwd),
  3261. I(SrcImmFAddr | No64, em_call_far), N,
  3262. II(ImplicitOps | Stack, em_pushf, pushf),
  3263. II(ImplicitOps | Stack, em_popf, popf), N, I(ImplicitOps, em_lahf),
  3264. /* 0xA0 - 0xA7 */
  3265. I2bv(DstAcc | SrcMem | Mov | MemAbs, em_mov),
  3266. I2bv(DstMem | SrcAcc | Mov | MemAbs | PageTable, em_mov),
  3267. I2bv(SrcSI | DstDI | Mov | String, em_mov),
  3268. I2bv(SrcSI | DstDI | String, em_cmp),
  3269. /* 0xA8 - 0xAF */
  3270. I2bv(DstAcc | SrcImm, em_test),
  3271. I2bv(SrcAcc | DstDI | Mov | String, em_mov),
  3272. I2bv(SrcSI | DstAcc | Mov | String, em_mov),
  3273. I2bv(SrcAcc | DstDI | String, em_cmp),
  3274. /* 0xB0 - 0xB7 */
  3275. X8(I(ByteOp | DstReg | SrcImm | Mov, em_mov)),
  3276. /* 0xB8 - 0xBF */
  3277. X8(I(DstReg | SrcImm64 | Mov, em_mov)),
  3278. /* 0xC0 - 0xC7 */
  3279. D2bv(DstMem | SrcImmByte | ModRM),
  3280. I(ImplicitOps | Stack | SrcImmU16, em_ret_near_imm),
  3281. I(ImplicitOps | Stack, em_ret),
  3282. I(DstReg | SrcMemFAddr | ModRM | No64 | Src2ES, em_lseg),
  3283. I(DstReg | SrcMemFAddr | ModRM | No64 | Src2DS, em_lseg),
  3284. G(ByteOp, group11), G(0, group11),
  3285. /* 0xC8 - 0xCF */
  3286. I(Stack | SrcImmU16 | Src2ImmByte, em_enter), I(Stack, em_leave),
  3287. N, I(ImplicitOps | Stack, em_ret_far),
  3288. D(ImplicitOps), DI(SrcImmByte, intn),
  3289. D(ImplicitOps | No64), II(ImplicitOps, em_iret, iret),
  3290. /* 0xD0 - 0xD7 */
  3291. D2bv(DstMem | SrcOne | ModRM), D2bv(DstMem | ModRM),
  3292. N, I(DstAcc | SrcImmByte | No64, em_aad), N, N,
  3293. /* 0xD8 - 0xDF */
  3294. N, N, N, N, N, N, N, N,
  3295. /* 0xE0 - 0xE7 */
  3296. X3(I(SrcImmByte, em_loop)),
  3297. I(SrcImmByte, em_jcxz),
  3298. I2bvIP(SrcImmUByte | DstAcc, em_in, in, check_perm_in),
  3299. I2bvIP(SrcAcc | DstImmUByte, em_out, out, check_perm_out),
  3300. /* 0xE8 - 0xEF */
  3301. I(SrcImm | Stack, em_call), D(SrcImm | ImplicitOps),
  3302. I(SrcImmFAddr | No64, em_jmp_far), D(SrcImmByte | ImplicitOps),
  3303. I2bvIP(SrcDX | DstAcc, em_in, in, check_perm_in),
  3304. I2bvIP(SrcAcc | DstDX, em_out, out, check_perm_out),
  3305. /* 0xF0 - 0xF7 */
  3306. N, DI(ImplicitOps, icebp), N, N,
  3307. DI(ImplicitOps | Priv, hlt), D(ImplicitOps),
  3308. G(ByteOp, group3), G(0, group3),
  3309. /* 0xF8 - 0xFF */
  3310. D(ImplicitOps), D(ImplicitOps),
  3311. I(ImplicitOps, em_cli), I(ImplicitOps, em_sti),
  3312. D(ImplicitOps), D(ImplicitOps), G(0, group4), G(0, group5),
  3313. };
  3314. static const struct opcode twobyte_table[256] = {
  3315. /* 0x00 - 0x0F */
  3316. G(0, group6), GD(0, &group7), N, N,
  3317. N, I(ImplicitOps | VendorSpecific, em_syscall),
  3318. II(ImplicitOps | Priv, em_clts, clts), N,
  3319. DI(ImplicitOps | Priv, invd), DI(ImplicitOps | Priv, wbinvd), N, N,
  3320. N, D(ImplicitOps | ModRM), N, N,
  3321. /* 0x10 - 0x1F */
  3322. N, N, N, N, N, N, N, N, D(ImplicitOps | ModRM), N, N, N, N, N, N, N,
  3323. /* 0x20 - 0x2F */
  3324. DIP(ModRM | DstMem | Priv | Op3264, cr_read, check_cr_read),
  3325. DIP(ModRM | DstMem | Priv | Op3264, dr_read, check_dr_read),
  3326. IIP(ModRM | SrcMem | Priv | Op3264, em_cr_write, cr_write, check_cr_write),
  3327. IIP(ModRM | SrcMem | Priv | Op3264, em_dr_write, dr_write, check_dr_write),
  3328. N, N, N, N,
  3329. N, N, N, GP(ModRM | DstMem | SrcReg | Sse | Mov | Aligned, &pfx_vmovntpx),
  3330. N, N, N, N,
  3331. /* 0x30 - 0x3F */
  3332. II(ImplicitOps | Priv, em_wrmsr, wrmsr),
  3333. IIP(ImplicitOps, em_rdtsc, rdtsc, check_rdtsc),
  3334. II(ImplicitOps | Priv, em_rdmsr, rdmsr),
  3335. IIP(ImplicitOps, em_rdpmc, rdpmc, check_rdpmc),
  3336. I(ImplicitOps | VendorSpecific, em_sysenter),
  3337. I(ImplicitOps | Priv | VendorSpecific, em_sysexit),
  3338. N, N,
  3339. N, N, N, N, N, N, N, N,
  3340. /* 0x40 - 0x4F */
  3341. X16(D(DstReg | SrcMem | ModRM | Mov)),
  3342. /* 0x50 - 0x5F */
  3343. N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
  3344. /* 0x60 - 0x6F */
  3345. N, N, N, N,
  3346. N, N, N, N,
  3347. N, N, N, N,
  3348. N, N, N, GP(SrcMem | DstReg | ModRM | Mov, &pfx_0f_6f_0f_7f),
  3349. /* 0x70 - 0x7F */
  3350. N, N, N, N,
  3351. N, N, N, N,
  3352. N, N, N, N,
  3353. N, N, N, GP(SrcReg | DstMem | ModRM | Mov, &pfx_0f_6f_0f_7f),
  3354. /* 0x80 - 0x8F */
  3355. X16(D(SrcImm)),
  3356. /* 0x90 - 0x9F */
  3357. X16(D(ByteOp | DstMem | SrcNone | ModRM| Mov)),
  3358. /* 0xA0 - 0xA7 */
  3359. I(Stack | Src2FS, em_push_sreg), I(Stack | Src2FS, em_pop_sreg),
  3360. II(ImplicitOps, em_cpuid, cpuid), I(DstMem | SrcReg | ModRM | BitOp, em_bt),
  3361. D(DstMem | SrcReg | Src2ImmByte | ModRM),
  3362. D(DstMem | SrcReg | Src2CL | ModRM), N, N,
  3363. /* 0xA8 - 0xAF */
  3364. I(Stack | Src2GS, em_push_sreg), I(Stack | Src2GS, em_pop_sreg),
  3365. DI(ImplicitOps, rsm),
  3366. I(DstMem | SrcReg | ModRM | BitOp | Lock | PageTable, em_bts),
  3367. D(DstMem | SrcReg | Src2ImmByte | ModRM),
  3368. D(DstMem | SrcReg | Src2CL | ModRM),
  3369. D(ModRM), I(DstReg | SrcMem | ModRM, em_imul),
  3370. /* 0xB0 - 0xB7 */
  3371. I2bv(DstMem | SrcReg | ModRM | Lock | PageTable, em_cmpxchg),
  3372. I(DstReg | SrcMemFAddr | ModRM | Src2SS, em_lseg),
  3373. I(DstMem | SrcReg | ModRM | BitOp | Lock, em_btr),
  3374. I(DstReg | SrcMemFAddr | ModRM | Src2FS, em_lseg),
  3375. I(DstReg | SrcMemFAddr | ModRM | Src2GS, em_lseg),
  3376. D(DstReg | SrcMem8 | ModRM | Mov), D(DstReg | SrcMem16 | ModRM | Mov),
  3377. /* 0xB8 - 0xBF */
  3378. N, N,
  3379. G(BitOp, group8),
  3380. I(DstMem | SrcReg | ModRM | BitOp | Lock | PageTable, em_btc),
  3381. I(DstReg | SrcMem | ModRM, em_bsf), I(DstReg | SrcMem | ModRM, em_bsr),
  3382. D(DstReg | SrcMem8 | ModRM | Mov), D(DstReg | SrcMem16 | ModRM | Mov),
  3383. /* 0xC0 - 0xC7 */
  3384. D2bv(DstMem | SrcReg | ModRM | Lock),
  3385. N, D(DstMem | SrcReg | ModRM | Mov),
  3386. N, N, N, GD(0, &group9),
  3387. /* 0xC8 - 0xCF */
  3388. X8(I(DstReg, em_bswap)),
  3389. /* 0xD0 - 0xDF */
  3390. N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
  3391. /* 0xE0 - 0xEF */
  3392. N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N,
  3393. /* 0xF0 - 0xFF */
  3394. N, N, N, N, N, N, N, N, N, N, N, N, N, N, N, N
  3395. };
  3396. #undef D
  3397. #undef N
  3398. #undef G
  3399. #undef GD
  3400. #undef I
  3401. #undef GP
  3402. #undef EXT
  3403. #undef D2bv
  3404. #undef D2bvIP
  3405. #undef I2bv
  3406. #undef I2bvIP
  3407. #undef I6ALU
  3408. static unsigned imm_size(struct x86_emulate_ctxt *ctxt)
  3409. {
  3410. unsigned size;
  3411. size = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  3412. if (size == 8)
  3413. size = 4;
  3414. return size;
  3415. }
  3416. static int decode_imm(struct x86_emulate_ctxt *ctxt, struct operand *op,
  3417. unsigned size, bool sign_extension)
  3418. {
  3419. int rc = X86EMUL_CONTINUE;
  3420. op->type = OP_IMM;
  3421. op->bytes = size;
  3422. op->addr.mem.ea = ctxt->_eip;
  3423. /* NB. Immediates are sign-extended as necessary. */
  3424. switch (op->bytes) {
  3425. case 1:
  3426. op->val = insn_fetch(s8, ctxt);
  3427. break;
  3428. case 2:
  3429. op->val = insn_fetch(s16, ctxt);
  3430. break;
  3431. case 4:
  3432. op->val = insn_fetch(s32, ctxt);
  3433. break;
  3434. case 8:
  3435. op->val = insn_fetch(s64, ctxt);
  3436. break;
  3437. }
  3438. if (!sign_extension) {
  3439. switch (op->bytes) {
  3440. case 1:
  3441. op->val &= 0xff;
  3442. break;
  3443. case 2:
  3444. op->val &= 0xffff;
  3445. break;
  3446. case 4:
  3447. op->val &= 0xffffffff;
  3448. break;
  3449. }
  3450. }
  3451. done:
  3452. return rc;
  3453. }
  3454. static int decode_operand(struct x86_emulate_ctxt *ctxt, struct operand *op,
  3455. unsigned d)
  3456. {
  3457. int rc = X86EMUL_CONTINUE;
  3458. switch (d) {
  3459. case OpReg:
  3460. decode_register_operand(ctxt, op);
  3461. break;
  3462. case OpImmUByte:
  3463. rc = decode_imm(ctxt, op, 1, false);
  3464. break;
  3465. case OpMem:
  3466. ctxt->memop.bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  3467. mem_common:
  3468. *op = ctxt->memop;
  3469. ctxt->memopp = op;
  3470. if ((ctxt->d & BitOp) && op == &ctxt->dst)
  3471. fetch_bit_operand(ctxt);
  3472. op->orig_val = op->val;
  3473. break;
  3474. case OpMem64:
  3475. ctxt->memop.bytes = 8;
  3476. goto mem_common;
  3477. case OpAcc:
  3478. op->type = OP_REG;
  3479. op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  3480. op->addr.reg = reg_rmw(ctxt, VCPU_REGS_RAX);
  3481. fetch_register_operand(op);
  3482. op->orig_val = op->val;
  3483. break;
  3484. case OpDI:
  3485. op->type = OP_MEM;
  3486. op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  3487. op->addr.mem.ea =
  3488. register_address(ctxt, reg_read(ctxt, VCPU_REGS_RDI));
  3489. op->addr.mem.seg = VCPU_SREG_ES;
  3490. op->val = 0;
  3491. op->count = 1;
  3492. break;
  3493. case OpDX:
  3494. op->type = OP_REG;
  3495. op->bytes = 2;
  3496. op->addr.reg = reg_rmw(ctxt, VCPU_REGS_RDX);
  3497. fetch_register_operand(op);
  3498. break;
  3499. case OpCL:
  3500. op->bytes = 1;
  3501. op->val = reg_read(ctxt, VCPU_REGS_RCX) & 0xff;
  3502. break;
  3503. case OpImmByte:
  3504. rc = decode_imm(ctxt, op, 1, true);
  3505. break;
  3506. case OpOne:
  3507. op->bytes = 1;
  3508. op->val = 1;
  3509. break;
  3510. case OpImm:
  3511. rc = decode_imm(ctxt, op, imm_size(ctxt), true);
  3512. break;
  3513. case OpImm64:
  3514. rc = decode_imm(ctxt, op, ctxt->op_bytes, true);
  3515. break;
  3516. case OpMem8:
  3517. ctxt->memop.bytes = 1;
  3518. goto mem_common;
  3519. case OpMem16:
  3520. ctxt->memop.bytes = 2;
  3521. goto mem_common;
  3522. case OpMem32:
  3523. ctxt->memop.bytes = 4;
  3524. goto mem_common;
  3525. case OpImmU16:
  3526. rc = decode_imm(ctxt, op, 2, false);
  3527. break;
  3528. case OpImmU:
  3529. rc = decode_imm(ctxt, op, imm_size(ctxt), false);
  3530. break;
  3531. case OpSI:
  3532. op->type = OP_MEM;
  3533. op->bytes = (ctxt->d & ByteOp) ? 1 : ctxt->op_bytes;
  3534. op->addr.mem.ea =
  3535. register_address(ctxt, reg_read(ctxt, VCPU_REGS_RSI));
  3536. op->addr.mem.seg = seg_override(ctxt);
  3537. op->val = 0;
  3538. op->count = 1;
  3539. break;
  3540. case OpImmFAddr:
  3541. op->type = OP_IMM;
  3542. op->addr.mem.ea = ctxt->_eip;
  3543. op->bytes = ctxt->op_bytes + 2;
  3544. insn_fetch_arr(op->valptr, op->bytes, ctxt);
  3545. break;
  3546. case OpMemFAddr:
  3547. ctxt->memop.bytes = ctxt->op_bytes + 2;
  3548. goto mem_common;
  3549. case OpES:
  3550. op->val = VCPU_SREG_ES;
  3551. break;
  3552. case OpCS:
  3553. op->val = VCPU_SREG_CS;
  3554. break;
  3555. case OpSS:
  3556. op->val = VCPU_SREG_SS;
  3557. break;
  3558. case OpDS:
  3559. op->val = VCPU_SREG_DS;
  3560. break;
  3561. case OpFS:
  3562. op->val = VCPU_SREG_FS;
  3563. break;
  3564. case OpGS:
  3565. op->val = VCPU_SREG_GS;
  3566. break;
  3567. case OpImplicit:
  3568. /* Special instructions do their own operand decoding. */
  3569. default:
  3570. op->type = OP_NONE; /* Disable writeback. */
  3571. break;
  3572. }
  3573. done:
  3574. return rc;
  3575. }
  3576. int x86_decode_insn(struct x86_emulate_ctxt *ctxt, void *insn, int insn_len)
  3577. {
  3578. int rc = X86EMUL_CONTINUE;
  3579. int mode = ctxt->mode;
  3580. int def_op_bytes, def_ad_bytes, goffset, simd_prefix;
  3581. bool op_prefix = false;
  3582. struct opcode opcode;
  3583. ctxt->memop.type = OP_NONE;
  3584. ctxt->memopp = NULL;
  3585. ctxt->_eip = ctxt->eip;
  3586. ctxt->fetch.start = ctxt->_eip;
  3587. ctxt->fetch.end = ctxt->fetch.start + insn_len;
  3588. if (insn_len > 0)
  3589. memcpy(ctxt->fetch.data, insn, insn_len);
  3590. switch (mode) {
  3591. case X86EMUL_MODE_REAL:
  3592. case X86EMUL_MODE_VM86:
  3593. case X86EMUL_MODE_PROT16:
  3594. def_op_bytes = def_ad_bytes = 2;
  3595. break;
  3596. case X86EMUL_MODE_PROT32:
  3597. def_op_bytes = def_ad_bytes = 4;
  3598. break;
  3599. #ifdef CONFIG_X86_64
  3600. case X86EMUL_MODE_PROT64:
  3601. def_op_bytes = 4;
  3602. def_ad_bytes = 8;
  3603. break;
  3604. #endif
  3605. default:
  3606. return EMULATION_FAILED;
  3607. }
  3608. ctxt->op_bytes = def_op_bytes;
  3609. ctxt->ad_bytes = def_ad_bytes;
  3610. /* Legacy prefixes. */
  3611. for (;;) {
  3612. switch (ctxt->b = insn_fetch(u8, ctxt)) {
  3613. case 0x66: /* operand-size override */
  3614. op_prefix = true;
  3615. /* switch between 2/4 bytes */
  3616. ctxt->op_bytes = def_op_bytes ^ 6;
  3617. break;
  3618. case 0x67: /* address-size override */
  3619. if (mode == X86EMUL_MODE_PROT64)
  3620. /* switch between 4/8 bytes */
  3621. ctxt->ad_bytes = def_ad_bytes ^ 12;
  3622. else
  3623. /* switch between 2/4 bytes */
  3624. ctxt->ad_bytes = def_ad_bytes ^ 6;
  3625. break;
  3626. case 0x26: /* ES override */
  3627. case 0x2e: /* CS override */
  3628. case 0x36: /* SS override */
  3629. case 0x3e: /* DS override */
  3630. set_seg_override(ctxt, (ctxt->b >> 3) & 3);
  3631. break;
  3632. case 0x64: /* FS override */
  3633. case 0x65: /* GS override */
  3634. set_seg_override(ctxt, ctxt->b & 7);
  3635. break;
  3636. case 0x40 ... 0x4f: /* REX */
  3637. if (mode != X86EMUL_MODE_PROT64)
  3638. goto done_prefixes;
  3639. ctxt->rex_prefix = ctxt->b;
  3640. continue;
  3641. case 0xf0: /* LOCK */
  3642. ctxt->lock_prefix = 1;
  3643. break;
  3644. case 0xf2: /* REPNE/REPNZ */
  3645. case 0xf3: /* REP/REPE/REPZ */
  3646. ctxt->rep_prefix = ctxt->b;
  3647. break;
  3648. default:
  3649. goto done_prefixes;
  3650. }
  3651. /* Any legacy prefix after a REX prefix nullifies its effect. */
  3652. ctxt->rex_prefix = 0;
  3653. }
  3654. done_prefixes:
  3655. /* REX prefix. */
  3656. if (ctxt->rex_prefix & 8)
  3657. ctxt->op_bytes = 8; /* REX.W */
  3658. /* Opcode byte(s). */
  3659. opcode = opcode_table[ctxt->b];
  3660. /* Two-byte opcode? */
  3661. if (ctxt->b == 0x0f) {
  3662. ctxt->twobyte = 1;
  3663. ctxt->b = insn_fetch(u8, ctxt);
  3664. opcode = twobyte_table[ctxt->b];
  3665. }
  3666. ctxt->d = opcode.flags;
  3667. if (ctxt->d & ModRM)
  3668. ctxt->modrm = insn_fetch(u8, ctxt);
  3669. while (ctxt->d & GroupMask) {
  3670. switch (ctxt->d & GroupMask) {
  3671. case Group:
  3672. goffset = (ctxt->modrm >> 3) & 7;
  3673. opcode = opcode.u.group[goffset];
  3674. break;
  3675. case GroupDual:
  3676. goffset = (ctxt->modrm >> 3) & 7;
  3677. if ((ctxt->modrm >> 6) == 3)
  3678. opcode = opcode.u.gdual->mod3[goffset];
  3679. else
  3680. opcode = opcode.u.gdual->mod012[goffset];
  3681. break;
  3682. case RMExt:
  3683. goffset = ctxt->modrm & 7;
  3684. opcode = opcode.u.group[goffset];
  3685. break;
  3686. case Prefix:
  3687. if (ctxt->rep_prefix && op_prefix)
  3688. return EMULATION_FAILED;
  3689. simd_prefix = op_prefix ? 0x66 : ctxt->rep_prefix;
  3690. switch (simd_prefix) {
  3691. case 0x00: opcode = opcode.u.gprefix->pfx_no; break;
  3692. case 0x66: opcode = opcode.u.gprefix->pfx_66; break;
  3693. case 0xf2: opcode = opcode.u.gprefix->pfx_f2; break;
  3694. case 0xf3: opcode = opcode.u.gprefix->pfx_f3; break;
  3695. }
  3696. break;
  3697. default:
  3698. return EMULATION_FAILED;
  3699. }
  3700. ctxt->d &= ~(u64)GroupMask;
  3701. ctxt->d |= opcode.flags;
  3702. }
  3703. ctxt->execute = opcode.u.execute;
  3704. ctxt->check_perm = opcode.check_perm;
  3705. ctxt->intercept = opcode.intercept;
  3706. /* Unrecognised? */
  3707. if (ctxt->d == 0 || (ctxt->d & Undefined))
  3708. return EMULATION_FAILED;
  3709. if (!(ctxt->d & VendorSpecific) && ctxt->only_vendor_specific_insn)
  3710. return EMULATION_FAILED;
  3711. if (mode == X86EMUL_MODE_PROT64 && (ctxt->d & Stack))
  3712. ctxt->op_bytes = 8;
  3713. if (ctxt->d & Op3264) {
  3714. if (mode == X86EMUL_MODE_PROT64)
  3715. ctxt->op_bytes = 8;
  3716. else
  3717. ctxt->op_bytes = 4;
  3718. }
  3719. if (ctxt->d & Sse)
  3720. ctxt->op_bytes = 16;
  3721. else if (ctxt->d & Mmx)
  3722. ctxt->op_bytes = 8;
  3723. /* ModRM and SIB bytes. */
  3724. if (ctxt->d & ModRM) {
  3725. rc = decode_modrm(ctxt, &ctxt->memop);
  3726. if (!ctxt->has_seg_override)
  3727. set_seg_override(ctxt, ctxt->modrm_seg);
  3728. } else if (ctxt->d & MemAbs)
  3729. rc = decode_abs(ctxt, &ctxt->memop);
  3730. if (rc != X86EMUL_CONTINUE)
  3731. goto done;
  3732. if (!ctxt->has_seg_override)
  3733. set_seg_override(ctxt, VCPU_SREG_DS);
  3734. ctxt->memop.addr.mem.seg = seg_override(ctxt);
  3735. if (ctxt->memop.type == OP_MEM && ctxt->ad_bytes != 8)
  3736. ctxt->memop.addr.mem.ea = (u32)ctxt->memop.addr.mem.ea;
  3737. /*
  3738. * Decode and fetch the source operand: register, memory
  3739. * or immediate.
  3740. */
  3741. rc = decode_operand(ctxt, &ctxt->src, (ctxt->d >> SrcShift) & OpMask);
  3742. if (rc != X86EMUL_CONTINUE)
  3743. goto done;
  3744. /*
  3745. * Decode and fetch the second source operand: register, memory
  3746. * or immediate.
  3747. */
  3748. rc = decode_operand(ctxt, &ctxt->src2, (ctxt->d >> Src2Shift) & OpMask);
  3749. if (rc != X86EMUL_CONTINUE)
  3750. goto done;
  3751. /* Decode and fetch the destination operand: register or memory. */
  3752. rc = decode_operand(ctxt, &ctxt->dst, (ctxt->d >> DstShift) & OpMask);
  3753. done:
  3754. if (ctxt->memopp && ctxt->memopp->type == OP_MEM && ctxt->rip_relative)
  3755. ctxt->memopp->addr.mem.ea += ctxt->_eip;
  3756. return (rc != X86EMUL_CONTINUE) ? EMULATION_FAILED : EMULATION_OK;
  3757. }
  3758. bool x86_page_table_writing_insn(struct x86_emulate_ctxt *ctxt)
  3759. {
  3760. return ctxt->d & PageTable;
  3761. }
  3762. static bool string_insn_completed(struct x86_emulate_ctxt *ctxt)
  3763. {
  3764. /* The second termination condition only applies for REPE
  3765. * and REPNE. Test if the repeat string operation prefix is
  3766. * REPE/REPZ or REPNE/REPNZ and if it's the case it tests the
  3767. * corresponding termination condition according to:
  3768. * - if REPE/REPZ and ZF = 0 then done
  3769. * - if REPNE/REPNZ and ZF = 1 then done
  3770. */
  3771. if (((ctxt->b == 0xa6) || (ctxt->b == 0xa7) ||
  3772. (ctxt->b == 0xae) || (ctxt->b == 0xaf))
  3773. && (((ctxt->rep_prefix == REPE_PREFIX) &&
  3774. ((ctxt->eflags & EFLG_ZF) == 0))
  3775. || ((ctxt->rep_prefix == REPNE_PREFIX) &&
  3776. ((ctxt->eflags & EFLG_ZF) == EFLG_ZF))))
  3777. return true;
  3778. return false;
  3779. }
  3780. static int flush_pending_x87_faults(struct x86_emulate_ctxt *ctxt)
  3781. {
  3782. bool fault = false;
  3783. ctxt->ops->get_fpu(ctxt);
  3784. asm volatile("1: fwait \n\t"
  3785. "2: \n\t"
  3786. ".pushsection .fixup,\"ax\" \n\t"
  3787. "3: \n\t"
  3788. "movb $1, %[fault] \n\t"
  3789. "jmp 2b \n\t"
  3790. ".popsection \n\t"
  3791. _ASM_EXTABLE(1b, 3b)
  3792. : [fault]"+qm"(fault));
  3793. ctxt->ops->put_fpu(ctxt);
  3794. if (unlikely(fault))
  3795. return emulate_exception(ctxt, MF_VECTOR, 0, false);
  3796. return X86EMUL_CONTINUE;
  3797. }
  3798. static void fetch_possible_mmx_operand(struct x86_emulate_ctxt *ctxt,
  3799. struct operand *op)
  3800. {
  3801. if (op->type == OP_MM)
  3802. read_mmx_reg(ctxt, &op->mm_val, op->addr.mm);
  3803. }
  3804. int x86_emulate_insn(struct x86_emulate_ctxt *ctxt)
  3805. {
  3806. const struct x86_emulate_ops *ops = ctxt->ops;
  3807. int rc = X86EMUL_CONTINUE;
  3808. int saved_dst_type = ctxt->dst.type;
  3809. ctxt->mem_read.pos = 0;
  3810. if (ctxt->mode == X86EMUL_MODE_PROT64 && (ctxt->d & No64)) {
  3811. rc = emulate_ud(ctxt);
  3812. goto done;
  3813. }
  3814. /* LOCK prefix is allowed only with some instructions */
  3815. if (ctxt->lock_prefix && (!(ctxt->d & Lock) || ctxt->dst.type != OP_MEM)) {
  3816. rc = emulate_ud(ctxt);
  3817. goto done;
  3818. }
  3819. if ((ctxt->d & SrcMask) == SrcMemFAddr && ctxt->src.type != OP_MEM) {
  3820. rc = emulate_ud(ctxt);
  3821. goto done;
  3822. }
  3823. if (((ctxt->d & (Sse|Mmx)) && ((ops->get_cr(ctxt, 0) & X86_CR0_EM)))
  3824. || ((ctxt->d & Sse) && !(ops->get_cr(ctxt, 4) & X86_CR4_OSFXSR))) {
  3825. rc = emulate_ud(ctxt);
  3826. goto done;
  3827. }
  3828. if ((ctxt->d & (Sse|Mmx)) && (ops->get_cr(ctxt, 0) & X86_CR0_TS)) {
  3829. rc = emulate_nm(ctxt);
  3830. goto done;
  3831. }
  3832. if (ctxt->d & Mmx) {
  3833. rc = flush_pending_x87_faults(ctxt);
  3834. if (rc != X86EMUL_CONTINUE)
  3835. goto done;
  3836. /*
  3837. * Now that we know the fpu is exception safe, we can fetch
  3838. * operands from it.
  3839. */
  3840. fetch_possible_mmx_operand(ctxt, &ctxt->src);
  3841. fetch_possible_mmx_operand(ctxt, &ctxt->src2);
  3842. if (!(ctxt->d & Mov))
  3843. fetch_possible_mmx_operand(ctxt, &ctxt->dst);
  3844. }
  3845. if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
  3846. rc = emulator_check_intercept(ctxt, ctxt->intercept,
  3847. X86_ICPT_PRE_EXCEPT);
  3848. if (rc != X86EMUL_CONTINUE)
  3849. goto done;
  3850. }
  3851. /* Privileged instruction can be executed only in CPL=0 */
  3852. if ((ctxt->d & Priv) && ops->cpl(ctxt)) {
  3853. rc = emulate_gp(ctxt, 0);
  3854. goto done;
  3855. }
  3856. /* Instruction can only be executed in protected mode */
  3857. if ((ctxt->d & Prot) && ctxt->mode < X86EMUL_MODE_PROT16) {
  3858. rc = emulate_ud(ctxt);
  3859. goto done;
  3860. }
  3861. /* Do instruction specific permission checks */
  3862. if (ctxt->check_perm) {
  3863. rc = ctxt->check_perm(ctxt);
  3864. if (rc != X86EMUL_CONTINUE)
  3865. goto done;
  3866. }
  3867. if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
  3868. rc = emulator_check_intercept(ctxt, ctxt->intercept,
  3869. X86_ICPT_POST_EXCEPT);
  3870. if (rc != X86EMUL_CONTINUE)
  3871. goto done;
  3872. }
  3873. if (ctxt->rep_prefix && (ctxt->d & String)) {
  3874. /* All REP prefixes have the same first termination condition */
  3875. if (address_mask(ctxt, reg_read(ctxt, VCPU_REGS_RCX)) == 0) {
  3876. ctxt->eip = ctxt->_eip;
  3877. goto done;
  3878. }
  3879. }
  3880. if ((ctxt->src.type == OP_MEM) && !(ctxt->d & NoAccess)) {
  3881. rc = segmented_read(ctxt, ctxt->src.addr.mem,
  3882. ctxt->src.valptr, ctxt->src.bytes);
  3883. if (rc != X86EMUL_CONTINUE)
  3884. goto done;
  3885. ctxt->src.orig_val64 = ctxt->src.val64;
  3886. }
  3887. if (ctxt->src2.type == OP_MEM) {
  3888. rc = segmented_read(ctxt, ctxt->src2.addr.mem,
  3889. &ctxt->src2.val, ctxt->src2.bytes);
  3890. if (rc != X86EMUL_CONTINUE)
  3891. goto done;
  3892. }
  3893. if ((ctxt->d & DstMask) == ImplicitOps)
  3894. goto special_insn;
  3895. if ((ctxt->dst.type == OP_MEM) && !(ctxt->d & Mov)) {
  3896. /* optimisation - avoid slow emulated read if Mov */
  3897. rc = segmented_read(ctxt, ctxt->dst.addr.mem,
  3898. &ctxt->dst.val, ctxt->dst.bytes);
  3899. if (rc != X86EMUL_CONTINUE)
  3900. goto done;
  3901. }
  3902. ctxt->dst.orig_val = ctxt->dst.val;
  3903. special_insn:
  3904. if (unlikely(ctxt->guest_mode) && ctxt->intercept) {
  3905. rc = emulator_check_intercept(ctxt, ctxt->intercept,
  3906. X86_ICPT_POST_MEMACCESS);
  3907. if (rc != X86EMUL_CONTINUE)
  3908. goto done;
  3909. }
  3910. if (ctxt->execute) {
  3911. rc = ctxt->execute(ctxt);
  3912. if (rc != X86EMUL_CONTINUE)
  3913. goto done;
  3914. goto writeback;
  3915. }
  3916. if (ctxt->twobyte)
  3917. goto twobyte_insn;
  3918. switch (ctxt->b) {
  3919. case 0x40 ... 0x47: /* inc r16/r32 */
  3920. emulate_1op(ctxt, "inc");
  3921. break;
  3922. case 0x48 ... 0x4f: /* dec r16/r32 */
  3923. emulate_1op(ctxt, "dec");
  3924. break;
  3925. case 0x63: /* movsxd */
  3926. if (ctxt->mode != X86EMUL_MODE_PROT64)
  3927. goto cannot_emulate;
  3928. ctxt->dst.val = (s32) ctxt->src.val;
  3929. break;
  3930. case 0x70 ... 0x7f: /* jcc (short) */
  3931. if (test_cc(ctxt->b, ctxt->eflags))
  3932. jmp_rel(ctxt, ctxt->src.val);
  3933. break;
  3934. case 0x8d: /* lea r16/r32, m */
  3935. ctxt->dst.val = ctxt->src.addr.mem.ea;
  3936. break;
  3937. case 0x90 ... 0x97: /* nop / xchg reg, rax */
  3938. if (ctxt->dst.addr.reg == reg_rmw(ctxt, VCPU_REGS_RAX))
  3939. break;
  3940. rc = em_xchg(ctxt);
  3941. break;
  3942. case 0x98: /* cbw/cwde/cdqe */
  3943. switch (ctxt->op_bytes) {
  3944. case 2: ctxt->dst.val = (s8)ctxt->dst.val; break;
  3945. case 4: ctxt->dst.val = (s16)ctxt->dst.val; break;
  3946. case 8: ctxt->dst.val = (s32)ctxt->dst.val; break;
  3947. }
  3948. break;
  3949. case 0xc0 ... 0xc1:
  3950. rc = em_grp2(ctxt);
  3951. break;
  3952. case 0xcc: /* int3 */
  3953. rc = emulate_int(ctxt, 3);
  3954. break;
  3955. case 0xcd: /* int n */
  3956. rc = emulate_int(ctxt, ctxt->src.val);
  3957. break;
  3958. case 0xce: /* into */
  3959. if (ctxt->eflags & EFLG_OF)
  3960. rc = emulate_int(ctxt, 4);
  3961. break;
  3962. case 0xd0 ... 0xd1: /* Grp2 */
  3963. rc = em_grp2(ctxt);
  3964. break;
  3965. case 0xd2 ... 0xd3: /* Grp2 */
  3966. ctxt->src.val = reg_read(ctxt, VCPU_REGS_RCX);
  3967. rc = em_grp2(ctxt);
  3968. break;
  3969. case 0xe9: /* jmp rel */
  3970. case 0xeb: /* jmp rel short */
  3971. jmp_rel(ctxt, ctxt->src.val);
  3972. ctxt->dst.type = OP_NONE; /* Disable writeback. */
  3973. break;
  3974. case 0xf4: /* hlt */
  3975. ctxt->ops->halt(ctxt);
  3976. break;
  3977. case 0xf5: /* cmc */
  3978. /* complement carry flag from eflags reg */
  3979. ctxt->eflags ^= EFLG_CF;
  3980. break;
  3981. case 0xf8: /* clc */
  3982. ctxt->eflags &= ~EFLG_CF;
  3983. break;
  3984. case 0xf9: /* stc */
  3985. ctxt->eflags |= EFLG_CF;
  3986. break;
  3987. case 0xfc: /* cld */
  3988. ctxt->eflags &= ~EFLG_DF;
  3989. break;
  3990. case 0xfd: /* std */
  3991. ctxt->eflags |= EFLG_DF;
  3992. break;
  3993. default:
  3994. goto cannot_emulate;
  3995. }
  3996. if (rc != X86EMUL_CONTINUE)
  3997. goto done;
  3998. writeback:
  3999. rc = writeback(ctxt);
  4000. if (rc != X86EMUL_CONTINUE)
  4001. goto done;
  4002. /*
  4003. * restore dst type in case the decoding will be reused
  4004. * (happens for string instruction )
  4005. */
  4006. ctxt->dst.type = saved_dst_type;
  4007. if ((ctxt->d & SrcMask) == SrcSI)
  4008. string_addr_inc(ctxt, VCPU_REGS_RSI, &ctxt->src);
  4009. if ((ctxt->d & DstMask) == DstDI)
  4010. string_addr_inc(ctxt, VCPU_REGS_RDI, &ctxt->dst);
  4011. if (ctxt->rep_prefix && (ctxt->d & String)) {
  4012. unsigned int count;
  4013. struct read_cache *r = &ctxt->io_read;
  4014. if ((ctxt->d & SrcMask) == SrcSI)
  4015. count = ctxt->src.count;
  4016. else
  4017. count = ctxt->dst.count;
  4018. register_address_increment(ctxt, reg_rmw(ctxt, VCPU_REGS_RCX),
  4019. -count);
  4020. if (!string_insn_completed(ctxt)) {
  4021. /*
  4022. * Re-enter guest when pio read ahead buffer is empty
  4023. * or, if it is not used, after each 1024 iteration.
  4024. */
  4025. if ((r->end != 0 || reg_read(ctxt, VCPU_REGS_RCX) & 0x3ff) &&
  4026. (r->end == 0 || r->end != r->pos)) {
  4027. /*
  4028. * Reset read cache. Usually happens before
  4029. * decode, but since instruction is restarted
  4030. * we have to do it here.
  4031. */
  4032. ctxt->mem_read.end = 0;
  4033. writeback_registers(ctxt);
  4034. return EMULATION_RESTART;
  4035. }
  4036. goto done; /* skip rip writeback */
  4037. }
  4038. }
  4039. ctxt->eip = ctxt->_eip;
  4040. done:
  4041. if (rc == X86EMUL_PROPAGATE_FAULT)
  4042. ctxt->have_exception = true;
  4043. if (rc == X86EMUL_INTERCEPTED)
  4044. return EMULATION_INTERCEPTED;
  4045. if (rc == X86EMUL_CONTINUE)
  4046. writeback_registers(ctxt);
  4047. return (rc == X86EMUL_UNHANDLEABLE) ? EMULATION_FAILED : EMULATION_OK;
  4048. twobyte_insn:
  4049. switch (ctxt->b) {
  4050. case 0x09: /* wbinvd */
  4051. (ctxt->ops->wbinvd)(ctxt);
  4052. break;
  4053. case 0x08: /* invd */
  4054. case 0x0d: /* GrpP (prefetch) */
  4055. case 0x18: /* Grp16 (prefetch/nop) */
  4056. break;
  4057. case 0x20: /* mov cr, reg */
  4058. ctxt->dst.val = ops->get_cr(ctxt, ctxt->modrm_reg);
  4059. break;
  4060. case 0x21: /* mov from dr to reg */
  4061. ops->get_dr(ctxt, ctxt->modrm_reg, &ctxt->dst.val);
  4062. break;
  4063. case 0x40 ... 0x4f: /* cmov */
  4064. ctxt->dst.val = ctxt->dst.orig_val = ctxt->src.val;
  4065. if (!test_cc(ctxt->b, ctxt->eflags))
  4066. ctxt->dst.type = OP_NONE; /* no writeback */
  4067. break;
  4068. case 0x80 ... 0x8f: /* jnz rel, etc*/
  4069. if (test_cc(ctxt->b, ctxt->eflags))
  4070. jmp_rel(ctxt, ctxt->src.val);
  4071. break;
  4072. case 0x90 ... 0x9f: /* setcc r/m8 */
  4073. ctxt->dst.val = test_cc(ctxt->b, ctxt->eflags);
  4074. break;
  4075. case 0xa4: /* shld imm8, r, r/m */
  4076. case 0xa5: /* shld cl, r, r/m */
  4077. emulate_2op_cl(ctxt, "shld");
  4078. break;
  4079. case 0xac: /* shrd imm8, r, r/m */
  4080. case 0xad: /* shrd cl, r, r/m */
  4081. emulate_2op_cl(ctxt, "shrd");
  4082. break;
  4083. case 0xae: /* clflush */
  4084. break;
  4085. case 0xb6 ... 0xb7: /* movzx */
  4086. ctxt->dst.bytes = ctxt->op_bytes;
  4087. ctxt->dst.val = (ctxt->src.bytes == 1) ? (u8) ctxt->src.val
  4088. : (u16) ctxt->src.val;
  4089. break;
  4090. case 0xbe ... 0xbf: /* movsx */
  4091. ctxt->dst.bytes = ctxt->op_bytes;
  4092. ctxt->dst.val = (ctxt->src.bytes == 1) ? (s8) ctxt->src.val :
  4093. (s16) ctxt->src.val;
  4094. break;
  4095. case 0xc0 ... 0xc1: /* xadd */
  4096. emulate_2op_SrcV(ctxt, "add");
  4097. /* Write back the register source. */
  4098. ctxt->src.val = ctxt->dst.orig_val;
  4099. write_register_operand(&ctxt->src);
  4100. break;
  4101. case 0xc3: /* movnti */
  4102. ctxt->dst.bytes = ctxt->op_bytes;
  4103. ctxt->dst.val = (ctxt->op_bytes == 4) ? (u32) ctxt->src.val :
  4104. (u64) ctxt->src.val;
  4105. break;
  4106. default:
  4107. goto cannot_emulate;
  4108. }
  4109. if (rc != X86EMUL_CONTINUE)
  4110. goto done;
  4111. goto writeback;
  4112. cannot_emulate:
  4113. return EMULATION_FAILED;
  4114. }
  4115. void emulator_invalidate_register_cache(struct x86_emulate_ctxt *ctxt)
  4116. {
  4117. invalidate_registers(ctxt);
  4118. }
  4119. void emulator_writeback_register_cache(struct x86_emulate_ctxt *ctxt)
  4120. {
  4121. writeback_registers(ctxt);
  4122. }