You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

cpuid_x86.c 44 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935
  1. /*********************************************************************/
  2. /* Copyright 2009, 2010 The University of Texas at Austin. */
  3. /* All rights reserved. */
  4. /* */
  5. /* Redistribution and use in source and binary forms, with or */
  6. /* without modification, are permitted provided that the following */
  7. /* conditions are met: */
  8. /* */
  9. /* 1. Redistributions of source code must retain the above */
  10. /* copyright notice, this list of conditions and the following */
  11. /* disclaimer. */
  12. /* */
  13. /* 2. Redistributions in binary form must reproduce the above */
  14. /* copyright notice, this list of conditions and the following */
  15. /* disclaimer in the documentation and/or other materials */
  16. /* provided with the distribution. */
  17. /* */
  18. /* THIS SOFTWARE IS PROVIDED BY THE UNIVERSITY OF TEXAS AT */
  19. /* AUSTIN ``AS IS'' AND ANY EXPRESS OR IMPLIED WARRANTIES, */
  20. /* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */
  21. /* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */
  22. /* DISCLAIMED. IN NO EVENT SHALL THE UNIVERSITY OF TEXAS AT */
  23. /* AUSTIN OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, */
  24. /* INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES */
  25. /* (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE */
  26. /* GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR */
  27. /* BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF */
  28. /* LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT */
  29. /* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT */
  30. /* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */
  31. /* POSSIBILITY OF SUCH DAMAGE. */
  32. /* */
  33. /* The views and conclusions contained in the software and */
  34. /* documentation are those of the authors and should not be */
  35. /* interpreted as representing official policies, either expressed */
  36. /* or implied, of The University of Texas at Austin. */
  37. /*********************************************************************/
  38. #include <stdio.h>
  39. #include <string.h>
  40. #include "cpuid.h"
  /*
   * C_INLINE: spelling of the "inline" keyword for the current compiler.
   * Plain MSVC (i.e. _MSC_VER without __clang__) gets __inline; every other
   * compiler gets the standard inline keyword.
   */
  #if !defined(_MSC_VER) || defined(__clang__)
  #define C_INLINE inline
  #else
  #define C_INLINE __inline
  #endif
  46. /*
  47. #ifdef NO_AVX
  48. #define CPUTYPE_HASWELL CPUTYPE_NEHALEM
  49. #define CORE_HASWELL CORE_NEHALEM
  50. #define CPUTYPE_SANDYBRIDGE CPUTYPE_NEHALEM
  51. #define CORE_SANDYBRIDGE CORE_NEHALEM
  52. #define CPUTYPE_BULLDOZER CPUTYPE_BARCELONA
  53. #define CORE_BULLDOZER CORE_BARCELONA
  54. #define CPUTYPE_PILEDRIVER CPUTYPE_BARCELONA
  55. #define CORE_PILEDRIVER CORE_BARCELONA
  56. #endif
  57. */
  58. #if defined(_MSC_VER) && !defined(__clang__)
  /*
   * Execute CPUID leaf `op` through the MSVC __cpuid intrinsic and hand the
   * four result registers back through the out-pointers.
   *
   * op  - CPUID leaf number.
   * eax, ebx, ecx, edx - receive the corresponding register values.
   */
  void cpuid(int op, int *eax, int *ebx, int *ecx, int *edx)
  {
    /* Same initial contents as "= {-1}": first slot -1, the rest zero. */
    int regs[4] = { -1, 0, 0, 0 };

    __cpuid(regs, op);

    *eax = regs[0];
    *ebx = regs[1];
    *ecx = regs[2];
    *edx = regs[3];
  }
  68. #else
  69. #ifndef CPUIDEMU
  70. #if defined(__APPLE__) && defined(__i386__)
  71. void cpuid(int op, int *eax, int *ebx, int *ecx, int *edx);
  72. #else
  73. static C_INLINE void cpuid(int op, int *eax, int *ebx, int *ecx, int *edx){
  74. #if defined(__i386__) && defined(__PIC__)
  75. __asm__ __volatile__
  76. ("mov %%ebx, %%edi;"
  77. "cpuid;"
  78. "xchgl %%ebx, %%edi;"
  79. : "=a" (*eax), "=D" (*ebx), "=c" (*ecx), "=d" (*edx) : "a" (op) : "cc");
  80. #else
  81. __asm__ __volatile__
  82. ("cpuid": "=a" (*eax), "=b" (*ebx), "=c" (*ecx), "=d" (*edx) : "a" (op) : "cc");
  83. #endif
  84. }
  85. #endif
  86. #else
  87. typedef struct {
  88. unsigned int id, a, b, c, d;
  89. } idlist_t;
  90. typedef struct {
  91. char *vendor;
  92. char *name;
  93. int start, stop;
  94. } vendor_t;
  95. extern idlist_t idlist[];
  96. extern vendor_t vendor[];
  97. static int cv = VENDOR;
  98. void cpuid(unsigned int op, unsigned int *eax, unsigned int *ebx, unsigned int *ecx, unsigned int *edx){
  99. static int current = 0;
  100. int start = vendor[cv].start;
  101. int stop = vendor[cv].stop;
  102. int count = stop - start;
  103. if ((current < start) || (current > stop)) current = start;
  104. while ((count > 0) && (idlist[current].id != op)) {
  105. current ++;
  106. if (current > stop) current = start;
  107. count --;
  108. }
  109. *eax = idlist[current].a;
  110. *ebx = idlist[current].b;
  111. *ecx = idlist[current].c;
  112. *edx = idlist[current].d;
  113. }
  114. #endif
  115. #endif // _MSC_VER
  116. static C_INLINE int have_cpuid(void){
  117. int eax, ebx, ecx, edx;
  118. cpuid(0, &eax, &ebx, &ecx, &edx);
  119. return eax;
  120. }
  121. static C_INLINE int have_excpuid(void){
  122. int eax, ebx, ecx, edx;
  123. cpuid(0x80000000, &eax, &ebx, &ecx, &edx);
  124. return eax & 0xffff;
  125. }
  126. #ifndef NO_AVX
  127. static C_INLINE void xgetbv(int op, int * eax, int * edx){
  128. //Use binary code for xgetbv
  129. #if defined(_MSC_VER) && !defined(__clang__)
  130. *eax = __xgetbv(op);
  131. #else
  132. __asm__ __volatile__
  133. (".byte 0x0f, 0x01, 0xd0": "=a" (*eax), "=d" (*edx) : "c" (op) : "cc");
  134. #endif
  135. }
  136. #endif
  /*
   * Report whether AVX can be used.
   *
   * Returns 1 when CPUID leaf 1 has ECX bits 26, 27 and 28 all set and
   * XGETBV(0) reports bits 1 and 2 set in EAX; returns 0 otherwise.
   * Always returns 0 when the file is built with NO_AVX.
   */
  int support_avx(){
  #ifdef NO_AVX
    return 0;
  #else
    int eax, ebx, ecx, edx;
    const int cpu_bits = (1 << 26) | (1 << 27) | (1 << 28);

    cpuid(1, &eax, &ebx, &ecx, &edx);
    if ((ecx & cpu_bits) != cpu_bits) return 0;

    /* XGETBV is only issued once the CPUID bits above are all present. */
    xgetbv(0, &eax, &edx);
    return ((eax & 6) == 6) ? 1 : 0;   /* 1: OS support AVX */
  #endif
  }
  153. int get_vendor(void){
  154. int eax, ebx, ecx, edx;
  155. char vendor[13];
  156. cpuid(0, &eax, &ebx, &ecx, &edx);
  157. *(int *)(&vendor[0]) = ebx;
  158. *(int *)(&vendor[4]) = edx;
  159. *(int *)(&vendor[8]) = ecx;
  160. vendor[12] = (char)0;
  161. if (!strcmp(vendor, "GenuineIntel")) return VENDOR_INTEL;
  162. if (!strcmp(vendor, " UMC UMC UMC")) return VENDOR_UMC;
  163. if (!strcmp(vendor, "AuthenticAMD")) return VENDOR_AMD;
  164. if (!strcmp(vendor, "CyrixInstead")) return VENDOR_CYRIX;
  165. if (!strcmp(vendor, "NexGenDriven")) return VENDOR_NEXGEN;
  166. if (!strcmp(vendor, "CentaurHauls")) return VENDOR_CENTAUR;
  167. if (!strcmp(vendor, "RiseRiseRise")) return VENDOR_RISE;
  168. if (!strcmp(vendor, " SiS SiS SiS")) return VENDOR_SIS;
  169. if (!strcmp(vendor, "GenuineTMx86")) return VENDOR_TRANSMETA;
  170. if (!strcmp(vendor, "Geode by NSC")) return VENDOR_NSC;
  171. if ((eax == 0) || ((eax & 0x500) != 0)) return VENDOR_INTEL;
  172. return VENDOR_UNKNOWN;
  173. }
  174. int get_cputype(int gettype){
  175. int eax, ebx, ecx, edx;
  176. int extend_family, family;
  177. int extend_model, model;
  178. int type, stepping;
  179. int feature = 0;
  180. cpuid(1, &eax, &ebx, &ecx, &edx);
  181. switch (gettype) {
  182. case GET_EXFAMILY :
  183. return BITMASK(eax, 20, 0xff);
  184. case GET_EXMODEL :
  185. return BITMASK(eax, 16, 0x0f);
  186. case GET_TYPE :
  187. return BITMASK(eax, 12, 0x03);
  188. case GET_FAMILY :
  189. return BITMASK(eax, 8, 0x0f);
  190. case GET_MODEL :
  191. return BITMASK(eax, 4, 0x0f);
  192. case GET_APICID :
  193. return BITMASK(ebx, 24, 0x0f);
  194. case GET_LCOUNT :
  195. return BITMASK(ebx, 16, 0x0f);
  196. case GET_CHUNKS :
  197. return BITMASK(ebx, 8, 0x0f);
  198. case GET_STEPPING :
  199. return BITMASK(eax, 0, 0x0f);
  200. case GET_BLANDID :
  201. return BITMASK(ebx, 0, 0xff);
  202. case GET_NUMSHARE :
  203. if (have_cpuid() < 4) return 0;
  204. cpuid(4, &eax, &ebx, &ecx, &edx);
  205. return BITMASK(eax, 14, 0xfff);
  206. case GET_NUMCORES :
  207. if (have_cpuid() < 4) return 0;
  208. cpuid(4, &eax, &ebx, &ecx, &edx);
  209. return BITMASK(eax, 26, 0x3f);
  210. case GET_FEATURE :
  211. if ((edx & (1 << 3)) != 0) feature |= HAVE_PSE;
  212. if ((edx & (1 << 15)) != 0) feature |= HAVE_CMOV;
  213. if ((edx & (1 << 19)) != 0) feature |= HAVE_CFLUSH;
  214. if ((edx & (1 << 23)) != 0) feature |= HAVE_MMX;
  215. if ((edx & (1 << 25)) != 0) feature |= HAVE_SSE;
  216. if ((edx & (1 << 26)) != 0) feature |= HAVE_SSE2;
  217. if ((edx & (1 << 27)) != 0) {
  218. if (BITMASK(ebx, 16, 0x0f) > 0) feature |= HAVE_HIT;
  219. }
  220. if ((ecx & (1 << 0)) != 0) feature |= HAVE_SSE3;
  221. if ((ecx & (1 << 9)) != 0) feature |= HAVE_SSSE3;
  222. if ((ecx & (1 << 19)) != 0) feature |= HAVE_SSE4_1;
  223. if ((ecx & (1 << 20)) != 0) feature |= HAVE_SSE4_2;
  224. #ifndef NO_AVX
  225. if (support_avx()) feature |= HAVE_AVX;
  226. if ((ecx & (1 << 12)) != 0) feature |= HAVE_FMA3;
  227. #endif
  228. if (have_excpuid() >= 0x01) {
  229. cpuid(0x80000001, &eax, &ebx, &ecx, &edx);
  230. if ((ecx & (1 << 6)) != 0) feature |= HAVE_SSE4A;
  231. if ((ecx & (1 << 7)) != 0) feature |= HAVE_MISALIGNSSE;
  232. #ifndef NO_AVX
  233. if ((ecx & (1 << 16)) != 0) feature |= HAVE_FMA4;
  234. #endif
  235. if ((edx & (1 << 30)) != 0) feature |= HAVE_3DNOWEX;
  236. if ((edx & (1 << 31)) != 0) feature |= HAVE_3DNOW;
  237. }
  238. if (have_excpuid() >= 0x1a) {
  239. cpuid(0x8000001a, &eax, &ebx, &ecx, &edx);
  240. if ((eax & (1 << 0)) != 0) feature |= HAVE_128BITFPU;
  241. if ((eax & (1 << 1)) != 0) feature |= HAVE_FASTMOVU;
  242. }
  243. }
  244. return feature;
  245. }
  246. int get_cacheinfo(int type, cache_info_t *cacheinfo){
  247. int eax, ebx, ecx, edx, cpuid_level;
  248. int info[15];
  249. int i;
  250. cache_info_t LC1, LD1, L2, L3,
  251. ITB, DTB, LITB, LDTB,
  252. L2ITB, L2DTB, L2LITB, L2LDTB;
  253. LC1.size = 0; LC1.associative = 0; LC1.linesize = 0; LC1.shared = 0;
  254. LD1.size = 0; LD1.associative = 0; LD1.linesize = 0; LD1.shared = 0;
  255. L2.size = 0; L2.associative = 0; L2.linesize = 0; L2.shared = 0;
  256. L3.size = 0; L3.associative = 0; L3.linesize = 0; L3.shared = 0;
  257. ITB.size = 0; ITB.associative = 0; ITB.linesize = 0; ITB.shared = 0;
  258. DTB.size = 0; DTB.associative = 0; DTB.linesize = 0; DTB.shared = 0;
  259. LITB.size = 0; LITB.associative = 0; LITB.linesize = 0; LITB.shared = 0;
  260. LDTB.size = 0; LDTB.associative = 0; LDTB.linesize = 0; LDTB.shared = 0;
  261. L2ITB.size = 0; L2ITB.associative = 0; L2ITB.linesize = 0; L2ITB.shared = 0;
  262. L2DTB.size = 0; L2DTB.associative = 0; L2DTB.linesize = 0; L2DTB.shared = 0;
  263. L2LITB.size = 0; L2LITB.associative = 0; L2LITB.linesize = 0; L2LITB.shared = 0;
  264. L2LDTB.size = 0; L2LDTB.associative = 0; L2LDTB.linesize = 0; L2LDTB.shared = 0;
  265. cpuid(0, &cpuid_level, &ebx, &ecx, &edx);
  266. if (cpuid_level > 1) {
  267. cpuid(2, &eax, &ebx, &ecx, &edx);
  268. info[ 0] = BITMASK(eax, 8, 0xff);
  269. info[ 1] = BITMASK(eax, 16, 0xff);
  270. info[ 2] = BITMASK(eax, 24, 0xff);
  271. info[ 3] = BITMASK(ebx, 0, 0xff);
  272. info[ 4] = BITMASK(ebx, 8, 0xff);
  273. info[ 5] = BITMASK(ebx, 16, 0xff);
  274. info[ 6] = BITMASK(ebx, 24, 0xff);
  275. info[ 7] = BITMASK(ecx, 0, 0xff);
  276. info[ 8] = BITMASK(ecx, 8, 0xff);
  277. info[ 9] = BITMASK(ecx, 16, 0xff);
  278. info[10] = BITMASK(ecx, 24, 0xff);
  279. info[11] = BITMASK(edx, 0, 0xff);
  280. info[12] = BITMASK(edx, 8, 0xff);
  281. info[13] = BITMASK(edx, 16, 0xff);
  282. info[14] = BITMASK(edx, 24, 0xff);
  283. for (i = 0; i < 15; i++){
  284. switch (info[i]){
  285. /* This table is from http://www.sandpile.org/ia32/cpuid.htm */
  286. case 0x01 :
  287. ITB.size = 4;
  288. ITB.associative = 4;
  289. ITB.linesize = 32;
  290. break;
  291. case 0x02 :
  292. LITB.size = 4096;
  293. LITB.associative = 0;
  294. LITB.linesize = 2;
  295. break;
  296. case 0x03 :
  297. DTB.size = 4;
  298. DTB.associative = 4;
  299. DTB.linesize = 64;
  300. break;
  301. case 0x04 :
  302. LDTB.size = 4096;
  303. LDTB.associative = 4;
  304. LDTB.linesize = 8;
  305. break;
  306. case 0x05 :
  307. LDTB.size = 4096;
  308. LDTB.associative = 4;
  309. LDTB.linesize = 32;
  310. break;
  311. case 0x06 :
  312. LC1.size = 8;
  313. LC1.associative = 4;
  314. LC1.linesize = 32;
  315. break;
  316. case 0x08 :
  317. LC1.size = 16;
  318. LC1.associative = 4;
  319. LC1.linesize = 32;
  320. break;
  321. case 0x09 :
  322. LC1.size = 32;
  323. LC1.associative = 4;
  324. LC1.linesize = 64;
  325. break;
  326. case 0x0a :
  327. LD1.size = 8;
  328. LD1.associative = 2;
  329. LD1.linesize = 32;
  330. break;
  331. case 0x0c :
  332. LD1.size = 16;
  333. LD1.associative = 4;
  334. LD1.linesize = 32;
  335. break;
  336. case 0x0d :
  337. LD1.size = 16;
  338. LD1.associative = 4;
  339. LD1.linesize = 64;
  340. break;
  341. case 0x0e :
  342. LD1.size = 24;
  343. LD1.associative = 6;
  344. LD1.linesize = 64;
  345. break;
  346. case 0x10 :
  347. LD1.size = 16;
  348. LD1.associative = 4;
  349. LD1.linesize = 32;
  350. break;
  351. case 0x15 :
  352. LC1.size = 16;
  353. LC1.associative = 4;
  354. LC1.linesize = 32;
  355. break;
  356. case 0x1a :
  357. L2.size = 96;
  358. L2.associative = 6;
  359. L2.linesize = 64;
  360. break;
  361. case 0x21 :
  362. L2.size = 256;
  363. L2.associative = 8;
  364. L2.linesize = 64;
  365. break;
  366. case 0x22 :
  367. L3.size = 512;
  368. L3.associative = 4;
  369. L3.linesize = 64;
  370. break;
  371. case 0x23 :
  372. L3.size = 1024;
  373. L3.associative = 8;
  374. L3.linesize = 64;
  375. break;
  376. case 0x25 :
  377. L3.size = 2048;
  378. L3.associative = 8;
  379. L3.linesize = 64;
  380. break;
  381. case 0x29 :
  382. L3.size = 4096;
  383. L3.associative = 8;
  384. L3.linesize = 64;
  385. break;
  386. case 0x2c :
  387. LD1.size = 32;
  388. LD1.associative = 8;
  389. LD1.linesize = 64;
  390. break;
  391. case 0x30 :
  392. LC1.size = 32;
  393. LC1.associative = 8;
  394. LC1.linesize = 64;
  395. break;
  396. case 0x39 :
  397. L2.size = 128;
  398. L2.associative = 4;
  399. L2.linesize = 64;
  400. break;
  401. case 0x3a :
  402. L2.size = 192;
  403. L2.associative = 6;
  404. L2.linesize = 64;
  405. break;
  406. case 0x3b :
  407. L2.size = 128;
  408. L2.associative = 2;
  409. L2.linesize = 64;
  410. break;
  411. case 0x3c :
  412. L2.size = 256;
  413. L2.associative = 4;
  414. L2.linesize = 64;
  415. break;
  416. case 0x3d :
  417. L2.size = 384;
  418. L2.associative = 6;
  419. L2.linesize = 64;
  420. break;
  421. case 0x3e :
  422. L2.size = 512;
  423. L2.associative = 4;
  424. L2.linesize = 64;
  425. break;
  426. case 0x41 :
  427. L2.size = 128;
  428. L2.associative = 4;
  429. L2.linesize = 32;
  430. break;
  431. case 0x42 :
  432. L2.size = 256;
  433. L2.associative = 4;
  434. L2.linesize = 32;
  435. break;
  436. case 0x43 :
  437. L2.size = 512;
  438. L2.associative = 4;
  439. L2.linesize = 32;
  440. break;
  441. case 0x44 :
  442. L2.size = 1024;
  443. L2.associative = 4;
  444. L2.linesize = 32;
  445. break;
  446. case 0x45 :
  447. L2.size = 2048;
  448. L2.associative = 4;
  449. L2.linesize = 32;
  450. break;
  451. case 0x46 :
  452. L3.size = 4096;
  453. L3.associative = 4;
  454. L3.linesize = 64;
  455. break;
  456. case 0x47 :
  457. L3.size = 8192;
  458. L3.associative = 8;
  459. L3.linesize = 64;
  460. break;
  461. case 0x48 :
  462. L2.size = 3184;
  463. L2.associative = 12;
  464. L2.linesize = 64;
  465. break;
  466. case 0x49 :
  467. if ((get_cputype(GET_FAMILY) == 0x0f) && (get_cputype(GET_MODEL) == 0x06)) {
  468. L3.size = 4096;
  469. L3.associative = 16;
  470. L3.linesize = 64;
  471. } else {
  472. L2.size = 4096;
  473. L2.associative = 16;
  474. L2.linesize = 64;
  475. }
  476. break;
  477. case 0x4a :
  478. L3.size = 6144;
  479. L3.associative = 12;
  480. L3.linesize = 64;
  481. break;
  482. case 0x4b :
  483. L3.size = 8192;
  484. L3.associative = 16;
  485. L3.linesize = 64;
  486. break;
  487. case 0x4c :
  488. L3.size = 12280;
  489. L3.associative = 12;
  490. L3.linesize = 64;
  491. break;
  492. case 0x4d :
  493. L3.size = 16384;
  494. L3.associative = 16;
  495. L3.linesize = 64;
  496. break;
  497. case 0x4e :
  498. L2.size = 6144;
  499. L2.associative = 24;
  500. L2.linesize = 64;
  501. break;
  502. case 0x4f :
  503. ITB.size = 4;
  504. ITB.associative = 0;
  505. ITB.linesize = 32;
  506. break;
  507. case 0x50 :
  508. ITB.size = 4;
  509. ITB.associative = 0;
  510. ITB.linesize = 64;
  511. LITB.size = 4096;
  512. LITB.associative = 0;
  513. LITB.linesize = 64;
  514. LITB.shared = 1;
  515. break;
  516. case 0x51 :
  517. ITB.size = 4;
  518. ITB.associative = 0;
  519. ITB.linesize = 128;
  520. LITB.size = 4096;
  521. LITB.associative = 0;
  522. LITB.linesize = 128;
  523. LITB.shared = 1;
  524. break;
  525. case 0x52 :
  526. ITB.size = 4;
  527. ITB.associative = 0;
  528. ITB.linesize = 256;
  529. LITB.size = 4096;
  530. LITB.associative = 0;
  531. LITB.linesize = 256;
  532. LITB.shared = 1;
  533. break;
  534. case 0x55 :
  535. LITB.size = 4096;
  536. LITB.associative = 0;
  537. LITB.linesize = 7;
  538. LITB.shared = 1;
  539. break;
  540. case 0x56 :
  541. LDTB.size = 4096;
  542. LDTB.associative = 4;
  543. LDTB.linesize = 16;
  544. break;
  545. case 0x57 :
  546. LDTB.size = 4096;
  547. LDTB.associative = 4;
  548. LDTB.linesize = 16;
  549. break;
  550. case 0x5b :
  551. DTB.size = 4;
  552. DTB.associative = 0;
  553. DTB.linesize = 64;
  554. LDTB.size = 4096;
  555. LDTB.associative = 0;
  556. LDTB.linesize = 64;
  557. LDTB.shared = 1;
  558. break;
  559. case 0x5c :
  560. DTB.size = 4;
  561. DTB.associative = 0;
  562. DTB.linesize = 128;
  563. LDTB.size = 4096;
  564. LDTB.associative = 0;
  565. LDTB.linesize = 128;
  566. LDTB.shared = 1;
  567. break;
  568. case 0x5d :
  569. DTB.size = 4;
  570. DTB.associative = 0;
  571. DTB.linesize = 256;
  572. LDTB.size = 4096;
  573. LDTB.associative = 0;
  574. LDTB.linesize = 256;
  575. LDTB.shared = 1;
  576. break;
  577. case 0x60 :
  578. LD1.size = 16;
  579. LD1.associative = 8;
  580. LD1.linesize = 64;
  581. break;
  582. case 0x66 :
  583. LD1.size = 8;
  584. LD1.associative = 4;
  585. LD1.linesize = 64;
  586. break;
  587. case 0x67 :
  588. LD1.size = 16;
  589. LD1.associative = 4;
  590. LD1.linesize = 64;
  591. break;
  592. case 0x68 :
  593. LD1.size = 32;
  594. LD1.associative = 4;
  595. LD1.linesize = 64;
  596. break;
  597. case 0x70 :
  598. LC1.size = 12;
  599. LC1.associative = 8;
  600. break;
  601. case 0x71 :
  602. LC1.size = 16;
  603. LC1.associative = 8;
  604. break;
  605. case 0x72 :
  606. LC1.size = 32;
  607. LC1.associative = 8;
  608. break;
  609. case 0x73 :
  610. LC1.size = 64;
  611. LC1.associative = 8;
  612. break;
  613. case 0x77 :
  614. LC1.size = 16;
  615. LC1.associative = 4;
  616. LC1.linesize = 64;
  617. break;
  618. case 0x78 :
  619. L2.size = 1024;
  620. L2.associative = 4;
  621. L2.linesize = 64;
  622. break;
  623. case 0x79 :
  624. L2.size = 128;
  625. L2.associative = 8;
  626. L2.linesize = 64;
  627. break;
  628. case 0x7a :
  629. L2.size = 256;
  630. L2.associative = 8;
  631. L2.linesize = 64;
  632. break;
  633. case 0x7b :
  634. L2.size = 512;
  635. L2.associative = 8;
  636. L2.linesize = 64;
  637. break;
  638. case 0x7c :
  639. L2.size = 1024;
  640. L2.associative = 8;
  641. L2.linesize = 64;
  642. break;
  643. case 0x7d :
  644. L2.size = 2048;
  645. L2.associative = 8;
  646. L2.linesize = 64;
  647. break;
  648. case 0x7e :
  649. L2.size = 256;
  650. L2.associative = 8;
  651. L2.linesize = 128;
  652. break;
  653. case 0x7f :
  654. L2.size = 512;
  655. L2.associative = 2;
  656. L2.linesize = 64;
  657. break;
  658. case 0x81 :
  659. L2.size = 128;
  660. L2.associative = 8;
  661. L2.linesize = 32;
  662. break;
  663. case 0x82 :
  664. L2.size = 256;
  665. L2.associative = 8;
  666. L2.linesize = 32;
  667. break;
  668. case 0x83 :
  669. L2.size = 512;
  670. L2.associative = 8;
  671. L2.linesize = 32;
  672. break;
  673. case 0x84 :
  674. L2.size = 1024;
  675. L2.associative = 8;
  676. L2.linesize = 32;
  677. break;
  678. case 0x85 :
  679. L2.size = 2048;
  680. L2.associative = 8;
  681. L2.linesize = 32;
  682. break;
  683. case 0x86 :
  684. L2.size = 512;
  685. L2.associative = 4;
  686. L2.linesize = 64;
  687. break;
  688. case 0x87 :
  689. L2.size = 1024;
  690. L2.associative = 8;
  691. L2.linesize = 64;
  692. break;
  693. case 0x88 :
  694. L3.size = 2048;
  695. L3.associative = 4;
  696. L3.linesize = 64;
  697. break;
  698. case 0x89 :
  699. L3.size = 4096;
  700. L3.associative = 4;
  701. L3.linesize = 64;
  702. break;
  703. case 0x8a :
  704. L3.size = 8192;
  705. L3.associative = 4;
  706. L3.linesize = 64;
  707. break;
  708. case 0x8d :
  709. L3.size = 3096;
  710. L3.associative = 12;
  711. L3.linesize = 128;
  712. break;
  713. case 0x90 :
  714. ITB.size = 4;
  715. ITB.associative = 0;
  716. ITB.linesize = 64;
  717. break;
  718. case 0x96 :
  719. DTB.size = 4;
  720. DTB.associative = 0;
  721. DTB.linesize = 32;
  722. break;
  723. case 0x9b :
  724. L2DTB.size = 4;
  725. L2DTB.associative = 0;
  726. L2DTB.linesize = 96;
  727. break;
  728. case 0xb0 :
  729. ITB.size = 4;
  730. ITB.associative = 4;
  731. ITB.linesize = 128;
  732. break;
  733. case 0xb1 :
  734. LITB.size = 4096;
  735. LITB.associative = 4;
  736. LITB.linesize = 4;
  737. break;
  738. case 0xb2 :
  739. ITB.size = 4;
  740. ITB.associative = 4;
  741. ITB.linesize = 64;
  742. break;
  743. case 0xb3 :
  744. DTB.size = 4;
  745. DTB.associative = 4;
  746. DTB.linesize = 128;
  747. break;
  748. case 0xb4 :
  749. DTB.size = 4;
  750. DTB.associative = 4;
  751. DTB.linesize = 256;
  752. break;
  753. case 0xba :
  754. DTB.size = 4;
  755. DTB.associative = 4;
  756. DTB.linesize = 64;
  757. break;
  758. case 0xd0 :
  759. L3.size = 512;
  760. L3.associative = 4;
  761. L3.linesize = 64;
  762. break;
  763. case 0xd1 :
  764. L3.size = 1024;
  765. L3.associative = 4;
  766. L3.linesize = 64;
  767. break;
  768. case 0xd2 :
  769. L3.size = 2048;
  770. L3.associative = 4;
  771. L3.linesize = 64;
  772. break;
  773. case 0xd6 :
  774. L3.size = 1024;
  775. L3.associative = 8;
  776. L3.linesize = 64;
  777. break;
  778. case 0xd7 :
  779. L3.size = 2048;
  780. L3.associative = 8;
  781. L3.linesize = 64;
  782. break;
  783. case 0xd8 :
  784. L3.size = 4096;
  785. L3.associative = 8;
  786. L3.linesize = 64;
  787. break;
  788. case 0xdc :
  789. L3.size = 2048;
  790. L3.associative = 12;
  791. L3.linesize = 64;
  792. break;
  793. case 0xdd :
  794. L3.size = 4096;
  795. L3.associative = 12;
  796. L3.linesize = 64;
  797. break;
  798. case 0xde :
  799. L3.size = 8192;
  800. L3.associative = 12;
  801. L3.linesize = 64;
  802. break;
  803. case 0xe2 :
  804. L3.size = 2048;
  805. L3.associative = 16;
  806. L3.linesize = 64;
  807. break;
  808. case 0xe3 :
  809. L3.size = 4096;
  810. L3.associative = 16;
  811. L3.linesize = 64;
  812. break;
  813. case 0xe4 :
  814. L3.size = 8192;
  815. L3.associative = 16;
  816. L3.linesize = 64;
  817. break;
  818. }
  819. }
  820. }
  821. if (get_vendor() == VENDOR_INTEL) {
  822. cpuid(0x80000000, &cpuid_level, &ebx, &ecx, &edx);
  823. if (cpuid_level >= 0x80000006) {
  824. if(L2.size<=0){
  825. //If we didn't detect L2 correctly before,
  826. cpuid(0x80000006, &eax, &ebx, &ecx, &edx);
  827. L2.size = BITMASK(ecx, 16, 0xffff);
  828. L2.associative = BITMASK(ecx, 12, 0x0f);
  829. switch (L2.associative){
  830. case 0x06:
  831. L2.associative = 8;
  832. break;
  833. case 0x08:
  834. L2.associative = 16;
  835. break;
  836. }
  837. L2.linesize = BITMASK(ecx, 0, 0xff);
  838. }
  839. }
  840. }
  841. if ((get_vendor() == VENDOR_AMD) || (get_vendor() == VENDOR_CENTAUR)) {
  842. cpuid(0x80000005, &eax, &ebx, &ecx, &edx);
  843. LDTB.size = 4096;
  844. LDTB.associative = BITMASK(eax, 24, 0xff);
  845. if (LDTB.associative == 0xff) LDTB.associative = 0;
  846. LDTB.linesize = BITMASK(eax, 16, 0xff);
  847. LITB.size = 4096;
  848. LITB.associative = BITMASK(eax, 8, 0xff);
  849. if (LITB.associative == 0xff) LITB.associative = 0;
  850. LITB.linesize = BITMASK(eax, 0, 0xff);
  851. DTB.size = 4;
  852. DTB.associative = BITMASK(ebx, 24, 0xff);
  853. if (DTB.associative == 0xff) DTB.associative = 0;
  854. DTB.linesize = BITMASK(ebx, 16, 0xff);
  855. ITB.size = 4;
  856. ITB.associative = BITMASK(ebx, 8, 0xff);
  857. if (ITB.associative == 0xff) ITB.associative = 0;
  858. ITB.linesize = BITMASK(ebx, 0, 0xff);
  859. LD1.size = BITMASK(ecx, 24, 0xff);
  860. LD1.associative = BITMASK(ecx, 16, 0xff);
  861. if (LD1.associative == 0xff) LD1.associative = 0;
  862. LD1.linesize = BITMASK(ecx, 0, 0xff);
  863. LC1.size = BITMASK(ecx, 24, 0xff);
  864. LC1.associative = BITMASK(ecx, 16, 0xff);
  865. if (LC1.associative == 0xff) LC1.associative = 0;
  866. LC1.linesize = BITMASK(ecx, 0, 0xff);
  867. cpuid(0x80000006, &eax, &ebx, &ecx, &edx);
  868. L2LDTB.size = 4096;
  869. L2LDTB.associative = BITMASK(eax, 24, 0xff);
  870. if (L2LDTB.associative == 0xff) L2LDTB.associative = 0;
  871. L2LDTB.linesize = BITMASK(eax, 16, 0xff);
  872. L2LITB.size = 4096;
  873. L2LITB.associative = BITMASK(eax, 8, 0xff);
  874. if (L2LITB.associative == 0xff) L2LITB.associative = 0;
  875. L2LITB.linesize = BITMASK(eax, 0, 0xff);
  876. L2DTB.size = 4;
  877. L2DTB.associative = BITMASK(ebx, 24, 0xff);
  878. if (L2DTB.associative == 0xff) L2DTB.associative = 0;
  879. L2DTB.linesize = BITMASK(ebx, 16, 0xff);
  880. L2ITB.size = 4;
  881. L2ITB.associative = BITMASK(ebx, 8, 0xff);
  882. if (L2ITB.associative == 0xff) L2ITB.associative = 0;
  883. L2ITB.linesize = BITMASK(ebx, 0, 0xff);
  884. if(L2.size <= 0){
  885. //If we didn't detect L2 correctly before,
  886. L2.size = BITMASK(ecx, 16, 0xffff);
  887. L2.associative = BITMASK(ecx, 12, 0xf);
  888. switch (L2.associative){
  889. case 0x06:
  890. L2.associative = 8;
  891. break;
  892. case 0x08:
  893. L2.associative = 16;
  894. break;
  895. }
  896. if (L2.associative == 0xff) L2.associative = 0;
  897. L2.linesize = BITMASK(ecx, 0, 0xff);
  898. }
  899. L3.size = BITMASK(edx, 18, 0x3fff) * 512;
  900. L3.associative = BITMASK(edx, 12, 0xf);
  901. if (L3.associative == 0xff) L2.associative = 0;
  902. L3.linesize = BITMASK(edx, 0, 0xff);
  903. }
  904. switch (type) {
  905. case CACHE_INFO_L1_I :
  906. *cacheinfo = LC1;
  907. break;
  908. case CACHE_INFO_L1_D :
  909. *cacheinfo = LD1;
  910. break;
  911. case CACHE_INFO_L2 :
  912. *cacheinfo = L2;
  913. break;
  914. case CACHE_INFO_L3 :
  915. *cacheinfo = L3;
  916. break;
  917. case CACHE_INFO_L1_DTB :
  918. *cacheinfo = DTB;
  919. break;
  920. case CACHE_INFO_L1_ITB :
  921. *cacheinfo = ITB;
  922. break;
  923. case CACHE_INFO_L1_LDTB :
  924. *cacheinfo = LDTB;
  925. break;
  926. case CACHE_INFO_L1_LITB :
  927. *cacheinfo = LITB;
  928. break;
  929. case CACHE_INFO_L2_DTB :
  930. *cacheinfo = L2DTB;
  931. break;
  932. case CACHE_INFO_L2_ITB :
  933. *cacheinfo = L2ITB;
  934. break;
  935. case CACHE_INFO_L2_LDTB :
  936. *cacheinfo = L2LDTB;
  937. break;
  938. case CACHE_INFO_L2_LITB :
  939. *cacheinfo = L2LITB;
  940. break;
  941. }
  942. return 0;
  943. }
  944. int get_cpuname(void){
  945. int family, exfamily, model, vendor, exmodel;
  946. if (!have_cpuid()) return CPUTYPE_80386;
  947. family = get_cputype(GET_FAMILY);
  948. exfamily = get_cputype(GET_EXFAMILY);
  949. model = get_cputype(GET_MODEL);
  950. exmodel = get_cputype(GET_EXMODEL);
  951. vendor = get_vendor();
  952. if (vendor == VENDOR_INTEL){
  953. switch (family) {
  954. case 0x4:
  955. return CPUTYPE_80486;
  956. case 0x5:
  957. return CPUTYPE_PENTIUM;
  958. case 0x6:
  959. switch (exmodel) {
  960. case 0:
  961. switch (model) {
  962. case 1:
  963. case 3:
  964. case 5:
  965. case 6:
  966. return CPUTYPE_PENTIUM2;
  967. case 7:
  968. case 8:
  969. case 10:
  970. case 11:
  971. return CPUTYPE_PENTIUM3;
  972. case 9:
  973. case 13:
  974. case 14:
  975. return CPUTYPE_PENTIUMM;
  976. case 15:
  977. return CPUTYPE_CORE2;
  978. }
  979. break;
  980. case 1:
  981. switch (model) {
  982. case 6:
  983. return CPUTYPE_CORE2;
  984. case 7:
  985. return CPUTYPE_PENRYN;
  986. case 10:
  987. case 11:
  988. case 14:
  989. case 15:
  990. return CPUTYPE_NEHALEM;
  991. case 12:
  992. return CPUTYPE_ATOM;
  993. case 13:
  994. return CPUTYPE_DUNNINGTON;
  995. }
  996. break;
  997. case 2:
  998. switch (model) {
  999. case 5:
  1000. //Intel Core (Clarkdale) / Core (Arrandale)
  1001. // Pentium (Clarkdale) / Pentium Mobile (Arrandale)
  1002. // Xeon (Clarkdale), 32nm
  1003. return CPUTYPE_NEHALEM;
  1004. case 10:
  1005. //Intel Core i5-2000 /i7-2000 (Sandy Bridge)
  1006. if(support_avx())
  1007. return CPUTYPE_SANDYBRIDGE;
  1008. else
  1009. return CPUTYPE_NEHALEM; //OS doesn't support AVX
  1010. case 12:
  1011. //Xeon Processor 5600 (Westmere-EP)
  1012. return CPUTYPE_NEHALEM;
  1013. case 13:
  1014. //Intel Core i7-3000 / Xeon E5 (Sandy Bridge)
  1015. if(support_avx())
  1016. return CPUTYPE_SANDYBRIDGE;
  1017. else
  1018. return CPUTYPE_NEHALEM;
  1019. case 14:
  1020. // Xeon E7540
  1021. case 15:
  1022. //Xeon Processor E7 (Westmere-EX)
  1023. return CPUTYPE_NEHALEM;
  1024. }
  1025. break;
  1026. case 3:
  1027. switch (model) {
  1028. case 7:
  1029. // Bay Trail
  1030. return CPUTYPE_ATOM;
  1031. case 10:
  1032. case 14:
  1033. // Ivy Bridge
  1034. if(support_avx())
  1035. return CPUTYPE_SANDYBRIDGE;
  1036. else
  1037. return CPUTYPE_NEHALEM;
  1038. case 12:
  1039. case 15:
  1040. if(support_avx())
  1041. #ifndef NO_AVX2
  1042. return CPUTYPE_HASWELL;
  1043. #else
  1044. return CPUTYPE_SANDYBRIDGE;
  1045. #endif
  1046. else
  1047. return CPUTYPE_NEHALEM;
  1048. case 13:
  1049. //Broadwell
  1050. if(support_avx())
  1051. #ifndef NO_AVX2
  1052. return CPUTYPE_HASWELL;
  1053. #else
  1054. return CPUTYPE_SANDYBRIDGE;
  1055. #endif
  1056. else
  1057. return CPUTYPE_NEHALEM;
  1058. }
  1059. break;
  1060. case 4:
  1061. switch (model) {
  1062. case 5:
  1063. case 6:
  1064. if(support_avx())
  1065. #ifndef NO_AVX2
  1066. return CPUTYPE_HASWELL;
  1067. #else
  1068. return CPUTYPE_SANDYBRIDGE;
  1069. #endif
  1070. else
  1071. return CPUTYPE_NEHALEM;
  1072. case 7:
  1073. case 15:
  1074. //Broadwell
  1075. if(support_avx())
  1076. #ifndef NO_AVX2
  1077. return CPUTYPE_HASWELL;
  1078. #else
  1079. return CPUTYPE_SANDYBRIDGE;
  1080. #endif
  1081. else
  1082. return CPUTYPE_NEHALEM;
  1083. case 14:
  1084. //Skylake
  1085. if(support_avx())
  1086. #ifndef NO_AVX2
  1087. return CPUTYPE_HASWELL;
  1088. #else
  1089. return CPUTYPE_SANDYBRIDGE;
  1090. #endif
  1091. else
  1092. return CPUTYPE_NEHALEM;
  1093. case 12:
  1094. // Braswell
  1095. case 13:
  1096. // Avoton
  1097. return CPUTYPE_NEHALEM;
  1098. }
  1099. break;
  1100. case 5:
  1101. switch (model) {
  1102. case 6:
  1103. //Broadwell
  1104. if(support_avx())
  1105. #ifndef NO_AVX2
  1106. return CPUTYPE_HASWELL;
  1107. #else
  1108. return CPUTYPE_SANDYBRIDGE;
  1109. #endif
  1110. else
  1111. return CPUTYPE_NEHALEM;
  1112. case 5:
  1113. case 14:
  1114. // Skylake
  1115. if(support_avx())
  1116. #ifndef NO_AVX2
  1117. return CPUTYPE_HASWELL;
  1118. #else
  1119. return CPUTYPE_SANDYBRIDGE;
  1120. #endif
  1121. else
  1122. return CPUTYPE_NEHALEM;
  1123. }
  1124. break;
  1125. }
  1126. break;
  1127. case 0x7:
  1128. return CPUTYPE_ITANIUM;
  1129. case 0xf:
  1130. switch (exfamily) {
  1131. case 0 :
  1132. return CPUTYPE_PENTIUM4;
  1133. case 1 :
  1134. return CPUTYPE_ITANIUM;
  1135. }
  1136. break;
  1137. }
  1138. return CPUTYPE_INTEL_UNKNOWN;
  1139. }
  1140. if (vendor == VENDOR_AMD){
  1141. switch (family) {
  1142. case 0x4:
  1143. return CPUTYPE_AMD5X86;
  1144. case 0x5:
  1145. return CPUTYPE_AMDK6;
  1146. case 0x6:
  1147. return CPUTYPE_ATHLON;
  1148. case 0xf:
  1149. switch (exfamily) {
  1150. case 0:
  1151. case 2:
  1152. return CPUTYPE_OPTERON;
  1153. case 1:
  1154. case 3:
  1155. case 10:
  1156. return CPUTYPE_BARCELONA;
  1157. case 6:
  1158. switch (model) {
  1159. case 1:
  1160. //AMD Bulldozer Opteron 6200 / Opteron 4200 / AMD FX-Series
  1161. if(support_avx())
  1162. return CPUTYPE_BULLDOZER;
  1163. else
  1164. return CPUTYPE_BARCELONA; //OS don't support AVX.
  1165. case 2: //AMD Piledriver
  1166. case 3: //AMD Richland
  1167. if(support_avx())
  1168. return CPUTYPE_PILEDRIVER;
  1169. else
  1170. return CPUTYPE_BARCELONA; //OS don't support AVX.
  1171. case 0:
  1172. switch(exmodel){
  1173. case 1: //AMD Trinity
  1174. if(support_avx())
  1175. return CPUTYPE_PILEDRIVER;
  1176. else
  1177. return CPUTYPE_BARCELONA; //OS don't support AVX.
  1178. case 3:
  1179. if(support_avx())
  1180. return CPUTYPE_STEAMROLLER;
  1181. else
  1182. return CPUTYPE_BARCELONA; //OS don't support AVX.
  1183. case 6:
  1184. if(support_avx())
  1185. return CPUTYPE_EXCAVATOR;
  1186. else
  1187. return CPUTYPE_BARCELONA; //OS don't support AVX.
  1188. }
  1189. break;
  1190. }
  1191. break;
  1192. case 5:
  1193. return CPUTYPE_BOBCAT;
  1194. }
  1195. break;
  1196. }
  1197. return CPUTYPE_AMD_UNKNOWN;
  1198. }
  1199. if (vendor == VENDOR_CYRIX){
  1200. switch (family) {
  1201. case 0x4:
  1202. return CPUTYPE_CYRIX5X86;
  1203. case 0x5:
  1204. return CPUTYPE_CYRIXM1;
  1205. case 0x6:
  1206. return CPUTYPE_CYRIXM2;
  1207. }
  1208. return CPUTYPE_CYRIX_UNKNOWN;
  1209. }
  1210. if (vendor == VENDOR_NEXGEN){
  1211. switch (family) {
  1212. case 0x5:
  1213. return CPUTYPE_NEXGENNX586;
  1214. }
  1215. return CPUTYPE_NEXGEN_UNKNOWN;
  1216. }
  1217. if (vendor == VENDOR_CENTAUR){
  1218. switch (family) {
  1219. case 0x5:
  1220. return CPUTYPE_CENTAURC6;
  1221. break;
  1222. case 0x6:
  1223. return CPUTYPE_NANO;
  1224. break;
  1225. }
  1226. return CPUTYPE_VIAC3;
  1227. }
  1228. if (vendor == VENDOR_RISE){
  1229. switch (family) {
  1230. case 0x5:
  1231. return CPUTYPE_RISEMP6;
  1232. }
  1233. return CPUTYPE_RISE_UNKNOWN;
  1234. }
  1235. if (vendor == VENDOR_SIS){
  1236. switch (family) {
  1237. case 0x5:
  1238. return CPUTYPE_SYS55X;
  1239. }
  1240. return CPUTYPE_SIS_UNKNOWN;
  1241. }
  1242. if (vendor == VENDOR_TRANSMETA){
  1243. switch (family) {
  1244. case 0x5:
  1245. return CPUTYPE_CRUSOETM3X;
  1246. }
  1247. return CPUTYPE_TRANSMETA_UNKNOWN;
  1248. }
  1249. if (vendor == VENDOR_NSC){
  1250. switch (family) {
  1251. case 0x5:
  1252. return CPUTYPE_NSGEODE;
  1253. }
  1254. return CPUTYPE_NSC_UNKNOWN;
  1255. }
  1256. return CPUTYPE_UNKNOWN;
  1257. }
  /*
   * Upper-case CPU names.  get_cpunamechar() and get_cpuconfig() index this
   * table with the value returned by get_cpuname(), so the order must follow
   * the numeric values of the CPUTYPE_* constants (defined elsewhere).
   */
  static char *cpuname[] = {
    /* generic and per-vendor "unknown" entries */
    "UNKNOWN", "INTEL_UNKNOWN", "UMC_UNKNOWN", "AMD_UNKNOWN",
    "CYRIX_UNKNOWN", "NEXGEN_UNKNOWN", "CENTAUR_UNKNOWN", "RISE_UNKNOWN",
    "SIS_UNKNOWN", "TRANSMETA_UNKNOWN", "NSC_UNKNOWN",

    "80386", "80486",
    "PENTIUM", "PENTIUM2", "PENTIUM3", "PENTIUMM", "PENTIUM4",
    "CORE2", "PENRYN", "DUNNINGTON", "NEHALEM", "ATOM",
    "ITANIUM", "ITANIUM2",

    "5X86", "K6", "ATHLON", "DURON", "OPTERON",
    "BARCELONA", "SHANGHAI", "ISTANBUL",

    "CYRIX5X86", "CYRIXM1", "CYRIXM2",
    "NEXGENNX586", "CENTAURC6", "RISEMP6", "SYS55X", "TM3X00", "NSGEODE",
    "VIAC3", "NANO",

    "SANDYBRIDGE", "BOBCAT", "BULLDOZER", "PILEDRIVER",
    "HASWELL", "STEAMROLLER", "EXCAVATOR",
  };
  /*
   * Lower-case CPU names.  get_lower_cpunamechar() indexes this table with
   * the value returned by get_cpuname(), exactly as cpuname[] is indexed, so
   * the two tables must have the same length and the same order.
   *
   * The "viac3" entry was previously missing, which shifted every name from
   * "nano" onward by one slot and left the last index out of bounds.
   *
   * NOTE(review): "tms3x00" does not match the upper-case entry "TM3X00".
   * It is left unchanged here; confirm whether any consumer depends on it.
   */
  static char *lowercpuname[] = {
    "unknown",
    "intel_unknown",
    "umc_unknown",
    "amd_unknown",
    "cyrix_unknown",
    "nexgen_unknown",
    "centaur_unknown",
    "rise_unknown",
    "sis_unknown",
    "transmeta_unknown",
    "nsc_unknown",
    "80386",
    "80486",
    "pentium",
    "pentium2",
    "pentium3",
    "pentiumm",
    "pentium4",
    "core2",
    "penryn",
    "dunnington",
    "nehalem",
    "atom",
    "itanium",
    "itanium2",
    "5x86",
    "k6",
    "athlon",
    "duron",
    "opteron",
    "barcelona",
    "shanghai",
    "istanbul",
    "cyrix5x86",
    "cyrixm1",
    "cyrixm2",
    "nexgennx586",
    "centaurc6",
    "risemp6",
    "sys55x",
    "tms3x00",
    "nsgeode",
    "viac3",
    "nano",
    "sandybridge",
    "bobcat",
    "bulldozer",
    "piledriver",
    "haswell",
    "steamroller",
    "excavator",
  };
  /*
   * Upper-case core names.  get_corename() and get_cpuconfig() index this
   * table with the value returned by get_coretype(), so the order must follow
   * the numeric values of the CORE_* constants (defined elsewhere).
   *
   * Entry 0 was misspelled "UNKOWN"; it now reads "UNKNOWN", matching the
   * "unknown" entry at the same position in corename_lower[].
   */
  static char *corename[] = {
    "UNKNOWN",
    "80486",
    "P5",
    "P6",
    "KATMAI",
    "COPPERMINE",
    "NORTHWOOD",
    "PRESCOTT",
    "BANIAS",
    "ATHLON",
    "OPTERON",
    "BARCELONA",
    "VIAC3",
    "YONAH",
    "CORE2",
    "PENRYN",
    "DUNNINGTON",
    "NEHALEM",
    "ATOM",
    "NANO",
    "SANDYBRIDGE",
    "BOBCAT",
    "BULLDOZER",
    "PILEDRIVER",
    "HASWELL",
    "STEAMROLLER",
    "EXCAVATOR",
  };
  /*
   * Lower-case core names.  get_libname() indexes this table with the value
   * returned by get_coretype(); the entries are in the same order as
   * corename[].
   */
  static char *corename_lower[] = {
    "unknown",
    "80486", "p5", "p6", "katmai", "coppermine",
    "northwood", "prescott", "banias",
    "athlon", "opteron", "barcelona",
    "viac3", "yonah",
    "core2", "penryn", "dunnington", "nehalem", "atom",
    "nano",
    "sandybridge", "bobcat", "bulldozer", "piledriver",
    "haswell", "steamroller", "excavator",
  };
  1421. char *get_cpunamechar(void){
  1422. return cpuname[get_cpuname()];
  1423. }
  1424. char *get_lower_cpunamechar(void){
  1425. return lowercpuname[get_cpuname()];
  1426. }
  1427. int get_coretype(void){
  1428. int family, exfamily, model, exmodel, vendor;
  1429. if (!have_cpuid()) return CORE_80486;
  1430. family = get_cputype(GET_FAMILY);
  1431. exfamily = get_cputype(GET_EXFAMILY);
  1432. model = get_cputype(GET_MODEL);
  1433. exmodel = get_cputype(GET_EXMODEL);
  1434. vendor = get_vendor();
  1435. if (vendor == VENDOR_INTEL){
  1436. switch (family) {
  1437. case 4:
  1438. return CORE_80486;
  1439. case 5:
  1440. return CORE_P5;
  1441. case 6:
  1442. switch (exmodel) {
  1443. case 0:
  1444. switch (model) {
  1445. case 0:
  1446. case 1:
  1447. case 2:
  1448. case 3:
  1449. case 4:
  1450. case 5:
  1451. case 6:
  1452. return CORE_P6;
  1453. case 7:
  1454. return CORE_KATMAI;
  1455. case 8:
  1456. case 10:
  1457. case 11:
  1458. return CORE_COPPERMINE;
  1459. case 9:
  1460. case 13:
  1461. case 14:
  1462. return CORE_BANIAS;
  1463. case 15:
  1464. return CORE_CORE2;
  1465. }
  1466. break;
  1467. case 1:
  1468. switch (model) {
  1469. case 6:
  1470. return CORE_CORE2;
  1471. case 7:
  1472. return CORE_PENRYN;
  1473. case 10:
  1474. case 11:
  1475. case 14:
  1476. case 15:
  1477. return CORE_NEHALEM;
  1478. case 12:
  1479. return CORE_ATOM;
  1480. case 13:
  1481. return CORE_DUNNINGTON;
  1482. }
  1483. break;
  1484. case 2:
  1485. switch (model) {
  1486. case 5:
  1487. //Intel Core (Clarkdale) / Core (Arrandale)
  1488. // Pentium (Clarkdale) / Pentium Mobile (Arrandale)
  1489. // Xeon (Clarkdale), 32nm
  1490. return CORE_NEHALEM;
  1491. case 10:
  1492. //Intel Core i5-2000 /i7-2000 (Sandy Bridge)
  1493. if(support_avx())
  1494. return CORE_SANDYBRIDGE;
  1495. else
  1496. return CORE_NEHALEM; //OS doesn't support AVX
  1497. case 12:
  1498. //Xeon Processor 5600 (Westmere-EP)
  1499. return CORE_NEHALEM;
  1500. case 13:
  1501. //Intel Core i7-3000 / Xeon E5 (Sandy Bridge)
  1502. if(support_avx())
  1503. return CORE_SANDYBRIDGE;
  1504. else
  1505. return CORE_NEHALEM; //OS doesn't support AVX
  1506. case 14:
  1507. //Xeon E7540
  1508. case 15:
  1509. //Xeon Processor E7 (Westmere-EX)
  1510. return CORE_NEHALEM;
  1511. }
  1512. break;
  1513. case 3:
  1514. switch (model) {
  1515. case 10:
  1516. case 14:
  1517. if(support_avx())
  1518. return CORE_SANDYBRIDGE;
  1519. else
  1520. return CORE_NEHALEM; //OS doesn't support AVX
  1521. case 12:
  1522. case 15:
  1523. if(support_avx())
  1524. #ifndef NO_AVX2
  1525. return CORE_HASWELL;
  1526. #else
  1527. return CORE_SANDYBRIDGE;
  1528. #endif
  1529. else
  1530. return CORE_NEHALEM;
  1531. case 13:
  1532. //broadwell
  1533. if(support_avx())
  1534. #ifndef NO_AVX2
  1535. return CORE_HASWELL;
  1536. #else
  1537. return CORE_SANDYBRIDGE;
  1538. #endif
  1539. else
  1540. return CORE_NEHALEM;
  1541. }
  1542. break;
  1543. case 4:
  1544. switch (model) {
  1545. case 5:
  1546. case 6:
  1547. if(support_avx())
  1548. #ifndef NO_AVX2
  1549. return CORE_HASWELL;
  1550. #else
  1551. return CORE_SANDYBRIDGE;
  1552. #endif
  1553. else
  1554. return CORE_NEHALEM;
  1555. case 7:
  1556. case 15:
  1557. //broadwell
  1558. if(support_avx())
  1559. #ifndef NO_AVX2
  1560. return CORE_HASWELL;
  1561. #else
  1562. return CORE_SANDYBRIDGE;
  1563. #endif
  1564. else
  1565. return CORE_NEHALEM;
  1566. case 14:
  1567. //Skylake
  1568. if(support_avx())
  1569. #ifndef NO_AVX2
  1570. return CORE_HASWELL;
  1571. #else
  1572. return CORE_SANDYBRIDGE;
  1573. #endif
  1574. else
  1575. return CORE_NEHALEM;
  1576. case 12:
  1577. // Braswell
  1578. case 13:
  1579. // Avoton
  1580. return CORE_NEHALEM;
  1581. }
  1582. break;
  1583. case 5:
  1584. switch (model) {
  1585. case 6:
  1586. //broadwell
  1587. if(support_avx())
  1588. #ifndef NO_AVX2
  1589. return CORE_HASWELL;
  1590. #else
  1591. return CORE_SANDYBRIDGE;
  1592. #endif
  1593. else
  1594. return CORE_NEHALEM;
  1595. case 5:
  1596. case 14:
  1597. // Skylake
  1598. if(support_avx())
  1599. #ifndef NO_AVX2
  1600. return CORE_HASWELL;
  1601. #else
  1602. return CORE_SANDYBRIDGE;
  1603. #endif
  1604. else
  1605. return CORE_NEHALEM;
  1606. }
  1607. break;
  1608. }
  1609. break;
  1610. case 15:
  1611. if (model <= 0x2) return CORE_NORTHWOOD;
  1612. else return CORE_PRESCOTT;
  1613. }
  1614. }
  1615. if (vendor == VENDOR_AMD){
  1616. if (family <= 0x5) return CORE_80486;
  1617. if (family <= 0xe) return CORE_ATHLON;
  1618. if (family == 0xf){
  1619. if ((exfamily == 0) || (exfamily == 2)) return CORE_OPTERON;
  1620. else if (exfamily == 5) return CORE_BOBCAT;
  1621. else if (exfamily == 6) {
  1622. switch (model) {
  1623. case 1:
  1624. //AMD Bulldozer Opteron 6200 / Opteron 4200 / AMD FX-Series
  1625. if(support_avx())
  1626. return CORE_BULLDOZER;
  1627. else
  1628. return CORE_BARCELONA; //OS don't support AVX.
  1629. case 2: //AMD Piledriver
  1630. case 3: //AMD Richland
  1631. if(support_avx())
  1632. return CORE_PILEDRIVER;
  1633. else
  1634. return CORE_BARCELONA; //OS don't support AVX.
  1635. case 0:
  1636. switch(exmodel){
  1637. case 1: //AMD Trinity
  1638. if(support_avx())
  1639. return CORE_PILEDRIVER;
  1640. else
  1641. return CORE_BARCELONA; //OS don't support AVX.
  1642. case 3:
  1643. if(support_avx())
  1644. return CORE_STEAMROLLER;
  1645. else
  1646. return CORE_BARCELONA; //OS don't support AVX.
  1647. case 6:
  1648. if(support_avx())
  1649. return CORE_EXCAVATOR;
  1650. else
  1651. return CORE_BARCELONA; //OS don't support AVX.
  1652. }
  1653. break;
  1654. }
  1655. }else return CORE_BARCELONA;
  1656. }
  1657. }
  1658. if (vendor == VENDOR_CENTAUR) {
  1659. switch (family) {
  1660. case 0x6:
  1661. return CORE_NANO;
  1662. break;
  1663. }
  1664. return CORE_VIAC3;
  1665. }
  1666. return CORE_UNKNOWN;
  1667. }
  1668. void get_cpuconfig(void){
  1669. cache_info_t info;
  1670. int features;
  1671. printf("#define %s\n", cpuname[get_cpuname()]);
  1672. if (get_coretype() != CORE_P5) {
  1673. get_cacheinfo(CACHE_INFO_L1_I, &info);
  1674. if (info.size > 0) {
  1675. printf("#define L1_CODE_SIZE %d\n", info.size * 1024);
  1676. printf("#define L1_CODE_ASSOCIATIVE %d\n", info.associative);
  1677. printf("#define L1_CODE_LINESIZE %d\n", info.linesize);
  1678. }
  1679. get_cacheinfo(CACHE_INFO_L1_D, &info);
  1680. if (info.size > 0) {
  1681. printf("#define L1_DATA_SIZE %d\n", info.size * 1024);
  1682. printf("#define L1_DATA_ASSOCIATIVE %d\n", info.associative);
  1683. printf("#define L1_DATA_LINESIZE %d\n", info.linesize);
  1684. }
  1685. get_cacheinfo(CACHE_INFO_L2, &info);
  1686. if (info.size > 0) {
  1687. printf("#define L2_SIZE %d\n", info.size * 1024);
  1688. printf("#define L2_ASSOCIATIVE %d\n", info.associative);
  1689. printf("#define L2_LINESIZE %d\n", info.linesize);
  1690. } else {
  1691. //fall back for some virtual machines.
  1692. printf("#define L2_SIZE 1048576\n");
  1693. printf("#define L2_ASSOCIATIVE 6\n");
  1694. printf("#define L2_LINESIZE 64\n");
  1695. }
  1696. get_cacheinfo(CACHE_INFO_L3, &info);
  1697. if (info.size > 0) {
  1698. printf("#define L3_SIZE %d\n", info.size * 1024);
  1699. printf("#define L3_ASSOCIATIVE %d\n", info.associative);
  1700. printf("#define L3_LINESIZE %d\n", info.linesize);
  1701. }
  1702. get_cacheinfo(CACHE_INFO_L1_ITB, &info);
  1703. if (info.size > 0) {
  1704. printf("#define ITB_SIZE %d\n", info.size * 1024);
  1705. printf("#define ITB_ASSOCIATIVE %d\n", info.associative);
  1706. printf("#define ITB_ENTRIES %d\n", info.linesize);
  1707. }
  1708. get_cacheinfo(CACHE_INFO_L1_DTB, &info);
  1709. if (info.size > 0) {
  1710. printf("#define DTB_SIZE %d\n", info.size * 1024);
  1711. printf("#define DTB_ASSOCIATIVE %d\n", info.associative);
  1712. printf("#define DTB_DEFAULT_ENTRIES %d\n", info.linesize);
  1713. } else {
  1714. //fall back for some virtual machines.
  1715. printf("#define DTB_DEFAULT_ENTRIES 32\n");
  1716. }
  1717. features = get_cputype(GET_FEATURE);
  1718. if (features & HAVE_CMOV ) printf("#define HAVE_CMOV\n");
  1719. if (features & HAVE_MMX ) printf("#define HAVE_MMX\n");
  1720. if (features & HAVE_SSE ) printf("#define HAVE_SSE\n");
  1721. if (features & HAVE_SSE2 ) printf("#define HAVE_SSE2\n");
  1722. if (features & HAVE_SSE3 ) printf("#define HAVE_SSE3\n");
  1723. if (features & HAVE_SSSE3) printf("#define HAVE_SSSE3\n");
  1724. if (features & HAVE_SSE4_1) printf("#define HAVE_SSE4_1\n");
  1725. if (features & HAVE_SSE4_2) printf("#define HAVE_SSE4_2\n");
  1726. if (features & HAVE_SSE4A) printf("#define HAVE_SSE4A\n");
  1727. if (features & HAVE_SSE5 ) printf("#define HAVE_SSSE5\n");
  1728. if (features & HAVE_AVX ) printf("#define HAVE_AVX\n");
  1729. if (features & HAVE_3DNOWEX) printf("#define HAVE_3DNOWEX\n");
  1730. if (features & HAVE_3DNOW) printf("#define HAVE_3DNOW\n");
  1731. if (features & HAVE_FMA4 ) printf("#define HAVE_FMA4\n");
  1732. if (features & HAVE_FMA3 ) printf("#define HAVE_FMA3\n");
  1733. if (features & HAVE_CFLUSH) printf("#define HAVE_CFLUSH\n");
  1734. if (features & HAVE_HIT) printf("#define HAVE_HIT 1\n");
  1735. if (features & HAVE_MISALIGNSSE) printf("#define HAVE_MISALIGNSSE\n");
  1736. if (features & HAVE_128BITFPU) printf("#define HAVE_128BITFPU\n");
  1737. if (features & HAVE_FASTMOVU) printf("#define HAVE_FASTMOVU\n");
  1738. printf("#define NUM_SHAREDCACHE %d\n", get_cputype(GET_NUMSHARE) + 1);
  1739. printf("#define NUM_CORES %d\n", get_cputype(GET_NUMCORES) + 1);
  1740. features = get_coretype();
  1741. if (features > 0) printf("#define CORE_%s\n", corename[features]);
  1742. } else {
  1743. printf("#define DTB_DEFAULT_ENTRIES 16\n");
  1744. printf("#define L1_CODE_SIZE 8192\n");
  1745. printf("#define L1_DATA_SIZE 8192\n");
  1746. printf("#define L2_SIZE 0\n");
  1747. }
  1748. }
  /*
   * Prints the architecture name to stdout without a trailing newline:
   * "X86_64" when __64BIT__ is defined at compile time, "X86" otherwise.
   */
  void get_architecture(void){
  #ifdef __64BIT__
    printf("X86_64");
  #else
    printf("X86");
  #endif
  }
  /*
   * Prints the upper-case CPU name returned by get_cpunamechar() to stdout,
   * without a trailing newline.
   */
  void get_subarchitecture(void){
    char *name = get_cpunamechar();

    printf("%s", name);
  }
  /*
   * Prints the lower-case architecture name to stdout without a trailing
   * newline: "x86_64" when __64BIT__ is defined at compile time, "x86"
   * otherwise.
   */
  void get_subdirname(void){
  #ifdef __64BIT__
    printf("x86_64");
  #else
    printf("x86");
  #endif
  }
  1766. char *get_corename(void){
  1767. return corename[get_coretype()];
  1768. }
  1769. void get_libname(void){
  1770. printf("%s", corename_lower[get_coretype()]);
  1771. }
  1772. /* This if for Makefile */
  1773. void get_sse(void){
  1774. int features;
  1775. features = get_cputype(GET_FEATURE);
  1776. if (features & HAVE_MMX ) printf("HAVE_MMX=1\n");
  1777. if (features & HAVE_SSE ) printf("HAVE_SSE=1\n");
  1778. if (features & HAVE_SSE2 ) printf("HAVE_SSE2=1\n");
  1779. if (features & HAVE_SSE3 ) printf("HAVE_SSE3=1\n");
  1780. if (features & HAVE_SSSE3) printf("HAVE_SSSE3=1\n");
  1781. if (features & HAVE_SSE4_1) printf("HAVE_SSE4_1=1\n");
  1782. if (features & HAVE_SSE4_2) printf("HAVE_SSE4_2=1\n");
  1783. if (features & HAVE_SSE4A) printf("HAVE_SSE4A=1\n");
  1784. if (features & HAVE_SSE5 ) printf("HAVE_SSSE5=1\n");
  1785. if (features & HAVE_AVX ) printf("HAVE_AVX=1\n");
  1786. if (features & HAVE_3DNOWEX) printf("HAVE_3DNOWEX=1\n");
  1787. if (features & HAVE_3DNOW) printf("HAVE_3DNOW=1\n");
  1788. if (features & HAVE_FMA4 ) printf("HAVE_FMA4=1\n");
  1789. if (features & HAVE_FMA3 ) printf("HAVE_FMA3=1\n");
  1790. }