12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
71278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177
71778177917801781178217831784178517861787178817891790179117921793179417951796179717981799180018011802180318041805180618071808180918101811181218131814181518161817181818191820182118221823182418251826182718281829183018311832183318341835183618371838183918401841184218431844184518461847184818491850185118521853185418551856185718581859186018611862186318641865186618671868186918701871187218731874187518761877187818791880188118821883188418851886188718881889189018911892189318941895189618971898189919001901190219031904190519061907190819091910191119121913191419151916191719181919192019211922192319241925192619271928192919301931193219331934193519361937193819391940194119421943194419451946194719481949195019511952195319541955195619571958195919601961196219631964196519661967196819691970197119721973197419751976197719781979198019811982198319841985198619871988198919901991199219931994199519961997199819992000200120022003200420052006200720082009201020112012201320142015201620172018201920202021202220232024202520262027202820292030203120322033203420352036203720382039204020412042204320442045204620472048204920502051205220532054205520562057205820592060206120622063206420652066206720682069207020712072207320742075207620772078207920802081208220832084208520862087208820892090209120922093209420952096209720982099210021012102210321042105210621072108210921102111211221132114211521162117211821192120212121222123212421252126212721282129213021312132213321342135213621372138213921402141214221432144214521462147214821492150215121522153215421552156215721582159216021612162216321642165216621672168216921702171217221732174217521762177217821792180218121822183218421852186218721882189219021912192219321942195219621972198219922002201220222032204220522062207220822092210221122122213221422152216221722182219222022212222222322242225222622272228222922302231223222332234223522362237223822392240224122422243224422452246224722482249225022512252225322542255225622572258225922602261226222632264226522662267226822692270227122722273227422752276227
72278227922802281228222832284228522862287228822892290229122922293229422952296229722982299230023012302230323042305230623072308230923102311231223132314231523162317231823192320232123222323232423252326232723282329233023312332233323342335233623372338233923402341234223432344234523462347234823492350235123522353235423552356235723582359236023612362236323642365236623672368236923702371237223732374237523762377237823792380238123822383238423852386238723882389239023912392239323942395239623972398239924002401240224032404240524062407240824092410241124122413241424152416241724182419242024212422242324242425242624272428242924302431243224332434243524362437243824392440244124422443244424452446244724482449245024512452245324542455245624572458245924602461246224632464246524662467246824692470247124722473247424752476247724782479248024812482248324842485248624872488248924902491249224932494249524962497249824992500250125022503250425052506250725082509251025112512251325142515251625172518251925202521252225232524252525262527252825292530253125322533253425352536253725382539254025412542254325442545254625472548254925502551255225532554255525562557255825592560256125622563256425652566256725682569257025712572257325742575257625772578257925802581258225832584258525862587258825892590259125922593259425952596259725982599260026012602260326042605260626072608260926102611261226132614261526162617261826192620262126222623262426252626262726282629263026312632263326342635263626372638263926402641264226432644264526462647264826492650265126522653265426552656265726582659266026612662266326642665266626672668266926702671267226732674267526762677267826792680268126822683268426852686268726882689269026912692269326942695269626972698269927002701270227032704270527062707270827092710271127122713271427152716271727182719272027212722272327242725272627272728272927302731273227332734273527362737273827392740274127422743274427452746274727482749275027512752275327542755275627572758275927602761276227632764276527662767276827692770277127722773277427752776277
72778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327
73278327932803281328232833284328532863287328832893290329132923293329432953296329732983299330033013302330333043305330633073308330933103311331233133314331533163317331833193320332133223323332433253326332733283329333033313332333333343335333633373338333933403341334233433344334533463347334833493350335133523353335433553356335733583359336033613362336333643365336633673368336933703371337233733374337533763377337833793380338133823383338433853386338733883389339033913392339333943395339633973398339934003401340234033404340534063407340834093410341134123413341434153416341734183419342034213422342334243425342634273428342934303431343234333434343534363437343834393440344134423443344434453446344734483449345034513452345334543455345634573458345934603461346234633464346534663467346834693470347134723473347434753476347734783479348034813482348334843485348634873488348934903491349234933494349534963497349834993500350135023503350435053506350735083509351035113512351335143515351635173518351935203521352235233524352535263527352835293530353135323533353435353536353735383539354035413542354335443545354635473548354935503551355235533554355535563557355835593560356135623563356435653566356735683569357035713572357335743575357635773578357935803581358235833584358535863587358835893590359135923593359435953596359735983599360036013602360336043605360636073608360936103611361236133614361536163617361836193620362136223623362436253626362736283629363036313632363336343635363636373638363936403641364236433644364536463647364836493650365136523653365436553656365736583659366036613662366336643665366636673668366936703671367236733674367536763677367836793680368136823683368436853686368736883689369036913692369336943695369636973698369937003701370237033704370537063707370837093710371137123713371437153716371737183719372037213722372337243725372637273728372937303731373237333734373537363737373837393740374137423743374437453746374737483749375037513752375337543755375637573758375937603761376237633764376537663767376837693770377137723773377437753776377
73778377937803781378237833784378537863787378837893790379137923793379437953796379737983799380038013802380338043805380638073808380938103811381238133814381538163817381838193820382138223823382438253826382738283829383038313832383338343835383638373838383938403841384238433844384538463847384838493850385138523853385438553856385738583859386038613862386338643865386638673868386938703871387238733874387538763877387838793880388138823883388438853886388738883889389038913892389338943895389638973898389939003901390239033904390539063907390839093910391139123913391439153916391739183919392039213922392339243925392639273928392939303931393239333934393539363937393839393940394139423943394439453946394739483949395039513952395339543955395639573958395939603961396239633964396539663967396839693970397139723973397439753976397739783979398039813982398339843985398639873988398939903991399239933994399539963997399839994000400140024003400440054006400740084009401040114012401340144015401640174018401940204021402240234024402540264027402840294030403140324033403440354036403740384039404040414042404340444045404640474048404940504051405240534054405540564057405840594060406140624063406440654066406740684069407040714072407340744075407640774078407940804081408240834084408540864087408840894090409140924093409440954096409740984099410041014102410341044105410641074108410941104111411241134114411541164117411841194120412141224123412441254126412741284129413041314132413341344135413641374138413941404141414241434144414541464147414841494150415141524153415441554156415741584159416041614162416341644165416641674168416941704171417241734174417541764177417841794180418141824183418441854186418741884189419041914192419341944195419641974198419942004201420242034204420542064207420842094210421142124213421442154216421742184219422042214222422342244225422642274228422942304231423242334234423542364237423842394240424142424243424442454246424742484249425042514252425342544255425642574258425942604261426242634264426542664267426842694270427142724273427442754276427
74278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477
74778477947804781478247834784478547864787478847894790479147924793479447954796479747984799480048014802480348044805480648074808480948104811481248134814481548164817481848194820482148224823482448254826482748284829483048314832483348344835483648374838483948404841484248434844484548464847484848494850485148524853485448554856485748584859486048614862486348644865486648674868486948704871487248734874487548764877487848794880488148824883488448854886488748884889489048914892489348944895489648974898489949004901490249034904490549064907490849094910491149124913491449154916491749184919492049214922492349244925492649274928492949304931493249334934493549364937493849394940494149424943494449454946494749484949495049514952495349544955495649574958495949604961496249634964496549664967496849694970497149724973497449754976497749784979498049814982498349844985498649874988498949904991499249934994499549964997499849995000500150025003500450055006500750085009501050115012501350145015501650175018501950205021502250235024502550265027502850295030503150325033503450355036503750385039504050415042504350445045504650475048504950505051505250535054505550565057505850595060506150625063506450655066506750685069507050715072507350745075507650775078507950805081508250835084508550865087508850895090509150925093509450955096509750985099510051015102510351045105510651075108510951105111511251135114511551165117511851195120512151225123512451255126512751285129513051315132513351345135513651375138513951405141514251435144514551465147514851495150515151525153515451555156515751585159516051615162516351645165516651675168516951705171517251735174517551765177517851795180518151825183518451855186518751885189519051915192519351945195519651975198519952005201520252035204520552065207520852095210521152125213521452155216521752185219522052215222522352245225522652275228522952305231523252335234523552365237523852395240524152425243524452455246524752485249525052515252525352545255525652575258525952605261526252635264526552665267526852695270527152725273527452755276527
75278527952805281528252835284528552865287528852895290529152925293529452955296529752985299530053015302530353045305530653075308530953105311531253135314531553165317531853195320532153225323532453255326532753285329533053315332533353345335533653375338533953405341534253435344534553465347534853495350535153525353535453555356535753585359536053615362536353645365536653675368536953705371537253735374537553765377537853795380538153825383538453855386538753885389539053915392539353945395539653975398539954005401540254035404540554065407540854095410541154125413541454155416541754185419542054215422542354245425542654275428542954305431543254335434543554365437543854395440544154425443544454455446544754485449545054515452545354545455545654575458545954605461546254635464546554665467546854695470547154725473547454755476547754785479548054815482548354845485548654875488548954905491549254935494549554965497549854995500550155025503550455055506550755085509551055115512551355145515551655175518551955205521552255235524552555265527552855295530553155325533553455355536553755385539554055415542554355445545554655475548554955505551555255535554555555565557555855595560556155625563556455655566556755685569557055715572557355745575557655775578557955805581558255835584558555865587558855895590559155925593559455955596559755985599560056015602560356045605560656075608560956105611561256135614561556165617561856195620562156225623562456255626562756285629563056315632563356345635563656375638563956405641564256435644564556465647564856495650565156525653565456555656565756585659566056615662566356645665566656675668566956705671567256735674567556765677567856795680568156825683568456855686568756885689569056915692569356945695569656975698569957005701570257035704570557065707570857095710571157125713571457155716571757185719572057215722572357245725572657275728572957305731573257335734573557365737573857395740574157425743574457455746574757485749575057515752575357545755575657575758575957605761576257635764576557665767576857695770577157725773577457755776577
75778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967596859695970597159725973597459755976597759785979598059815982598359845985598659875988598959905991599259935994599559965997599859996000600160026003600460056006600760086009601060116012601360146015601660176018601960206021602260236024602560266027602860296030603160326033603460356036603760386039604060416042604360446045604660476048604960506051605260536054605560566057605860596060606160626063606460656066606760686069607060716072607360746075607660776078607960806081608260836084608560866087608860896090609160926093609460956096609760986099610061016102610361046105610661076108610961106111611261136114611561166117611861196120612161226123612461256126612761286129613061316132613361346135613661376138613961406141614261436144614561466147614861496150615161526153615461556156615761586159616061616162616361646165616661676168616961706171617261736174617561766177617861796180618161826183618461856186618761886189619061916192619361946195619661976198619962006201620262036204620562066207620862096210621162126213621462156216621762186219622062216222622362246225622662276228622962306231623262336234623562366237623862396240624162426243624462456246624762486249625062516252625362546255625662576258625962606261626262636264626562666267626862696270627162726273627462756276627
76278627962806281628262836284628562866287628862896290629162926293629462956296629762986299630063016302630363046305630663076308630963106311631263136314631563166317631863196320632163226323632463256326632763286329633063316332633363346335633663376338633963406341634263436344634563466347634863496350635163526353635463556356635763586359636063616362636363646365636663676368636963706371637263736374637563766377637863796380638163826383638463856386638763886389639063916392639363946395639663976398639964006401640264036404640564066407640864096410641164126413641464156416641764186419642064216422642364246425642664276428642964306431643264336434643564366437643864396440644164426443644464456446644764486449645064516452645364546455645664576458645964606461646264636464646564666467646864696470647164726473647464756476647764786479648064816482648364846485648664876488648964906491649264936494649564966497649864996500650165026503650465056506650765086509651065116512651365146515651665176518651965206521652265236524652565266527652865296530653165326533653465356536653765386539654065416542654365446545654665476548654965506551655265536554655565566557655865596560656165626563656465656566656765686569657065716572657365746575657665776578657965806581658265836584658565866587658865896590659165926593659465956596659765986599660066016602660366046605660666076608660966106611661266136614661566166617661866196620662166226623662466256626662766286629663066316632663366346635663666376638663966406641664266436644664566466647664866496650665166526653665466556656665766586659666066616662666366646665666666676668666966706671667266736674667566766677667866796680668166826683668466856686668766886689669066916692669366946695669666976698669967006701670267036704670567066707670867096710671167126713671467156716671767186719672067216722672367246725672667276728672967306731673267336734673567366737673867396740674167426743674467456746674767486749675067516752675367546755675667576758675967606761676267636764676567666767676867696770677167726773677467756776677
76778677967806781678267836784678567866787678867896790679167926793679467956796679767986799680068016802680368046805680668076808680968106811681268136814681568166817681868196820682168226823682468256826682768286829683068316832683368346835683668376838683968406841684268436844684568466847684868496850685168526853685468556856685768586859686068616862686368646865686668676868686968706871687268736874687568766877687868796880688168826883688468856886688768886889689068916892689368946895689668976898689969006901690269036904690569066907690869096910691169126913691469156916691769186919692069216922692369246925692669276928692969306931693269336934693569366937693869396940694169426943694469456946694769486949695069516952695369546955695669576958695969606961696269636964696569666967696869696970697169726973697469756976697769786979698069816982698369846985698669876988698969906991699269936994699569966997699869997000700170027003700470057006700770087009701070117012701370147015701670177018701970207021702270237024702570267027702870297030703170327033703470357036703770387039704070417042704370447045704670477048704970507051705270537054705570567057705870597060706170627063706470657066706770687069707070717072707370747075707670777078707970807081708270837084708570867087708870897090709170927093709470957096709770987099710071017102710371047105710671077108710971107111711271137114711571167117711871197120712171227123712471257126712771287129713071317132713371347135713671377138713971407141714271437144714571467147714871497150715171527153715471557156715771587159716071617162716371647165716671677168716971707171717271737174717571767177717871797180718171827183718471857186718771887189719071917192719371947195719671977198719972007201720272037204720572067207720872097210721172127213721472157216721772187219722072217222722372247225722672277228722972307231723272337234723572367237723872397240724172427243724472457246724772487249725072517252725372547255725672577258725972607261726272637264726572667267726872697270727172727273727472757276727
77278727972807281728272837284728572867287728872897290729172927293729472957296729772987299730073017302730373047305730673077308730973107311731273137314731573167317731873197320732173227323732473257326732773287329733073317332733373347335733673377338733973407341734273437344734573467347734873497350735173527353735473557356735773587359736073617362736373647365736673677368736973707371737273737374737573767377737873797380738173827383738473857386738773887389739073917392739373947395739673977398739974007401740274037404740574067407740874097410741174127413741474157416741774187419742074217422742374247425742674277428742974307431743274337434743574367437743874397440744174427443744474457446744774487449745074517452745374547455745674577458745974607461746274637464746574667467746874697470747174727473747474757476747774787479748074817482748374847485748674877488748974907491749274937494749574967497749874997500750175027503750475057506750775087509751075117512751375147515751675177518751975207521752275237524752575267527752875297530753175327533753475357536753775387539754075417542754375447545754675477548754975507551755275537554755575567557755875597560756175627563756475657566756775687569757075717572757375747575757675777578757975807581758275837584758575867587758875897590759175927593759475957596759775987599760076017602760376047605760676077608760976107611761276137614761576167617761876197620762176227623762476257626762776287629763076317632763376347635763676377638763976407641764276437644764576467647764876497650765176527653765476557656765776587659766076617662766376647665766676677668766976707671767276737674767576767677767876797680768176827683768476857686768776887689769076917692769376947695769676977698769977007701770277037704770577067707770877097710771177127713771477157716771777187719772077217722772377247725772677277728772977307731773277337734773577367737773877397740774177427743774477457746774777487749775077517752775377547755775677577758775977607761776277637764776577667767776877697770777177727773777477757776777
77778777977807781778277837784778577867787778877897790779177927793779477957796779777987799780078017802780378047805780678077808780978107811781278137814781578167817781878197820782178227823782478257826782778287829783078317832783378347835783678377838783978407841784278437844784578467847784878497850785178527853785478557856785778587859786078617862786378647865786678677868786978707871787278737874787578767877787878797880788178827883788478857886788778887889789078917892789378947895789678977898789979007901790279037904790579067907790879097910791179127913791479157916791779187919792079217922792379247925792679277928792979307931793279337934793579367937793879397940794179427943794479457946794779487949795079517952795379547955795679577958795979607961796279637964796579667967796879697970797179727973797479757976797779787979798079817982798379847985798679877988798979907991799279937994799579967997799879998000800180028003800480058006800780088009801080118012801380148015801680178018801980208021802280238024802580268027802880298030803180328033803480358036803780388039804080418042804380448045804680478048804980508051805280538054805580568057805880598060806180628063806480658066806780688069807080718072807380748075807680778078807980808081808280838084808580868087808880898090809180928093809480958096809780988099810081018102810381048105810681078108810981108111811281138114811581168117811881198120812181228123812481258126812781288129813081318132813381348135813681378138813981408141814281438144814581468147814881498150815181528153815481558156815781588159816081618162816381648165816681678168816981708171817281738174817581768177817881798180818181828183818481858186818781888189819081918192819381948195819681978198819982008201820282038204820582068207820882098210821182128213821482158216821782188219822082218222822382248225822682278228822982308231823282338234823582368237823882398240824182428243824482458246824782488249825082518252825382548255825682578258825982608261826282638264826582668267826882698270827182728273827482758276827
78278827982808281828282838284828582868287828882898290829182928293829482958296829782988299830083018302830383048305830683078308830983108311831283138314831583168317831883198320832183228323832483258326832783288329833083318332833383348335833683378338833983408341834283438344834583468347834883498350835183528353835483558356835783588359836083618362836383648365836683678368836983708371837283738374837583768377837883798380838183828383838483858386838783888389839083918392839383948395839683978398839984008401840284038404840584068407840884098410841184128413841484158416841784188419842084218422842384248425842684278428842984308431843284338434843584368437843884398440844184428443844484458446844784488449845084518452845384548455845684578458845984608461846284638464846584668467846884698470847184728473847484758476847784788479848084818482848384848485848684878488848984908491849284938494849584968497849884998500850185028503850485058506850785088509851085118512851385148515851685178518851985208521852285238524852585268527852885298530853185328533853485358536853785388539854085418542854385448545854685478548854985508551855285538554855585568557855885598560856185628563856485658566856785688569857085718572857385748575857685778578857985808581858285838584858585868587858885898590859185928593859485958596859785988599860086018602860386048605860686078608860986108611861286138614861586168617861886198620862186228623862486258626862786288629863086318632863386348635863686378638863986408641864286438644864586468647864886498650865186528653865486558656865786588659866086618662866386648665866686678668866986708671867286738674867586768677867886798680868186828683868486858686868786888689869086918692869386948695869686978698869987008701870287038704870587068707870887098710871187128713871487158716871787188719872087218722872387248725872687278728872987308731873287338734873587368737873887398740874187428743874487458746874787488749875087518752875387548755875687578758875987608761876287638764876587668767876887698770877187728773877487758776877
78778877987808781878287838784878587868787878887898790879187928793879487958796879787988799880088018802880388048805880688078808880988108811881288138814881588168817881888198820882188228823882488258826882788288829883088318832883388348835883688378838883988408841884288438844884588468847884888498850885188528853885488558856885788588859886088618862886388648865886688678868886988708871887288738874887588768877887888798880888188828883888488858886888788888889889088918892889388948895889688978898889989008901890289038904890589068907890889098910891189128913891489158916891789188919892089218922892389248925892689278928892989308931893289338934893589368937893889398940894189428943894489458946894789488949895089518952895389548955895689578958895989608961896289638964896589668967896889698970897189728973897489758976897789788979898089818982898389848985898689878988898989908991899289938994899589968997899889999000900190029003900490059006900790089009901090119012901390149015901690179018901990209021902290239024902590269027902890299030903190329033903490359036903790389039904090419042904390449045904690479048904990509051905290539054905590569057905890599060906190629063906490659066906790689069907090719072907390749075907690779078907990809081908290839084908590869087908890899090909190929093909490959096909790989099910091019102910391049105910691079108910991109111911291139114911591169117911891199120912191229123912491259126912791289129913091319132913391349135913691379138913991409141914291439144914591469147914891499150915191529153915491559156915791589159916091619162916391649165916691679168916991709171917291739174917591769177917891799180918191829183918491859186918791889189919091919192919391949195919691979198919992009201920292039204920592069207920892099210921192129213921492159216921792189219922092219222922392249225922692279228922992309231923292339234923592369237923892399240924192429243924492459246924792489249925092519252925392549255925692579258925992609261926292639264926592669267926892699270927192729273927492759276927
79278927992809281928292839284928592869287928892899290929192929293929492959296929792989299930093019302930393049305930693079308930993109311931293139314931593169317931893199320932193229323932493259326932793289329933093319332933393349335933693379338933993409341934293439344934593469347934893499350935193529353935493559356935793589359936093619362936393649365936693679368936993709371937293739374937593769377937893799380938193829383938493859386938793889389939093919392939393949395939693979398939994009401940294039404940594069407940894099410941194129413941494159416941794189419942094219422942394249425942694279428942994309431943294339434943594369437943894399440944194429443944494459446944794489449945094519452945394549455945694579458945994609461946294639464946594669467946894699470947194729473947494759476947794789479948094819482948394849485948694879488948994909491949294939494949594969497949894999500950195029503950495059506950795089509951095119512951395149515951695179518951995209521952295239524952595269527952895299530953195329533953495359536953795389539954095419542954395449545954695479548954995509551955295539554955595569557955895599560956195629563956495659566956795689569957095719572957395749575957695779578957995809581958295839584958595869587958895899590959195929593959495959596959795989599960096019602960396049605960696079608960996109611961296139614961596169617961896199620962196229623962496259626962796289629963096319632963396349635963696379638963996409641964296439644964596469647964896499650965196529653965496559656965796589659966096619662966396649665966696679668966996709671967296739674967596769677967896799680968196829683968496859686968796889689969096919692969396949695969696979698969997009701970297039704970597069707970897099710971197129713971497159716971797189719972097219722972397249725972697279728972997309731973297339734973597369737973897399740974197429743974497459746974797489749975097519752975397549755975697579758975997609761976297639764976597669767976897699770977197729773977497759776977
79778977997809781978297839784978597869787978897899790979197929793979497959796979797989799980098019802980398049805980698079808980998109811981298139814981598169817981898199820982198229823982498259826982798289829983098319832983398349835983698379838983998409841984298439844984598469847984898499850985198529853985498559856985798589859986098619862986398649865986698679868986998709871987298739874987598769877987898799880988198829883988498859886988798889889989098919892989398949895989698979898989999009901990299039904990599069907990899099910991199129913991499159916991799189919992099219922992399249925992699279928992999309931993299339934993599369937993899399940994199429943994499459946994799489949995099519952995399549955995699579958995999609961996299639964996599669967996899699970997199729973997499759976997799789979998099819982998399849985998699879988998999909991999299939994999599969997999899991000010001100021000310004100051000610007100081000910010100111001210013100141001510016100171001810019100201002110022100231002410025100261002710028100291003010031100321003310034100351003610037100381003910040100411004210043100441004510046100471004810049100501005110052100531005410055100561005710058100591006010061100621006310064100651006610067100681006910070100711007210073100741007510076100771007810079100801008110082100831008410085100861008710088100891009010091100921009310094100951009610097100981009910100101011010210103101041010510106101071010810109101101011110112101131011410115101161011710118101191012010121101221012310124101251012610127101281012910130101311013210133101341013510136101371013810139101401014110142101431014410145101461014710148101491015010151101521015310154101551015610157101581015910160101611016210163101641016510166101671016810169101701017110172101731017410175101761017710178101791018010181101821018310184101851018610187101881018910190101911019210193101941019510196101971019810199102001020110202102031020410205102061020710208102091021010211102121021310214102151021610217102181021910220102211
02221022310224102251022610227102281022910230102311023210233102341023510236102371023810239102401024110242102431024410245102461024710248102491025010251102521025310254102551025610257102581025910260102611026210263102641026510266102671026810269102701027110272102731027410275102761027710278102791028010281102821028310284102851028610287102881028910290102911029210293102941029510296102971029810299103001030110302103031030410305103061030710308103091031010311103121031310314103151031610317103181031910320103211032210323103241032510326103271032810329103301033110332103331033410335103361033710338103391034010341103421034310344103451034610347103481034910350103511035210353103541035510356103571035810359103601036110362103631036410365103661036710368103691037010371103721037310374103751037610377103781037910380103811038210383103841038510386103871038810389103901039110392103931039410395103961039710398103991040010401104021040310404104051040610407104081040910410104111041210413104141041510416104171041810419104201042110422104231042410425104261042710428104291043010431104321043310434104351043610437104381043910440104411044210443104441044510446104471044810449104501045110452104531045410455104561045710458104591046010461104621046310464104651046610467104681046910470104711047210473104741047510476104771047810479104801048110482104831048410485104861048710488104891049010491104921049310494104951049610497104981049910500105011050210503105041050510506105071050810509105101051110512105131051410515105161051710518105191052010521105221052310524105251052610527105281052910530105311053210533105341053510536105371053810539105401054110542105431054410545105461054710548105491055010551105521055310554105551055610557105581055910560105611056210563105641056510566105671056810569105701057110572105731057410575105761057710578105791058010581105821058310584105851058610587105881058910590105911059210593105941059510596105971059810599106001060110602106031060410605106061060710608106091061010611106121061310614106151061610617106181061910620106211
06221062310624106251062610627106281062910630106311063210633106341063510636106371063810639106401064110642106431064410645106461064710648106491065010651106521065310654106551065610657106581065910660106611066210663106641066510666106671066810669106701067110672106731067410675106761067710678106791068010681106821068310684106851068610687106881068910690106911069210693106941069510696106971069810699107001070110702107031070410705107061070710708107091071010711107121071310714107151071610717107181071910720107211072210723107241072510726107271072810729107301073110732107331073410735107361073710738107391074010741107421074310744107451074610747107481074910750107511075210753107541075510756107571075810759107601076110762107631076410765107661076710768107691077010771107721077310774107751077610777107781077910780107811078210783107841078510786107871078810789107901079110792107931079410795107961079710798107991080010801108021080310804108051080610807108081080910810108111081210813108141081510816108171081810819108201082110822108231082410825108261082710828108291083010831108321083310834108351083610837108381083910840108411084210843108441084510846108471084810849108501085110852108531085410855108561085710858108591086010861108621086310864108651086610867108681086910870108711087210873108741087510876108771087810879108801088110882108831088410885108861088710888108891089010891108921089310894108951089610897108981089910900109011090210903109041090510906109071090810909109101091110912109131091410915109161091710918109191092010921109221092310924109251092610927109281092910930109311093210933109341093510936109371093810939109401094110942109431094410945109461094710948109491095010951109521095310954109551095610957109581095910960109611096210963109641096510966109671096810969109701097110972109731097410975109761097710978109791098010981109821098310984109851098610987109881098910990109911099210993109941099510996109971099810999110001100111002110031100411005110061100711008110091101011011110121101311014110151101611017110181101911020110211
10221102311024110251102611027110281102911030110311103211033110341103511036110371103811039110401104111042110431104411045110461104711048110491105011051110521105311054110551105611057110581105911060110611106211063110641106511066110671106811069110701107111072110731107411075110761107711078110791108011081110821108311084110851108611087110881108911090110911109211093110941109511096110971109811099111001110111102111031110411105111061110711108111091111011111111121111311114111151111611117111181111911120111211112211123111241112511126111271112811129111301113111132111331113411135111361113711138111391114011141111421114311144111451114611147111481114911150111511115211153111541115511156111571115811159111601116111162111631116411165111661116711168111691117011171111721117311174111751117611177111781117911180111811118211183111841118511186111871118811189111901119111192111931119411195111961119711198111991120011201112021120311204112051120611207112081120911210112111121211213112141121511216112171121811219112201122111222112231122411225112261122711228112291123011231112321123311234112351123611237112381123911240112411124211243112441124511246112471124811249112501125111252112531125411255112561125711258112591126011261112621126311264112651126611267112681126911270112711127211273112741127511276112771127811279112801128111282112831128411285112861128711288112891129011291112921129311294112951129611297112981129911300113011130211303113041130511306113071130811309113101131111312113131131411315113161131711318113191132011321113221132311324113251132611327113281132911330113311133211333113341133511336113371133811339113401134111342113431134411345113461134711348113491135011351113521135311354113551135611357113581135911360113611136211363113641136511366113671136811369113701137111372113731137411375113761137711378113791138011381113821138311384113851138611387113881138911390113911139211393113941139511396113971139811399114001140111402114031140411405114061140711408114091141011411114121141311414114151141611417114181141911420114211
14221142311424114251142611427114281142911430114311143211433114341143511436114371143811439114401144111442114431144411445114461144711448114491145011451114521145311454114551145611457114581145911460114611146211463114641146511466114671146811469114701147111472114731147411475114761147711478114791148011481114821148311484114851148611487114881148911490114911149211493114941149511496114971149811499115001150111502115031150411505115061150711508115091151011511115121151311514115151151611517115181151911520115211152211523115241152511526115271152811529115301153111532115331153411535115361153711538115391154011541115421154311544115451154611547115481154911550115511155211553115541155511556115571155811559115601156111562115631156411565115661156711568115691157011571115721157311574115751157611577115781157911580115811158211583115841158511586115871158811589115901159111592115931159411595115961159711598115991160011601116021160311604116051160611607116081160911610116111161211613116141161511616116171161811619116201162111622116231162411625116261162711628116291163011631116321163311634116351163611637116381163911640116411164211643116441164511646116471164811649116501165111652116531165411655116561165711658116591166011661116621166311664116651166611667116681166911670116711167211673116741167511676116771167811679116801168111682116831168411685116861168711688116891169011691116921169311694116951169611697116981169911700117011170211703117041170511706117071170811709117101171111712117131171411715117161171711718117191172011721117221172311724117251172611727117281172911730117311173211733117341173511736117371173811739117401174111742117431174411745117461174711748117491175011751117521175311754117551175611757117581175911760117611176211763117641176511766117671176811769117701177111772117731177411775117761177711778117791178011781117821178311784117851178611787117881178911790117911179211793117941179511796117971179811799118001180111802118031180411805118061180711808118091181011811118121181311814118151181611817118181181911820118211
18221182311824118251182611827118281182911830118311183211833118341183511836118371183811839118401184111842118431184411845118461184711848118491185011851118521185311854118551185611857118581185911860118611186211863118641186511866118671186811869118701187111872118731187411875118761187711878118791188011881118821188311884118851188611887118881188911890118911189211893118941189511896118971189811899119001190111902119031190411905119061190711908119091191011911119121191311914119151191611917119181191911920119211192211923119241192511926119271192811929119301193111932119331193411935119361193711938119391194011941119421194311944119451194611947119481194911950119511195211953119541195511956119571195811959119601196111962119631196411965119661196711968119691197011971119721197311974119751197611977119781197911980119811198211983119841198511986119871198811989119901199111992119931199411995119961199711998119991200012001120021200312004120051200612007120081200912010120111201212013120141201512016120171201812019120201202112022120231202412025120261202712028120291203012031120321203312034120351203612037120381203912040120411204212043120441204512046120471204812049120501205112052120531205412055120561205712058120591206012061120621206312064120651206612067120681206912070120711207212073120741207512076120771207812079120801208112082120831208412085120861208712088120891209012091120921209312094120951209612097120981209912100121011210212103121041210512106121071210812109121101211112112121131211412115121161211712118121191212012121121221212312124121251212612127121281212912130121311213212133121341213512136121371213812139121401214112142121431214412145121461214712148121491215012151121521215312154121551215612157121581215912160121611216212163121641216512166121671216812169121701217112172121731217412175121761217712178121791218012181121821218312184121851218612187121881218912190121911219212193121941219512196121971219812199122001220112202122031220412205122061220712208122091221012211122121221312214122151221612217122181221912220122211
22221222312224122251222612227122281222912230122311223212233122341223512236122371223812239122401224112242122431224412245122461224712248122491225012251122521225312254122551225612257122581225912260122611226212263122641226512266122671226812269122701227112272122731227412275122761227712278122791228012281122821228312284122851228612287122881228912290122911229212293122941229512296122971229812299123001230112302123031230412305123061230712308123091231012311123121231312314123151231612317123181231912320123211232212323123241232512326123271232812329123301233112332123331233412335123361233712338123391234012341123421234312344123451234612347123481234912350123511235212353123541235512356123571235812359123601236112362123631236412365123661236712368123691237012371123721237312374123751237612377123781237912380123811238212383123841238512386123871238812389123901239112392123931239412395123961239712398123991240012401124021240312404124051240612407124081240912410124111241212413124141241512416124171241812419124201242112422124231242412425124261242712428124291243012431124321243312434124351243612437124381243912440124411244212443124441244512446124471244812449124501245112452124531245412455124561245712458124591246012461124621246312464124651246612467124681246912470124711247212473124741247512476124771247812479124801248112482124831248412485124861248712488124891249012491124921249312494124951249612497124981249912500125011250212503125041250512506125071250812509125101251112512125131251412515125161251712518125191252012521125221252312524125251252612527125281252912530125311253212533125341253512536125371253812539125401254112542125431254412545125461254712548125491255012551125521255312554125551255612557125581255912560125611256212563125641256512566125671256812569125701257112572125731257412575125761257712578125791258012581125821258312584125851258612587125881258912590125911259212593125941259512596125971259812599126001260112602126031260412605126061260712608126091261012611126121261312614126151261612617126181261912620126211
26221262312624126251262612627126281262912630126311263212633126341263512636126371263812639126401264112642126431264412645126461264712648126491265012651126521265312654126551265612657126581265912660126611266212663126641266512666126671266812669126701267112672126731267412675126761267712678126791268012681126821268312684126851268612687126881268912690126911269212693126941269512696126971269812699127001270112702127031270412705127061270712708127091271012711127121271312714127151271612717127181271912720127211272212723127241272512726127271272812729127301273112732127331273412735127361273712738127391274012741127421274312744127451274612747127481274912750127511275212753127541275512756127571275812759127601276112762127631276412765127661276712768127691277012771127721277312774127751277612777127781277912780127811278212783127841278512786127871278812789127901279112792127931279412795127961279712798127991280012801128021280312804128051280612807128081280912810128111281212813128141281512816128171281812819128201282112822128231282412825128261282712828128291283012831128321283312834128351283612837128381283912840128411284212843128441284512846128471284812849128501285112852128531285412855128561285712858128591286012861128621286312864128651286612867128681286912870128711287212873128741287512876128771287812879128801288112882128831288412885128861288712888128891289012891128921289312894128951289612897128981289912900129011290212903129041290512906129071290812909129101291112912129131291412915129161291712918129191292012921129221292312924129251292612927129281292912930129311293212933129341293512936129371293812939129401294112942129431294412945129461294712948129491295012951129521295312954129551295612957129581295912960129611296212963129641296512966129671296812969129701297112972129731297412975129761297712978129791298012981129821298312984129851298612987129881298912990129911299212993129941299512996129971299812999130001300113002130031300413005130061300713008130091301013011130121301313014130151301613017130181301913020130211
30221302313024130251302613027130281302913030130311303213033130341303513036130371303813039130401304113042130431304413045130461304713048130491305013051130521305313054130551305613057130581305913060130611306213063130641306513066130671306813069130701307113072130731307413075130761307713078130791308013081130821308313084130851308613087130881308913090130911309213093130941309513096130971309813099131001310113102131031310413105131061310713108131091311013111131121311313114131151311613117131181311913120131211312213123131241312513126131271312813129131301313113132131331313413135131361313713138131391314013141131421314313144131451314613147131481314913150131511315213153131541315513156131571315813159131601316113162131631316413165131661316713168131691317013171131721317313174131751317613177131781317913180131811318213183131841318513186131871318813189131901319113192131931319413195131961319713198131991320013201132021320313204132051320613207132081320913210132111321213213132141321513216132171321813219132201322113222132231322413225132261322713228132291323013231132321323313234132351323613237132381323913240132411324213243132441324513246132471324813249132501325113252132531325413255132561325713258132591326013261132621326313264132651326613267132681326913270132711327213273132741327513276132771327813279132801328113282132831328413285132861328713288132891329013291132921329313294132951329613297132981329913300133011330213303133041330513306133071330813309133101331113312133131331413315133161331713318133191332013321133221332313324133251332613327133281332913330133311333213333133341333513336133371333813339133401334113342133431334413345133461334713348133491335013351133521335313354133551335613357133581335913360133611336213363133641336513366133671336813369133701337113372133731337413375133761337713378133791338013381133821338313384133851338613387133881338913390133911339213393133941339513396133971339813399134001340113402134031340413405134061340713408134091341013411134121341313414134151341613417134181341913420134211
34221342313424134251342613427134281342913430134311343213433134341343513436134371343813439134401344113442134431344413445134461344713448134491345013451134521345313454134551345613457134581345913460134611346213463134641346513466134671346813469134701347113472134731347413475134761347713478134791348013481134821348313484134851348613487134881348913490134911349213493134941349513496134971349813499135001350113502135031350413505135061350713508135091351013511135121351313514135151351613517135181351913520135211352213523135241352513526135271352813529135301353113532135331353413535135361353713538135391354013541135421354313544135451354613547135481354913550135511355213553135541355513556135571355813559135601356113562135631356413565135661356713568135691357013571135721357313574135751357613577135781357913580135811358213583135841358513586135871358813589135901359113592135931359413595135961359713598135991360013601136021360313604136051360613607136081360913610136111361213613136141361513616136171361813619136201362113622136231362413625136261362713628136291363013631136321363313634136351363613637136381363913640136411364213643136441364513646136471364813649136501365113652136531365413655136561365713658136591366013661136621366313664136651366613667136681366913670136711367213673136741367513676136771367813679136801368113682136831368413685136861368713688136891369013691136921369313694136951369613697136981369913700137011370213703137041370513706137071370813709137101371113712137131371413715137161371713718137191372013721137221372313724137251372613727137281372913730137311373213733137341373513736137371373813739137401374113742137431374413745137461374713748137491375013751137521375313754137551375613757137581375913760137611376213763137641376513766137671376813769137701377113772137731377413775137761377713778137791378013781137821378313784137851378613787137881378913790137911379213793137941379513796137971379813799138001380113802138031380413805138061380713808138091381013811138121381313814138151381613817138181381913820138211
38221382313824138251382613827138281382913830138311383213833138341383513836138371383813839138401384113842138431384413845138461384713848138491385013851138521385313854138551385613857138581385913860138611386213863138641386513866138671386813869138701387113872138731387413875138761387713878138791388013881138821388313884138851388613887138881388913890138911389213893138941389513896138971389813899139001390113902139031390413905139061390713908139091391013911139121391313914139151391613917139181391913920139211392213923139241392513926139271392813929139301393113932139331393413935139361393713938139391394013941139421394313944139451394613947139481394913950139511395213953139541395513956139571395813959139601396113962139631396413965139661396713968139691397013971139721397313974139751397613977139781397913980139811398213983139841398513986139871398813989139901399113992139931399413995139961399713998139991400014001140021400314004140051400614007140081400914010140111401214013140141401514016140171401814019140201402114022140231402414025140261402714028140291403014031140321403314034140351403614037140381403914040140411404214043140441404514046140471404814049140501405114052140531405414055140561405714058140591406014061140621406314064140651406614067140681406914070140711407214073140741407514076140771407814079140801408114082140831408414085140861408714088140891409014091140921409314094140951409614097140981409914100141011410214103141041410514106141071410814109141101411114112141131411414115141161411714118141191412014121141221412314124141251412614127141281412914130141311413214133141341413514136141371413814139141401414114142141431414414145141461414714148141491415014151141521415314154141551415614157141581415914160141611416214163141641416514166141671416814169141701417114172141731417414175141761417714178141791418014181141821418314184141851418614187141881418914190141911419214193141941419514196141971419814199142001420114202142031420414205142061420714208142091421014211142121421314214142151421614217142181421914220142211
42221422314224142251422614227142281422914230142311423214233142341423514236142371423814239142401424114242142431424414245142461424714248142491425014251142521425314254142551425614257142581425914260142611426214263142641426514266142671426814269142701427114272142731427414275142761427714278142791428014281142821428314284142851428614287142881428914290142911429214293142941429514296142971429814299143001430114302143031430414305143061430714308143091431014311143121431314314143151431614317143181431914320143211432214323143241432514326143271432814329143301433114332143331433414335143361433714338143391434014341143421434314344143451434614347143481434914350143511435214353143541435514356143571435814359143601436114362143631436414365143661436714368143691437014371143721437314374143751437614377143781437914380143811438214383143841438514386143871438814389143901439114392143931439414395143961439714398143991440014401144021440314404144051440614407144081440914410144111441214413144141441514416144171441814419144201442114422144231442414425144261442714428144291443014431144321443314434144351443614437144381443914440144411444214443144441444514446144471444814449144501445114452144531445414455144561445714458144591446014461144621446314464144651446614467144681446914470144711447214473144741447514476144771447814479144801448114482144831448414485144861448714488144891449014491144921449314494144951449614497144981449914500145011450214503145041450514506145071450814509145101451114512145131451414515145161451714518145191452014521145221452314524145251452614527145281452914530145311453214533145341453514536145371453814539145401454114542145431454414545145461454714548145491455014551145521455314554145551455614557145581455914560145611456214563145641456514566145671456814569145701457114572145731457414575145761457714578145791458014581145821458314584145851458614587145881458914590145911459214593145941459514596145971459814599146001460114602146031460414605146061460714608146091461014611146121461314614146151461614617146181461914620146211
46221462314624146251462614627146281462914630146311463214633146341463514636146371463814639146401464114642146431464414645146461464714648146491465014651146521465314654146551465614657146581465914660146611466214663146641466514666146671466814669146701467114672146731467414675146761467714678146791468014681146821468314684146851468614687146881468914690146911469214693146941469514696146971469814699147001470114702147031470414705147061470714708147091471014711147121471314714147151471614717147181471914720147211472214723147241472514726147271472814729147301473114732147331473414735147361473714738147391474014741147421474314744147451474614747147481474914750147511475214753147541475514756147571475814759147601476114762147631476414765147661476714768147691477014771147721477314774147751477614777147781477914780147811478214783147841478514786147871478814789147901479114792147931479414795147961479714798147991480014801148021480314804148051480614807148081480914810148111481214813148141481514816148171481814819148201482114822148231482414825148261482714828148291483014831148321483314834148351483614837148381483914840148411484214843148441484514846148471484814849148501485114852148531485414855148561485714858148591486014861148621486314864148651486614867148681486914870148711487214873148741487514876148771487814879148801488114882148831488414885148861488714888148891489014891148921489314894148951489614897148981489914900149011490214903149041490514906149071490814909149101491114912149131491414915149161491714918149191492014921149221492314924149251492614927149281492914930149311493214933149341493514936149371493814939149401494114942149431494414945149461494714948149491495014951149521495314954149551495614957149581495914960149611496214963149641496514966149671496814969149701497114972149731497414975149761497714978149791498014981149821498314984149851498614987149881498914990149911499214993149941499514996149971499814999150001500115002150031500415005150061500715008150091501015011150121501315014150151501615017150181501915020150211
50221502315024150251502615027150281502915030150311503215033150341503515036150371503815039150401504115042150431504415045150461504715048150491505015051150521505315054150551505615057150581505915060150611506215063150641506515066150671506815069150701507115072150731507415075150761507715078150791508015081150821508315084150851508615087150881508915090150911509215093150941509515096150971509815099151001510115102151031510415105151061510715108151091511015111151121511315114151151511615117151181511915120151211512215123151241512515126151271512815129151301513115132151331513415135151361513715138151391514015141151421514315144151451514615147151481514915150151511515215153151541515515156151571515815159151601516115162151631516415165151661516715168151691517015171151721517315174151751517615177151781517915180151811518215183151841518515186151871518815189151901519115192151931519415195151961519715198151991520015201152021520315204152051520615207152081520915210152111521215213152141521515216152171521815219152201522115222152231522415225152261522715228152291523015231152321523315234152351523615237152381523915240152411524215243152441524515246152471524815249152501525115252152531525415255152561525715258152591526015261152621526315264152651526615267152681526915270152711527215273152741527515276152771527815279152801528115282152831528415285152861528715288152891529015291152921529315294152951529615297152981529915300153011530215303153041530515306153071530815309153101531115312153131531415315153161531715318153191532015321153221532315324153251532615327153281532915330153311533215333153341533515336153371533815339153401534115342153431534415345153461534715348153491535015351153521535315354153551535615357153581535915360153611536215363153641536515366153671536815369153701537115372153731537415375153761537715378153791538015381153821538315384153851538615387153881538915390153911539215393153941539515396153971539815399154001540115402154031540415405154061540715408154091541015411154121541315414154151541615417154181541915420154211
54221542315424154251542615427154281542915430154311543215433154341543515436154371543815439154401544115442154431544415445154461544715448154491545015451154521545315454154551545615457154581545915460154611546215463154641546515466154671546815469154701547115472154731547415475154761547715478154791548015481154821548315484154851548615487154881548915490154911549215493154941549515496154971549815499155001550115502155031550415505155061550715508155091551015511155121551315514155151551615517155181551915520155211552215523155241552515526155271552815529155301553115532155331553415535155361553715538155391554015541155421554315544155451554615547155481554915550155511555215553155541555515556155571555815559155601556115562155631556415565155661556715568155691557015571155721557315574155751557615577155781557915580155811558215583155841558515586155871558815589155901559115592155931559415595155961559715598155991560015601156021560315604156051560615607156081560915610156111561215613156141561515616156171561815619156201562115622156231562415625156261562715628156291563015631156321563315634156351563615637156381563915640156411564215643156441564515646156471564815649156501565115652156531565415655156561565715658156591566015661156621566315664156651566615667156681566915670156711567215673156741567515676156771567815679156801568115682156831568415685156861568715688156891569015691156921569315694156951569615697156981569915700157011570215703157041570515706157071570815709157101571115712157131571415715157161571715718157191572015721157221572315724157251572615727157281572915730157311573215733157341573515736157371573815739157401574115742157431574415745157461574715748157491575015751157521575315754157551575615757157581575915760157611576215763157641576515766157671576815769157701577115772157731577415775157761577715778157791578015781157821578315784157851578615787157881578915790157911579215793157941579515796157971579815799158001580115802158031580415805158061580715808158091581015811158121581315814158151581615817158181581915820158211
582215823158241582515826158271582815829158301583115832158331583415835158361583715838158391584015841158421584315844158451584615847158481584915850158511585215853158541585515856158571585815859158601586115862158631586415865158661586715868158691587015871158721587315874158751587615877158781587915880158811588215883158841588515886158871588815889158901589115892158931589415895158961589715898158991590015901159021590315904159051590615907159081590915910159111591215913159141591515916159171591815919159201592115922159231592415925159261592715928159291593015931159321593315934159351593615937159381593915940159411594215943159441594515946159471594815949 |
- /* Copyright (C) 2013-2019 Free Software Foundation, Inc.
- This file is part of GCC.
- GCC is free software; you can redistribute it and/or modify
- it under the terms of the GNU General Public License as published by
- the Free Software Foundation; either version 3, or (at your option)
- any later version.
- GCC is distributed in the hope that it will be useful,
- but WITHOUT ANY WARRANTY; without even the implied warranty of
- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
- GNU General Public License for more details.
- Under Section 7 of GPL version 3, you are granted additional
- permissions described in the GCC Runtime Library Exception, version
- 3.1, as published by the Free Software Foundation.
- You should have received a copy of the GNU General Public License and
- a copy of the GCC Runtime Library Exception along with this program;
- see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
- <http://www.gnu.org/licenses/>. */
- /* Refuse direct inclusion: _IMMINTRIN_H_INCLUDED must already be defined. */
- #ifndef _IMMINTRIN_H_INCLUDED
- #error "Never use <avx512fintrin.h> directly; include <immintrin.h> instead."
- #endif
- /* Include guard for this header. */
- #ifndef _AVX512FINTRIN_H_INCLUDED
- #define _AVX512FINTRIN_H_INCLUDED
- /* When __AVX512F__ is not defined: save the current options, switch the
-    target to avx512f and define __DISABLE_AVX512F__.  NOTE(review): the marker
-    is presumably tested at the end of the header to pop the options again --
-    confirm against the rest of the file. */
- #ifndef __AVX512F__
- #pragma GCC push_options
- #pragma GCC target("avx512f")
- #define __DISABLE_AVX512F__
- #endif /* __AVX512F__ */
- /* Internal data types for implementing the intrinsics. */
- /* Each type below is a 64-byte vector of the named element type; the name
-    encodes the lane count and element kind (e.g. __v8df is 8 doubles, and a
-    trailing 'u' marks the unsigned element variant). */
- typedef double __v8df __attribute__ ((__vector_size__ (64)));
- typedef float __v16sf __attribute__ ((__vector_size__ (64)));
- typedef long long __v8di __attribute__ ((__vector_size__ (64)));
- typedef unsigned long long __v8du __attribute__ ((__vector_size__ (64)));
- typedef int __v16si __attribute__ ((__vector_size__ (64)));
- typedef unsigned int __v16su __attribute__ ((__vector_size__ (64)));
- typedef short __v32hi __attribute__ ((__vector_size__ (64)));
- typedef unsigned short __v32hu __attribute__ ((__vector_size__ (64)));
- typedef char __v64qi __attribute__ ((__vector_size__ (64)));
- typedef unsigned char __v64qu __attribute__ ((__vector_size__ (64)));
- /* The Intel API is flexible enough that we must allow aliasing with other
- vector types, and their scalar components. */
- typedef float __m512 __attribute__ ((__vector_size__ (64), __may_alias__));
- typedef long long __m512i __attribute__ ((__vector_size__ (64), __may_alias__));
- typedef double __m512d __attribute__ ((__vector_size__ (64), __may_alias__));
- /* Unaligned version of the same type. */
- typedef float __m512_u __attribute__ ((__vector_size__ (64), __may_alias__, __aligned__ (1)));
- typedef long long __m512i_u __attribute__ ((__vector_size__ (64), __may_alias__, __aligned__ (1)));
- typedef double __m512d_u __attribute__ ((__vector_size__ (64), __may_alias__, __aligned__ (1)));
- /* Mask types: __mmask8 is an unsigned char, __mmask16 an unsigned short. */
- typedef unsigned char __mmask8;
- typedef unsigned short __mmask16;
- /* Convert the integer __M to a 16-bit mask by casting it to __mmask16. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_int2mask (int __M)
- {
-   const __mmask16 __mask = (__mmask16) __M;
-   return __mask;
- }
- /* Convert the 16-bit mask __M to an int with a plain cast. */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask2int (__mmask16 __M)
- {
-   const int __value = (int) __M;
-   return __value;
- }
- /* Build a vector of eight 64-bit integers.  The initializer lists the
-    arguments in reverse, so __H becomes element 0 and __A element 7. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_epi64 (long long __A, long long __B, long long __C,
-                   long long __D, long long __E, long long __F,
-                   long long __G, long long __H)
- {
-   const __v8di __lanes = __extension__ (__v8di)
-     { __H, __G, __F, __E, __D, __C, __B, __A };
-   return (__m512i) __lanes;
- }
- /* Build a vector of sixteen 32-bit integers from __A .. __P.  The
-    initializer lists the arguments in reverse, so __P becomes element 0 and
-    __A element 15. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_epi32 (int __A, int __B, int __C, int __D,
-                   int __E, int __F, int __G, int __H,
-                   int __I, int __J, int __K, int __L,
-                   int __M, int __N, int __O, int __P)
- {
-   const __v16si __lanes = __extension__ (__v16si)
-     { __P, __O, __N, __M, __L, __K, __J, __I,
-       __H, __G, __F, __E, __D, __C, __B, __A };
-   return (__m512i) __lanes;
- }
- /* Build a vector of thirty-two 16-bit integers.  Parameters are declared
-    from __q31 down to __q00; the initializer lists them from __q00 up, so
-    __qNN becomes element NN. */
- extern __inline __m512i
- __attribute__((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_epi16 (short __q31, short __q30, short __q29, short __q28,
-                   short __q27, short __q26, short __q25, short __q24,
-                   short __q23, short __q22, short __q21, short __q20,
-                   short __q19, short __q18, short __q17, short __q16,
-                   short __q15, short __q14, short __q13, short __q12,
-                   short __q11, short __q10, short __q09, short __q08,
-                   short __q07, short __q06, short __q05, short __q04,
-                   short __q03, short __q02, short __q01, short __q00)
- {
-   const __v32hi __lanes = __extension__ (__v32hi)
-     { __q00, __q01, __q02, __q03, __q04, __q05, __q06, __q07,
-       __q08, __q09, __q10, __q11, __q12, __q13, __q14, __q15,
-       __q16, __q17, __q18, __q19, __q20, __q21, __q22, __q23,
-       __q24, __q25, __q26, __q27, __q28, __q29, __q30, __q31 };
-   return (__m512i) __lanes;
- }
- /* Build a vector of sixty-four 8-bit integers.  Parameters are declared
-    from __q63 down to __q00; the initializer lists them from __q00 up, so
-    __qNN becomes element NN. */
- extern __inline __m512i
- __attribute__((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_epi8 (char __q63, char __q62, char __q61, char __q60,
-                  char __q59, char __q58, char __q57, char __q56,
-                  char __q55, char __q54, char __q53, char __q52,
-                  char __q51, char __q50, char __q49, char __q48,
-                  char __q47, char __q46, char __q45, char __q44,
-                  char __q43, char __q42, char __q41, char __q40,
-                  char __q39, char __q38, char __q37, char __q36,
-                  char __q35, char __q34, char __q33, char __q32,
-                  char __q31, char __q30, char __q29, char __q28,
-                  char __q27, char __q26, char __q25, char __q24,
-                  char __q23, char __q22, char __q21, char __q20,
-                  char __q19, char __q18, char __q17, char __q16,
-                  char __q15, char __q14, char __q13, char __q12,
-                  char __q11, char __q10, char __q09, char __q08,
-                  char __q07, char __q06, char __q05, char __q04,
-                  char __q03, char __q02, char __q01, char __q00)
- {
-   const __v64qi __lanes = __extension__ (__v64qi)
-     { __q00, __q01, __q02, __q03, __q04, __q05, __q06, __q07,
-       __q08, __q09, __q10, __q11, __q12, __q13, __q14, __q15,
-       __q16, __q17, __q18, __q19, __q20, __q21, __q22, __q23,
-       __q24, __q25, __q26, __q27, __q28, __q29, __q30, __q31,
-       __q32, __q33, __q34, __q35, __q36, __q37, __q38, __q39,
-       __q40, __q41, __q42, __q43, __q44, __q45, __q46, __q47,
-       __q48, __q49, __q50, __q51, __q52, __q53, __q54, __q55,
-       __q56, __q57, __q58, __q59, __q60, __q61, __q62, __q63 };
-   return (__m512i) __lanes;
- }
- /* Build a vector of eight doubles.  The initializer lists the arguments in
-    reverse, so __H becomes element 0 and __A element 7. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_pd (double __A, double __B, double __C, double __D,
-                double __E, double __F, double __G, double __H)
- {
-   const __m512d __lanes = __extension__ (__m512d)
-     { __H, __G, __F, __E, __D, __C, __B, __A };
-   return __lanes;
- }
- /* Build a vector of sixteen floats.  The initializer lists the arguments in
-    reverse, so __P becomes element 0 and __A element 15. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set_ps (float __A, float __B, float __C, float __D,
-                float __E, float __F, float __G, float __H,
-                float __I, float __J, float __K, float __L,
-                float __M, float __N, float __O, float __P)
- {
-   const __m512 __lanes = __extension__ (__m512)
-     { __P, __O, __N, __M, __L, __K, __J, __I,
-       __H, __G, __F, __E, __D, __C, __B, __A };
-   return __lanes;
- }
- /* "setr" forms: each macro forwards its arguments to the matching
-    _mm512_set_* function with the argument order reversed. */
- #define _mm512_setr_epi64(v0, v1, v2, v3, v4, v5, v6, v7) \
-   _mm512_set_epi64 (v7, v6, v5, v4, v3, v2, v1, v0)
- #define _mm512_setr_epi32(v0, v1, v2, v3, v4, v5, v6, v7, \
-                           v8, v9, v10, v11, v12, v13, v14, v15) \
-   _mm512_set_epi32 (v15, v14, v13, v12, v11, v10, v9, v8, \
-                     v7, v6, v5, v4, v3, v2, v1, v0)
- #define _mm512_setr_pd(v0, v1, v2, v3, v4, v5, v6, v7) \
-   _mm512_set_pd (v7, v6, v5, v4, v3, v2, v1, v0)
- #define _mm512_setr_ps(v0, v1, v2, v3, v4, v5, v6, v7, \
-                        v8, v9, v10, v11, v12, v13, v14, v15) \
-   _mm512_set_ps (v15, v14, v13, v12, v11, v10, v9, v8, \
-                  v7, v6, v5, v4, v3, v2, v1, v0)
- /* Return a __m512 whose contents are unspecified: __Y is initialised from
-    itself and never given a value.  NOTE(review): the self-initialisation
-    presumably exists to avoid an uninitialised-variable warning -- confirm. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_undefined_ps (void)
- {
- __m512 __Y = __Y;
- return __Y;
- }
- /* _mm512_undefined is an alias for _mm512_undefined_ps. */
- #define _mm512_undefined _mm512_undefined_ps
- /* Return a __m512d whose contents are unspecified: __Y is initialised from
-    itself and never given a value.  NOTE(review): the self-initialisation
-    presumably exists to avoid an uninitialised-variable warning -- confirm. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_undefined_pd (void)
- {
- __m512d __Y = __Y;
- return __Y;
- }
- /* Return a __m512i whose contents are unspecified: __Y is initialised from
-    itself and never given a value.  NOTE(review): the self-initialisation
-    presumably exists to avoid an uninitialised-variable warning -- confirm. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_undefined_epi32 (void)
- {
- __m512i __Y = __Y;
- return __Y;
- }
- /* _mm512_undefined_si512 is an alias for _mm512_undefined_epi32. */
- #define _mm512_undefined_si512 _mm512_undefined_epi32
- /* Build a vector whose sixty-four 8-bit elements all equal __A. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_epi8 (char __A)
- {
-   const __v64qi __splat = __extension__ (__v64qi)
-     { __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A };
-   return (__m512i) __splat;
- }
- /* Build a vector whose thirty-two 16-bit elements all equal __A. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_epi16 (short __A)
- {
-   const __v32hi __splat = __extension__ (__v32hi)
-     { __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A,
-       __A, __A, __A, __A, __A, __A, __A, __A };
-   return (__m512i) __splat;
- }
- /* Broadcast wrapper for doubles: puts __A in element 0 of a __v2df and
-    passes it to __builtin_ia32_broadcastsd512 together with an undefined
-    vector and an all-ones mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_pd (double __A)
- {
-   const __v2df __low = __extension__ (__v2df) { __A, };
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_broadcastsd512 (__low, __undef,
-                                                   (__mmask8) -1);
- }
- /* Broadcast wrapper for floats: puts __A in element 0 of a __v4sf and
-    passes it to __builtin_ia32_broadcastss512 together with an undefined
-    vector and an all-ones mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_ps (float __A)
- {
-   const __v4sf __low = __extension__ (__v4sf) { __A, };
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_broadcastss512 (__low, __undef,
-                                                  (__mmask16) -1);
- }
- /* Build a vector of sixteen 32-bit integers by repeating the group
-    { __D, __C, __B, __A } four times, starting at element 0. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set4_epi32 (int __A, int __B, int __C, int __D)
- {
-   const __v16si __lanes = __extension__ (__v16si)
-     { __D, __C, __B, __A, __D, __C, __B, __A,
-       __D, __C, __B, __A, __D, __C, __B, __A };
-   return (__m512i) __lanes;
- }
- /* Build a vector of eight 64-bit integers by repeating the group
-    { __D, __C, __B, __A } twice, starting at element 0. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set4_epi64 (long long __A, long long __B, long long __C,
-                    long long __D)
- {
-   const __v8di __lanes = __extension__ (__v8di)
-     { __D, __C, __B, __A, __D, __C, __B, __A };
-   return (__m512i) __lanes;
- }
- /* Build a vector of eight doubles by repeating the group
-    { __D, __C, __B, __A } twice, starting at element 0. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set4_pd (double __A, double __B, double __C, double __D)
- {
-   const __m512d __lanes = __extension__ (__m512d)
-     { __D, __C, __B, __A, __D, __C, __B, __A };
-   return __lanes;
- }
- /* Build a vector of sixteen floats by repeating the group
-    { __D, __C, __B, __A } four times, starting at element 0. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set4_ps (float __A, float __B, float __C, float __D)
- {
-   const __m512 __lanes = __extension__ (__m512)
-     { __D, __C, __B, __A, __D, __C, __B, __A,
-       __D, __C, __B, __A, __D, __C, __B, __A };
-   return __lanes;
- }
- /* "setr4" forms: each macro forwards its four arguments to the matching
-    _mm512_set4_* function with the argument order reversed. */
- #define _mm512_setr4_epi64(v0, v1, v2, v3) \
-   _mm512_set4_epi64 (v3, v2, v1, v0)
- #define _mm512_setr4_epi32(v0, v1, v2, v3) \
-   _mm512_set4_epi32 (v3, v2, v1, v0)
- #define _mm512_setr4_pd(v0, v1, v2, v3) \
-   _mm512_set4_pd (v3, v2, v1, v0)
- #define _mm512_setr4_ps(v0, v1, v2, v3) \
-   _mm512_set4_ps (v3, v2, v1, v0)
- /* Return a vector of sixteen floats, every element 0.0. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_setzero_ps (void)
- {
-   const __m512 __zero = __extension__ (__m512)
-     { 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0,
-       0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
-   return __zero;
- }
- /* Same result as _mm512_setzero_ps (), which this simply calls. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_setzero (void)
- {
-   const __m512 __zero = _mm512_setzero_ps ();
-   return __zero;
- }
- /* Return a vector of eight doubles, every element 0.0. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_setzero_pd (void)
- {
-   const __m512d __zero = __extension__ (__m512d)
-     { 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0 };
-   return __zero;
- }
- /* Return an all-zero integer vector, built as eight zero 64-bit elements. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_setzero_epi32 (void)
- {
-   const __v8di __zero = __extension__ (__v8di) { 0, 0, 0, 0, 0, 0, 0, 0 };
-   return (__m512i) __zero;
- }
- /* Return an all-zero integer vector, built as eight zero 64-bit elements. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_setzero_si512 (void)
- {
-   const __v8di __zero = __extension__ (__v8di) { 0, 0, 0, 0, 0, 0, 0, 0 };
-   return (__m512i) __zero;
- }
- /* Masked move of doubles: passes __A, __W and the mask __U to
-    __builtin_ia32_movapd512_mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mov_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __fallback = (__v8df) __W;
-   return (__m512d) __builtin_ia32_movapd512_mask (__src, __fallback,
-                                                   (__mmask8) __U);
- }
- /* Zero-masked move of doubles: passes __A, an all-zero vector and the mask
-    __U to __builtin_ia32_movapd512_mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mov_pd (__mmask8 __U, __m512d __A)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_movapd512_mask (__src, __zero,
-                                                   (__mmask8) __U);
- }
- /* Masked move of floats: passes __A, __W and the mask __U to
-    __builtin_ia32_movaps512_mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mov_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
-   const __v16sf __src = (__v16sf) __A;
-   const __v16sf __fallback = (__v16sf) __W;
-   return (__m512) __builtin_ia32_movaps512_mask (__src, __fallback,
-                                                  (__mmask16) __U);
- }
- /* Zero-masked move of floats: passes __A, an all-zero vector and the mask
-    __U to __builtin_ia32_movaps512_mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mov_ps (__mmask16 __U, __m512 __A)
- {
-   const __v16sf __src = (__v16sf) __A;
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_movaps512_mask (__src, __zero,
-                                                  (__mmask16) __U);
- }
- /* Load a whole __m512d from __P by dereferencing it as a vector pointer.
-    The cast keeps the const qualifier of __P (the original cast dropped it),
-    matching the (const __v8df *) cast used by the masked loads. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_load_pd (void const *__P)
- {
-   return *(const __m512d *) __P;
- }
- /* Masked load of doubles: passes the address __P, the vector __W and the
-    mask __U to __builtin_ia32_loadapd512_mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_load_pd (__m512d __W, __mmask8 __U, void const *__P)
- {
-   const __v8df *__src = (const __v8df *) __P;
-   const __v8df __fallback = (__v8df) __W;
-   return (__m512d) __builtin_ia32_loadapd512_mask (__src, __fallback,
-                                                    (__mmask8) __U);
- }
- /* Zero-masked load of doubles: passes the address __P, an all-zero vector
-    and the mask __U to __builtin_ia32_loadapd512_mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_load_pd (__mmask8 __U, void const *__P)
- {
-   const __v8df *__src = (const __v8df *) __P;
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_loadapd512_mask (__src, __zero,
-                                                    (__mmask8) __U);
- }
- /* Store the whole vector __A to __P by assigning through a __m512d
-    pointer. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_store_pd (void *__P, __m512d __A)
- {
-   __m512d *__dst = (__m512d *) __P;
-   *__dst = __A;
- }
- /* Masked store of doubles: passes the address __P, the vector __A and the
-    mask __U to __builtin_ia32_storeapd512_mask. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_store_pd (void *__P, __mmask8 __U, __m512d __A)
- {
-   __v8df *__dst = (__v8df *) __P;
-   const __v8df __value = (__v8df) __A;
-   __builtin_ia32_storeapd512_mask (__dst, __value, (__mmask8) __U);
- }
- /* Load a whole __m512 from __P by dereferencing it as a vector pointer.
-    The cast keeps the const qualifier of __P (the original cast dropped it),
-    matching the (const __v16sf *) cast used by the masked loads. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_load_ps (void const *__P)
- {
-   return *(const __m512 *) __P;
- }
- /* Masked load of floats: passes the address __P, the vector __W and the
-    mask __U to __builtin_ia32_loadaps512_mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_load_ps (__m512 __W, __mmask16 __U, void const *__P)
- {
-   const __v16sf *__src = (const __v16sf *) __P;
-   const __v16sf __fallback = (__v16sf) __W;
-   return (__m512) __builtin_ia32_loadaps512_mask (__src, __fallback,
-                                                   (__mmask16) __U);
- }
- /* Zero-masked load of floats: passes the address __P, an all-zero vector
-    and the mask __U to __builtin_ia32_loadaps512_mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_load_ps (__mmask16 __U, void const *__P)
- {
-   const __v16sf *__src = (const __v16sf *) __P;
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_loadaps512_mask (__src, __zero,
-                                                   (__mmask16) __U);
- }
- /* Store the whole vector __A to __P by assigning through a __m512
-    pointer. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_store_ps (void *__P, __m512 __A)
- {
-   __m512 *__dst = (__m512 *) __P;
-   *__dst = __A;
- }
- /* Masked store of floats: passes the address __P, the vector __A and the
-    mask __U to __builtin_ia32_storeaps512_mask. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_store_ps (void *__P, __mmask16 __U, __m512 __A)
- {
-   __v16sf *__dst = (__v16sf *) __P;
-   const __v16sf __value = (__v16sf) __A;
-   __builtin_ia32_storeaps512_mask (__dst, __value, (__mmask16) __U);
- }
- /* Masked move of 64-bit integers: passes __A, __W and the mask __U to
-    __builtin_ia32_movdqa64_512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mov_epi64 (__m512i __W, __mmask8 __U, __m512i __A)
- {
-   const __v8di __src = (__v8di) __A;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_movdqa64_512_mask (__src, __fallback,
-                                                      (__mmask8) __U);
- }
- /* Zero-masked move of 64-bit integers: passes __A, an all-zero vector and
-    the mask __U to __builtin_ia32_movdqa64_512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mov_epi64 (__mmask8 __U, __m512i __A)
- {
-   const __v8di __src = (__v8di) __A;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_movdqa64_512_mask (__src, __zero,
-                                                      (__mmask8) __U);
- }
- /* Load a whole __m512i from __P by dereferencing it as a vector pointer.
-    The cast keeps the const qualifier of __P (the original cast dropped it),
-    matching the (const __v8di *) cast used by the masked loads. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_load_epi64 (void const *__P)
- {
-   return *(const __m512i *) __P;
- }
- /* Masked load of 64-bit integers: passes the address __P, the vector __W
-    and the mask __U to __builtin_ia32_movdqa64load512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_load_epi64 (__m512i __W, __mmask8 __U, void const *__P)
- {
-   const __v8di *__src = (const __v8di *) __P;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_movdqa64load512_mask (__src, __fallback,
-                                                         (__mmask8) __U);
- }
- /* Zero-masked load of 64-bit integers: passes the address __P, an all-zero
-    vector and the mask __U to __builtin_ia32_movdqa64load512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_load_epi64 (__mmask8 __U, void const *__P)
- {
-   const __v8di *__src = (const __v8di *) __P;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_movdqa64load512_mask (__src, __zero,
-                                                         (__mmask8) __U);
- }
- /* Store the whole vector __A to __P by assigning through a __m512i
-    pointer. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_store_epi64 (void *__P, __m512i __A)
- {
-   __m512i *__dst = (__m512i *) __P;
-   *__dst = __A;
- }
- /* Masked store of 64-bit integers: passes the address __P, the vector __A
-    and the mask __U to __builtin_ia32_movdqa64store512_mask. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_store_epi64 (void *__P, __mmask8 __U, __m512i __A)
- {
-   __v8di *__dst = (__v8di *) __P;
-   const __v8di __value = (__v8di) __A;
-   __builtin_ia32_movdqa64store512_mask (__dst, __value, (__mmask8) __U);
- }
- /* Masked move of 32-bit integers: passes __A, __W and the mask __U to
-    __builtin_ia32_movdqa32_512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mov_epi32 (__m512i __W, __mmask16 __U, __m512i __A)
- {
-   const __v16si __src = (__v16si) __A;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_movdqa32_512_mask (__src, __fallback,
-                                                      (__mmask16) __U);
- }
- /* Zero-masked move of 32-bit integers: passes __A, an all-zero vector and
-    the mask __U to __builtin_ia32_movdqa32_512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mov_epi32 (__mmask16 __U, __m512i __A)
- {
-   const __v16si __src = (__v16si) __A;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_movdqa32_512_mask (__src, __zero,
-                                                      (__mmask16) __U);
- }
- /* Load a whole __m512i from __P by dereferencing it as a vector pointer.
-    The cast keeps the const qualifier of __P (the original cast dropped it),
-    matching the const-qualified casts used by the masked loads. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_load_si512 (void const *__P)
- {
-   return *(const __m512i *) __P;
- }
- /* Load a whole __m512i from __P by dereferencing it as a vector pointer.
-    The cast keeps the const qualifier of __P (the original cast dropped it),
-    matching the (const __v16si *) cast used by the masked loads. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_load_epi32 (void const *__P)
- {
-   return *(const __m512i *) __P;
- }
- /* Masked load of 32-bit integers: passes the address __P, the vector __W
-    and the mask __U to __builtin_ia32_movdqa32load512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_load_epi32 (__m512i __W, __mmask16 __U, void const *__P)
- {
-   const __v16si *__src = (const __v16si *) __P;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_movdqa32load512_mask (__src, __fallback,
-                                                         (__mmask16) __U);
- }
- /* Zero-masked load of 32-bit integers: passes the address __P, an all-zero
-    vector and the mask __U to __builtin_ia32_movdqa32load512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_load_epi32 (__mmask16 __U, void const *__P)
- {
-   const __v16si *__src = (const __v16si *) __P;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_movdqa32load512_mask (__src, __zero,
-                                                         (__mmask16) __U);
- }
- /* Store the whole vector __A to __P by assigning through a __m512i
-    pointer. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_store_si512 (void *__P, __m512i __A)
- {
-   __m512i *__dst = (__m512i *) __P;
-   *__dst = __A;
- }
- /* Store the whole vector __A to __P by assigning through a __m512i
-    pointer. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_store_epi32 (void *__P, __m512i __A)
- {
-   __m512i *__dst = (__m512i *) __P;
-   *__dst = __A;
- }
- /* Masked store of 32-bit integers: passes the address __P, the vector __A
-    and the mask __U to __builtin_ia32_movdqa32store512_mask. */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_store_epi32 (void *__P, __mmask16 __U, __m512i __A)
- {
-   __v16si *__dst = (__v16si *) __P;
-   const __v16si __value = (__v16si) __A;
-   __builtin_ia32_movdqa32store512_mask (__dst, __value, (__mmask16) __U);
- }
- /* Element-wise product of __A and __B, computed on their unsigned 32-bit
-    element views (__v16su). */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mullo_epi32 (__m512i __A, __m512i __B)
- {
-   const __v16su __lhs = (__v16su) __A;
-   const __v16su __rhs = (__v16su) __B;
-   return (__m512i) (__lhs * __rhs);
- }
- /* Zero-masked 32-bit multiply: passes __A, __B, an all-zero vector and the
-    mask __M to __builtin_ia32_pmulld512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mullo_epi32 (__mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmulld512_mask (__lhs, __rhs, __zero, __M);
- }
- /* Masked 32-bit multiply: passes __A, __B, the vector __W and the mask __M
-    to __builtin_ia32_pmulld512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mullo_epi32 (__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmulld512_mask (__lhs, __rhs, __fallback,
-                                                   __M);
- }
- /* Element-wise product of __A and __B, computed on their unsigned 64-bit
-    element views (__v8du). */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mullox_epi64 (__m512i __A, __m512i __B)
- {
-   const __v8du __lhs = (__v8du) __A;
-   const __v8du __rhs = (__v8du) __B;
-   return (__m512i) (__lhs * __rhs);
- }
- /* Masked 64-bit multiply: computes _mm512_mullox_epi64 (__A, __B) and hands
-    the product, __W and the mask __M to _mm512_mask_mov_epi64. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mullox_epi64 (__m512i __W, __mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __m512i __product = _mm512_mullox_epi64 (__A, __B);
-   return _mm512_mask_mov_epi64 (__W, __M, __product);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psllv16si_mask
-    with an undefined third operand and an all-ones mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sllv_epi32 (__m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_psllv16si_mask (__value, __count, __undef,
-                                                   (__mmask16) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psllv16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sllv_epi32 (__m512i __W, __mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_psllv16si_mask (__value, __count,
-                                                   __fallback,
-                                                   (__mmask16) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psllv16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sllv_epi32 (__mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psllv16si_mask (__value, __count, __zero,
-                                                   (__mmask16) __U);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psrav16si_mask
-    with an undefined third operand and an all-ones mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srav_epi32 (__m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_psrav16si_mask (__value, __count, __undef,
-                                                   (__mmask16) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psrav16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srav_epi32 (__m512i __W, __mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_psrav16si_mask (__value, __count,
-                                                   __fallback,
-                                                   (__mmask16) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psrav16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srav_epi32 (__mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psrav16si_mask (__value, __count, __zero,
-                                                   (__mmask16) __U);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psrlv16si_mask
-    with an undefined third operand and an all-ones mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srlv_epi32 (__m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_psrlv16si_mask (__value, __count, __undef,
-                                                   (__mmask16) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psrlv16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srlv_epi32 (__m512i __W, __mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __fallback = (__v16si) __W;
-   return (__m512i) __builtin_ia32_psrlv16si_mask (__value, __count,
-                                                   __fallback,
-                                                   (__mmask16) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psrlv16si_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srlv_epi32 (__mmask16 __U, __m512i __X, __m512i __Y)
- {
-   const __v16si __value = (__v16si) __X;
-   const __v16si __count = (__v16si) __Y;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psrlv16si_mask (__value, __count, __zero,
-                                                   (__mmask16) __U);
- }
- /* Element-wise sum of __A and __B, computed on their unsigned 64-bit
-    element views (__v8du). */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_epi64 (__m512i __A, __m512i __B)
- {
-   const __v8du __lhs = (__v8du) __A;
-   const __v8du __rhs = (__v8du) __B;
-   return (__m512i) (__lhs + __rhs);
- }
- /* Masked 64-bit add: passes __A, __B, the vector __W and the mask __U to
-    __builtin_ia32_paddq512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_paddq512_mask (__lhs, __rhs, __fallback,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked 64-bit add: passes __A, __B, an all-zero vector and the mask
-    __U to __builtin_ia32_paddq512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_paddq512_mask (__lhs, __rhs, __zero,
-                                                  (__mmask8) __U);
- }
- /* Element-wise difference __A - __B, computed on their unsigned 64-bit
-    element views (__v8du). */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_epi64 (__m512i __A, __m512i __B)
- {
-   const __v8du __lhs = (__v8du) __A;
-   const __v8du __rhs = (__v8du) __B;
-   return (__m512i) (__lhs - __rhs);
- }
- /* Masked 64-bit subtract: passes __A, __B, the vector __W and the mask __U
-    to __builtin_ia32_psubq512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_psubq512_mask (__lhs, __rhs, __fallback,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked 64-bit subtract: passes __A, __B, an all-zero vector and the
-    mask __U to __builtin_ia32_psubq512_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psubq512_mask (__lhs, __rhs, __zero,
-                                                  (__mmask8) __U);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psllv8di_mask with
-    an undefined third operand and an all-ones mask.  The undefined operand
-    now comes from the integer helper _mm512_undefined_epi32 (), as in the
-    64-bit srav/srlv wrappers, instead of the floating-point
-    _mm512_undefined_pd (). */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sllv_epi64 (__m512i __X, __m512i __Y)
- {
-   return (__m512i) __builtin_ia32_psllv8di_mask ((__v8di) __X,
-                                                  (__v8di) __Y,
-                                                  (__v8di)
-                                                  _mm512_undefined_epi32 (),
-                                                  (__mmask8) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psllv8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sllv_epi64 (__m512i __W, __mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_psllv8di_mask (__value, __count,
-                                                  __fallback,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psllv8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sllv_epi64 (__mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psllv8di_mask (__value, __count, __zero,
-                                                  (__mmask8) __U);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psrav8di_mask with
-    an undefined third operand and an all-ones mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srav_epi64 (__m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_psrav8di_mask (__value, __count, __undef,
-                                                  (__mmask8) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psrav8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srav_epi64 (__m512i __W, __mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_psrav8di_mask (__value, __count,
-                                                  __fallback,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psrav8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srav_epi64 (__mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psrav8di_mask (__value, __count, __zero,
-                                                  (__mmask8) __U);
- }
- /* Unmasked wrapper: passes __X and __Y to __builtin_ia32_psrlv8di_mask with
-    an undefined third operand and an all-ones mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srlv_epi64 (__m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_psrlv8di_mask (__value, __count, __undef,
-                                                  (__mmask8) -1);
- }
- /* Masked wrapper: passes __X, __Y, the vector __W and the mask __U to
-    __builtin_ia32_psrlv8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srlv_epi64 (__m512i __W, __mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __fallback = (__v8di) __W;
-   return (__m512i) __builtin_ia32_psrlv8di_mask (__value, __count,
-                                                  __fallback,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked wrapper: passes __X, __Y, an all-zero vector and the mask __U
-    to __builtin_ia32_psrlv8di_mask. */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srlv_epi64 (__mmask8 __U, __m512i __X, __m512i __Y)
- {
-   const __v8di __value = (__v8di) __X;
-   const __v8di __count = (__v8di) __Y;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_psrlv8di_mask (__value, __count, __zero,
-                                                  (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) ((__v16su) __A + (__v16su) __B);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_paddd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_paddd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_epi32 (__m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_epi32 (__m512i __W, __mmask8 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di) __W, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_epi32 (__mmask8 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuldq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di)
- _mm512_setzero_si512 (),
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) ((__v16su) __A - (__v16su) __B);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_psubd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_psubd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_epu32 (__m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_epu32 (__m512i __W, __mmask8 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di) __W, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_epu32 (__mmask8 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_pmuludq512_mask ((__v16si) __X,
- (__v16si) __Y,
- (__v8di)
- _mm512_setzero_si512 (),
- __M);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the psllqi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_slli_epi64 (__m512i __A, unsigned int __B)
{
  __v8di __undef = (__v8di) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_psllqi512_mask ((__v8di) __A, __B, __undef,
                                                  (__mmask8) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_slli_epi64 (__m512i __W, __mmask8 __U, __m512i __A,
                        unsigned int __B)
{
  __v8di __in = (__v8di) __A;

  return (__m512i) __builtin_ia32_psllqi512_mask (__in, __B, (__v8di) __W,
                                                  (__mmask8) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_slli_epi64 (__mmask8 __U, __m512i __A, unsigned int __B)
{
  __v8di __zero = (__v8di) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_psllqi512_mask ((__v8di) __A, __B, __zero,
                                                  (__mmask8) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_slli_epi64(X, C) \
  ((__m512i) __builtin_ia32_psllqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask8) -1))
#define _mm512_mask_slli_epi64(W, U, X, C) \
  ((__m512i) __builtin_ia32_psllqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) (W), \
     (__mmask8) (U)))
#define _mm512_maskz_slli_epi64(U, X, C) \
  ((__m512i) __builtin_ia32_psllqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_setzero_si512 (), \
     (__mmask8) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sll_epi64 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psllq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sll_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psllq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sll_epi64 (__mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psllq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the psrlqi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_srli_epi64 (__m512i __A, unsigned int __B)
{
  __v8di __undef = (__v8di) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_psrlqi512_mask ((__v8di) __A, __B, __undef,
                                                  (__mmask8) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_srli_epi64 (__m512i __W, __mmask8 __U,
                        __m512i __A, unsigned int __B)
{
  __v8di __in = (__v8di) __A;

  return (__m512i) __builtin_ia32_psrlqi512_mask (__in, __B, (__v8di) __W,
                                                  (__mmask8) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_srli_epi64 (__mmask8 __U, __m512i __A, unsigned int __B)
{
  __v8di __zero = (__v8di) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_psrlqi512_mask ((__v8di) __A, __B, __zero,
                                                  (__mmask8) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_srli_epi64(X, C) \
  ((__m512i) __builtin_ia32_psrlqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask8) -1))
#define _mm512_mask_srli_epi64(W, U, X, C) \
  ((__m512i) __builtin_ia32_psrlqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) (W), \
     (__mmask8) (U)))
#define _mm512_maskz_srli_epi64(U, X, C) \
  ((__m512i) __builtin_ia32_psrlqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_setzero_si512 (), \
     (__mmask8) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srl_epi64 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrlq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srl_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrlq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srl_epi64 (__mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrlq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the psraqi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_srai_epi64 (__m512i __A, unsigned int __B)
{
  __v8di __undef = (__v8di) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_psraqi512_mask ((__v8di) __A, __B, __undef,
                                                  (__mmask8) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_srai_epi64 (__m512i __W, __mmask8 __U, __m512i __A,
                        unsigned int __B)
{
  __v8di __in = (__v8di) __A;

  return (__m512i) __builtin_ia32_psraqi512_mask (__in, __B, (__v8di) __W,
                                                  (__mmask8) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_srai_epi64 (__mmask8 __U, __m512i __A, unsigned int __B)
{
  __v8di __zero = (__v8di) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_psraqi512_mask ((__v8di) __A, __B, __zero,
                                                  (__mmask8) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_srai_epi64(X, C) \
  ((__m512i) __builtin_ia32_psraqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask8) -1))
#define _mm512_mask_srai_epi64(W, U, X, C) \
  ((__m512i) __builtin_ia32_psraqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) (W), \
     (__mmask8) (U)))
#define _mm512_maskz_srai_epi64(U, X, C) \
  ((__m512i) __builtin_ia32_psraqi512_mask ( \
     (__v8di) (__m512i) (X), (int) (C), \
     (__v8di) (__m512i) _mm512_setzero_si512 (), \
     (__mmask8) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sra_epi64 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psraq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sra_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psraq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sra_epi64 (__mmask8 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psraq512_mask ((__v8di) __A,
- (__v2di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the pslldi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_slli_epi32 (__m512i __A, unsigned int __B)
{
  __v16si __undef = (__v16si) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_pslldi512_mask ((__v16si) __A, __B,
                                                  __undef, (__mmask16) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_slli_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
                        unsigned int __B)
{
  __v16si __in = (__v16si) __A;

  return (__m512i) __builtin_ia32_pslldi512_mask (__in, __B, (__v16si) __W,
                                                  (__mmask16) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_slli_epi32 (__mmask16 __U, __m512i __A, unsigned int __B)
{
  __v16si __zero = (__v16si) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_pslldi512_mask ((__v16si) __A, __B,
                                                  __zero, (__mmask16) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_slli_epi32(X, C) \
  ((__m512i) __builtin_ia32_pslldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask16) -1))
#define _mm512_mask_slli_epi32(W, U, X, C) \
  ((__m512i) __builtin_ia32_pslldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) (W), \
     (__mmask16) (U)))
#define _mm512_maskz_slli_epi32(U, X, C) \
  ((__m512i) __builtin_ia32_pslldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_setzero_si512 (), \
     (__mmask16) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sll_epi32 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_pslld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sll_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_pslld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sll_epi32 (__mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_pslld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the psrldi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_srli_epi32 (__m512i __A, unsigned int __B)
{
  __v16si __undef = (__v16si) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_psrldi512_mask ((__v16si) __A, __B,
                                                  __undef, (__mmask16) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_srli_epi32 (__m512i __W, __mmask16 __U,
                        __m512i __A, unsigned int __B)
{
  __v16si __in = (__v16si) __A;

  return (__m512i) __builtin_ia32_psrldi512_mask (__in, __B, (__v16si) __W,
                                                  (__mmask16) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_srli_epi32 (__mmask16 __U, __m512i __A, unsigned int __B)
{
  __v16si __zero = (__v16si) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_psrldi512_mask ((__v16si) __A, __B,
                                                  __zero, (__mmask16) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_srli_epi32(X, C) \
  ((__m512i) __builtin_ia32_psrldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask16) -1))
#define _mm512_mask_srli_epi32(W, U, X, C) \
  ((__m512i) __builtin_ia32_psrldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) (W), \
     (__mmask16) (U)))
#define _mm512_maskz_srli_epi32(U, X, C) \
  ((__m512i) __builtin_ia32_psrldi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_setzero_si512 (), \
     (__mmask16) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_srl_epi32 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_srl_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_srl_epi32 (__mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrld512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  The count __B is
   passed to the psradi512 builtin untouched.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_srai_epi32 (__m512i __A, unsigned int __B)
{
  __v16si __undef = (__v16si) _mm512_undefined_epi32 ();

  return (__m512i) __builtin_ia32_psradi512_mask ((__v16si) __A, __B,
                                                  __undef, (__mmask16) -1);
}

/* Masked form: __W is the third builtin operand, __U the mask.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_srai_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
                        unsigned int __B)
{
  __v16si __in = (__v16si) __A;

  return (__m512i) __builtin_ia32_psradi512_mask (__in, __B, (__v16si) __W,
                                                  (__mmask16) __U);
}

/* Zero-operand form: _mm512_setzero_si512 () is the third operand.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_srai_epi32 (__mmask16 __U, __m512i __A, unsigned int __B)
{
  __v16si __zero = (__v16si) _mm512_setzero_si512 ();

  return (__m512i) __builtin_ia32_psradi512_mask ((__v16si) __A, __B,
                                                  __zero, (__mmask16) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the count cast to int.
   NOTE(review): presumably macros are used so the count reaches the
   builtin as a literal without relying on inlining -- confirm.  */
#define _mm512_srai_epi32(X, C) \
  ((__m512i) __builtin_ia32_psradi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_undefined_epi32 (), \
     (__mmask16) -1))
#define _mm512_mask_srai_epi32(W, U, X, C) \
  ((__m512i) __builtin_ia32_psradi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) (W), \
     (__mmask16) (U)))
#define _mm512_maskz_srai_epi32(U, X, C) \
  ((__m512i) __builtin_ia32_psradi512_mask ( \
     (__v16si) (__m512i) (X), (int) (C), \
     (__v16si) (__m512i) _mm512_setzero_si512 (), \
     (__mmask16) (U)))
#endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sra_epi32 (__m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrad512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sra_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrad512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sra_epi32 (__mmask16 __U, __m512i __A, __m128i __B)
- {
- return (__m512i) __builtin_ia32_psrad512_mask ((__v16si) __A,
- (__v4si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
#ifdef __OPTIMIZE__
/* Inline forms of the scalar add/sub intrinsics that take an extra
   argument __R, selected when __OPTIMIZE__ is defined.  __R is always
   forwarded to the builtin untouched as its last argument.  The plain
   forms call the *_round builtins; the mask/maskz forms call the
   *_mask_round builtins with __W (or a zero vector) and the mask __U.  */

/* Plain double-precision add.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_add_round_sd (__m128d __A, __m128d __B, const int __R)
{
  return (__m128d) __builtin_ia32_addsd_round ((__v2df) __A,
                                               (__v2df) __B,
                                               __R);
}

/* Masked double-precision add: __W is the third builtin operand.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_mask_add_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
                       __m128d __B, const int __R)
{
  return (__m128d) __builtin_ia32_addsd_mask_round ((__v2df) __A,
                                                    (__v2df) __B,
                                                    (__v2df) __W,
                                                    (__mmask8) __U, __R);
}

/* Double-precision add with _mm_setzero_pd () as the third operand.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_maskz_add_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
                        const int __R)
{
  return (__m128d) __builtin_ia32_addsd_mask_round ((__v2df) __A,
                                                    (__v2df) __B,
                                                    (__v2df)
                                                    _mm_setzero_pd (),
                                                    (__mmask8) __U, __R);
}

/* Plain single-precision add.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_add_round_ss (__m128 __A, __m128 __B, const int __R)
{
  return (__m128) __builtin_ia32_addss_round ((__v4sf) __A,
                                              (__v4sf) __B,
                                              __R);
}

/* Masked single-precision add: __W is the third builtin operand.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_mask_add_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
                       __m128 __B, const int __R)
{
  return (__m128) __builtin_ia32_addss_mask_round ((__v4sf) __A,
                                                   (__v4sf) __B,
                                                   (__v4sf) __W,
                                                   (__mmask8) __U, __R);
}

/* Single-precision add with _mm_setzero_ps () as the third operand.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_maskz_add_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
                        const int __R)
{
  return (__m128) __builtin_ia32_addss_mask_round ((__v4sf) __A,
                                                   (__v4sf) __B,
                                                   (__v4sf)
                                                   _mm_setzero_ps (),
                                                   (__mmask8) __U, __R);
}

/* Plain double-precision subtract.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_sub_round_sd (__m128d __A, __m128d __B, const int __R)
{
  return (__m128d) __builtin_ia32_subsd_round ((__v2df) __A,
                                               (__v2df) __B,
                                               __R);
}

/* Masked double-precision subtract: __W is the third builtin operand.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_mask_sub_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
                       __m128d __B, const int __R)
{
  return (__m128d) __builtin_ia32_subsd_mask_round ((__v2df) __A,
                                                    (__v2df) __B,
                                                    (__v2df) __W,
                                                    (__mmask8) __U, __R);
}

/* Double-precision subtract with _mm_setzero_pd () as third operand.  */
extern __inline __m128d
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_maskz_sub_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
                        const int __R)
{
  return (__m128d) __builtin_ia32_subsd_mask_round ((__v2df) __A,
                                                    (__v2df) __B,
                                                    (__v2df)
                                                    _mm_setzero_pd (),
                                                    (__mmask8) __U, __R);
}

/* Plain single-precision subtract.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_sub_round_ss (__m128 __A, __m128 __B, const int __R)
{
  return (__m128) __builtin_ia32_subss_round ((__v4sf) __A,
                                              (__v4sf) __B,
                                              __R);
}

/* Masked single-precision subtract: __W is the third builtin operand.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_mask_sub_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
                       __m128 __B, const int __R)
{
  return (__m128) __builtin_ia32_subss_mask_round ((__v4sf) __A,
                                                   (__v4sf) __B,
                                                   (__v4sf) __W,
                                                   (__mmask8) __U, __R);
}

/* Single-precision subtract with _mm_setzero_ps () as third operand.  */
extern __inline __m128
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm_maskz_sub_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
                        const int __R)
{
  return (__m128) __builtin_ia32_subss_mask_round ((__v4sf) __A,
                                                   (__v4sf) __B,
                                                   (__v4sf)
                                                   _mm_setzero_ps (),
                                                   (__mmask8) __U, __R);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined.  Every expansion
   is wrapped in its own parentheses so that a postfix operator written
   after the macro (a subscript, for instance) applies to the cast result
   rather than to the builtin call, and every operand is cast the same way
   the inline definitions above cast theirs.  */
#define _mm_add_round_sd(A, B, C) \
  ((__m128d) __builtin_ia32_addsd_round ((__v2df)(__m128d)(A), \
                                         (__v2df)(__m128d)(B), \
                                         (int)(C)))
#define _mm_mask_add_round_sd(W, U, A, B, C) \
  ((__m128d) __builtin_ia32_addsd_mask_round ((__v2df)(__m128d)(A), \
                                              (__v2df)(__m128d)(B), \
                                              (__v2df)(__m128d)(W), \
                                              (__mmask8)(U), (int)(C)))
#define _mm_maskz_add_round_sd(U, A, B, C) \
  ((__m128d) __builtin_ia32_addsd_mask_round ((__v2df)(__m128d)(A), \
                                              (__v2df)(__m128d)(B), \
                                              (__v2df)_mm_setzero_pd (), \
                                              (__mmask8)(U), (int)(C)))
#define _mm_add_round_ss(A, B, C) \
  ((__m128) __builtin_ia32_addss_round ((__v4sf)(__m128)(A), \
                                        (__v4sf)(__m128)(B), \
                                        (int)(C)))
#define _mm_mask_add_round_ss(W, U, A, B, C) \
  ((__m128) __builtin_ia32_addss_mask_round ((__v4sf)(__m128)(A), \
                                             (__v4sf)(__m128)(B), \
                                             (__v4sf)(__m128)(W), \
                                             (__mmask8)(U), (int)(C)))
#define _mm_maskz_add_round_ss(U, A, B, C) \
  ((__m128) __builtin_ia32_addss_mask_round ((__v4sf)(__m128)(A), \
                                             (__v4sf)(__m128)(B), \
                                             (__v4sf)_mm_setzero_ps (), \
                                             (__mmask8)(U), (int)(C)))
#define _mm_sub_round_sd(A, B, C) \
  ((__m128d) __builtin_ia32_subsd_round ((__v2df)(__m128d)(A), \
                                         (__v2df)(__m128d)(B), \
                                         (int)(C)))
#define _mm_mask_sub_round_sd(W, U, A, B, C) \
  ((__m128d) __builtin_ia32_subsd_mask_round ((__v2df)(__m128d)(A), \
                                              (__v2df)(__m128d)(B), \
                                              (__v2df)(__m128d)(W), \
                                              (__mmask8)(U), (int)(C)))
#define _mm_maskz_sub_round_sd(U, A, B, C) \
  ((__m128d) __builtin_ia32_subsd_mask_round ((__v2df)(__m128d)(A), \
                                              (__v2df)(__m128d)(B), \
                                              (__v2df)_mm_setzero_pd (), \
                                              (__mmask8)(U), (int)(C)))
#define _mm_sub_round_ss(A, B, C) \
  ((__m128) __builtin_ia32_subss_round ((__v4sf)(__m128)(A), \
                                        (__v4sf)(__m128)(B), \
                                        (int)(C)))
#define _mm_mask_sub_round_ss(W, U, A, B, C) \
  ((__m128) __builtin_ia32_subss_mask_round ((__v4sf)(__m128)(A), \
                                             (__v4sf)(__m128)(B), \
                                             (__v4sf)(__m128)(W), \
                                             (__mmask8)(U), (int)(C)))
#define _mm_maskz_sub_round_ss(U, A, B, C) \
  ((__m128) __builtin_ia32_subss_mask_round ((__v4sf)(__m128)(A), \
                                             (__v4sf)(__m128)(B), \
                                             (__v4sf)_mm_setzero_ps (), \
                                             (__mmask8)(U), (int)(C)))
#endif
#ifdef __OPTIMIZE__
/* Inline forms, selected when __OPTIMIZE__ is defined.  __imm is passed
   to the builtin untouched.  The plain and mask forms call the
   pternlog*512_mask builtin (all-ones mask for the plain form); the maskz
   forms call the separate pternlog*512_maskz builtin.  */

/* 64-bit element, plain form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_ternarylogic_epi64 (__m512i __A, __m512i __B, __m512i __C,
                           const int __imm)
{
  __v8di __a = (__v8di) __A;
  __v8di __b = (__v8di) __B;
  __v8di __c = (__v8di) __C;

  return (__m512i) __builtin_ia32_pternlogq512_mask (__a, __b, __c, __imm,
                                                     (__mmask8) -1);
}

/* 64-bit element, mask form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_ternarylogic_epi64 (__m512i __A, __mmask8 __U, __m512i __B,
                                __m512i __C, const int __imm)
{
  __v8di __a = (__v8di) __A;
  __v8di __b = (__v8di) __B;
  __v8di __c = (__v8di) __C;

  return (__m512i) __builtin_ia32_pternlogq512_mask (__a, __b, __c, __imm,
                                                     (__mmask8) __U);
}

/* 64-bit element, maskz form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_ternarylogic_epi64 (__mmask8 __U, __m512i __A, __m512i __B,
                                 __m512i __C, const int __imm)
{
  __v8di __a = (__v8di) __A;
  __v8di __b = (__v8di) __B;
  __v8di __c = (__v8di) __C;

  return (__m512i) __builtin_ia32_pternlogq512_maskz (__a, __b, __c, __imm,
                                                      (__mmask8) __U);
}

/* 32-bit element, plain form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_ternarylogic_epi32 (__m512i __A, __m512i __B, __m512i __C,
                           const int __imm)
{
  __v16si __a = (__v16si) __A;
  __v16si __b = (__v16si) __B;
  __v16si __c = (__v16si) __C;

  return (__m512i) __builtin_ia32_pternlogd512_mask (__a, __b, __c, __imm,
                                                     (__mmask16) -1);
}

/* 32-bit element, mask form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_mask_ternarylogic_epi32 (__m512i __A, __mmask16 __U, __m512i __B,
                                __m512i __C, const int __imm)
{
  __v16si __a = (__v16si) __A;
  __v16si __b = (__v16si) __B;
  __v16si __c = (__v16si) __C;

  return (__m512i) __builtin_ia32_pternlogd512_mask (__a, __b, __c, __imm,
                                                     (__mmask16) __U);
}

/* 32-bit element, maskz form.  */
extern __inline __m512i
__attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
_mm512_maskz_ternarylogic_epi32 (__mmask16 __U, __m512i __A, __m512i __B,
                                 __m512i __C, const int __imm)
{
  __v16si __a = (__v16si) __A;
  __v16si __b = (__v16si) __B;
  __v16si __c = (__v16si) __C;

  return (__m512i) __builtin_ia32_pternlogd512_maskz (__a, __b, __c, __imm,
                                                      (__mmask16) __U);
}
#else
/* Macro forms, selected when __OPTIMIZE__ is not defined; they expand to
   the same builtin calls with the immediate cast to int.  */
#define _mm512_ternarylogic_epi64(A, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogq512_mask ( \
     (__v8di) (__m512i) (A), \
     (__v8di) (__m512i) (B), \
     (__v8di) (__m512i) (C), \
     (int) (I), (__mmask8) -1))
#define _mm512_mask_ternarylogic_epi64(A, U, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogq512_mask ( \
     (__v8di) (__m512i) (A), \
     (__v8di) (__m512i) (B), \
     (__v8di) (__m512i) (C), \
     (int) (I), (__mmask8) (U)))
#define _mm512_maskz_ternarylogic_epi64(U, A, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogq512_maskz ( \
     (__v8di) (__m512i) (A), \
     (__v8di) (__m512i) (B), \
     (__v8di) (__m512i) (C), \
     (int) (I), (__mmask8) (U)))
#define _mm512_ternarylogic_epi32(A, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogd512_mask ( \
     (__v16si) (__m512i) (A), \
     (__v16si) (__m512i) (B), \
     (__v16si) (__m512i) (C), \
     (int) (I), (__mmask16) -1))
#define _mm512_mask_ternarylogic_epi32(A, U, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogd512_mask ( \
     (__v16si) (__m512i) (A), \
     (__v16si) (__m512i) (B), \
     (__v16si) (__m512i) (C), \
     (int) (I), (__mmask16) (U)))
#define _mm512_maskz_ternarylogic_epi32(U, A, B, C, I) \
  ((__m512i) __builtin_ia32_pternlogd512_maskz ( \
     (__v16si) (__m512i) (A), \
     (__v16si) (__m512i) (B), \
     (__v16si) (__m512i) (C), \
     (int) (I), (__mmask16) (U)))
#endif
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rcp14_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_rcp14pd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rcp14_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_rcp14pd512_mask ((__v8df) __A,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rcp14_pd (__mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_rcp14pd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rcp14_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_rcp14ps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rcp14_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rcp14ps512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rcp14_ps (__mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rcp14ps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_rcp14_sd (__m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rcp14sd ((__v2df) __B,
- (__v2df) __A);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_rcp14_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rcp14sd_mask ((__v2df) __B,
- (__v2df) __A,
- (__v2df) __W,
- (__mmask8) __U);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_rcp14_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rcp14sd_mask ((__v2df) __B,
- (__v2df) __A,
- (__v2df) _mm_setzero_ps (),
- (__mmask8) __U);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_rcp14_ss (__m128 __A, __m128 __B)
- {
- return (__m128) __builtin_ia32_rcp14ss ((__v4sf) __B,
- (__v4sf) __A);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_rcp14_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- return (__m128) __builtin_ia32_rcp14ss_mask ((__v4sf) __B,
- (__v4sf) __A,
- (__v4sf) __W,
- (__mmask8) __U);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_rcp14_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- return (__m128) __builtin_ia32_rcp14ss_mask ((__v4sf) __B,
- (__v4sf) __A,
- (__v4sf) _mm_setzero_ps (),
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rsqrt14_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_rsqrt14pd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rsqrt14_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_rsqrt14pd512_mask ((__v8df) __A,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rsqrt14_pd (__mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_rsqrt14pd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rsqrt14_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_rsqrt14ps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rsqrt14_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rsqrt14ps512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rsqrt14_ps (__mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rsqrt14ps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_rsqrt14_sd (__m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rsqrt14sd ((__v2df) __B,
- (__v2df) __A);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_rsqrt14_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rsqrt14sd_mask ((__v2df) __B,
- (__v2df) __A,
- (__v2df) __W,
- (__mmask8) __U);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_rsqrt14_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_rsqrt14sd_mask ((__v2df) __B,
- (__v2df) __A,
- (__v2df) _mm_setzero_pd (),
- (__mmask8) __U);
- }
- /* Wrappers for __builtin_ia32_rsqrt14ss and __builtin_ia32_rsqrt14ss_mask.
-    Note the operand order: __B is handed to the builtin first, __A second.
-    The masked forms append a third vector (__W, or zero for maskz) and __U.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_rsqrt14_ss (__m128 __A, __m128 __B)
- {
-   const __v4sf __first = (__v4sf) __B;
-   const __v4sf __second = (__v4sf) __A;
-   return (__m128) __builtin_ia32_rsqrt14ss (__first, __second);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_rsqrt14_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __merge = (__v4sf) __W;
-   return (__m128) __builtin_ia32_rsqrt14ss_mask ((__v4sf) __B, (__v4sf) __A,
-       __merge, (__mmask8) __U);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_rsqrt14_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_rsqrt14ss_mask ((__v4sf) __B, (__v4sf) __A,
-       __zero, (__mmask8) __U);
- }
- #ifdef __OPTIMIZE__
- /* sqrt_round_pd family: all three forward to __builtin_ia32_sqrtpd512_mask
-    and pass __R through as the last operand.  They differ in the second
-    operand and mask: undefined vector with (__mmask8) -1, __W with __U,
-    or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sqrt_round_pd (__m512d __A, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_sqrtpd512_mask ((__v8df) __A, __undef,
-       (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sqrt_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_sqrtpd512_mask ((__v8df) __A, __merge,
-       (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sqrt_round_pd (__mmask8 __U, __m512d __A, const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_sqrtpd512_mask ((__v8df) __A, __zero,
-       (__mmask8) __U, __R);
- }
- /* sqrt_round_ps family: all three forward to __builtin_ia32_sqrtps512_mask
-    and pass __R through as the last operand.  They differ in the second
-    operand and mask: undefined vector with (__mmask16) -1, __W with __U,
-    or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sqrt_round_ps (__m512 __A, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_sqrtps512_mask ((__v16sf) __A, __undef,
-       (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sqrt_round_ps (__m512 __W, __mmask16 __U, __m512 __A, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_sqrtps512_mask ((__v16sf) __A, __merge,
-       (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sqrt_round_ps (__mmask16 __U, __m512 __A, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_sqrtps512_mask ((__v16sf) __A, __zero,
-       (__mmask16) __U, __R);
- }
- /* sqrt_round_sd family: wrappers for __builtin_ia32_sqrtsd_mask_round.
-    The builtin receives __B first and __A second, then a third vector
-    (zero for the plain and maskz forms, __W for the mask form), the mask
-    ((__mmask8) -1 for the plain form, otherwise __U) and finally __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_sqrt_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_sqrtsd_mask_round ((__v2df) __B,
-       (__v2df) __A, __zero, (__mmask8) -1, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_sqrt_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B,
-     const int __R)
- {
-   const __v2df __merge = (__v2df) __W;
-   return (__m128d) __builtin_ia32_sqrtsd_mask_round ((__v2df) __B,
-       (__v2df) __A, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_sqrt_round_sd (__mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_sqrtsd_mask_round ((__v2df) __B,
-       (__v2df) __A, __zero, (__mmask8) __U, __R);
- }
- /* sqrt_round_ss family: wrappers for __builtin_ia32_sqrtss_mask_round.
-    The builtin receives __B first and __A second, then a third vector
-    (zero for the plain and maskz forms, __W for the mask form), the mask
-    ((__mmask8) -1 for the plain form, otherwise __U) and finally __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_sqrt_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_sqrtss_mask_round ((__v4sf) __B,
-       (__v4sf) __A, __zero, (__mmask8) -1, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_sqrt_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B,
-     const int __R)
- {
-   const __v4sf __merge = (__v4sf) __W;
-   return (__m128) __builtin_ia32_sqrtss_mask_round ((__v4sf) __B,
-       (__v4sf) __A, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_sqrt_round_ss (__mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_sqrtss_mask_round ((__v4sf) __B,
-       (__v4sf) __A, __zero, (__mmask8) __U, __R);
- }
- #else
- /* Macro forms of the sqrt_round_pd family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_sqrt_round_pd(X, R) \
-   (__m512d) __builtin_ia32_sqrtpd512_mask (X, \
-     (__v8df) _mm512_undefined_pd (), -1, R)
- #define _mm512_mask_sqrt_round_pd(W, U, X, R) \
-   (__m512d) __builtin_ia32_sqrtpd512_mask (X, W, U, R)
- #define _mm512_maskz_sqrt_round_pd(U, X, R) \
-   (__m512d) __builtin_ia32_sqrtpd512_mask (X, \
-     (__v8df) _mm512_setzero_pd (), U, R)
- /* Macro forms of the sqrt_round_ps family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_sqrt_round_ps(X, R) \
-   (__m512) __builtin_ia32_sqrtps512_mask (X, \
-     (__v16sf) _mm512_undefined_ps (), -1, R)
- #define _mm512_mask_sqrt_round_ps(W, U, X, R) \
-   (__m512) __builtin_ia32_sqrtps512_mask (X, W, U, R)
- #define _mm512_maskz_sqrt_round_ps(U, X, R) \
-   (__m512) __builtin_ia32_sqrtps512_mask (X, \
-     (__v16sf) _mm512_setzero_ps (), U, R)
- /* Macro forms of the sqrt_round_sd family.  As in the inline versions,
-    the second macro vector argument (Y) is passed to the builtin first.  */
- #define _mm_sqrt_round_sd(X, Y, R) \
-   (__m128d) __builtin_ia32_sqrtsd_mask_round (Y, X, \
-     (__v2df) _mm_setzero_pd (), -1, R)
- #define _mm_mask_sqrt_round_sd(W, U, X, Y, R) \
-   (__m128d) __builtin_ia32_sqrtsd_mask_round (Y, X, W, U, R)
- #define _mm_maskz_sqrt_round_sd(U, X, Y, R) \
-   (__m128d) __builtin_ia32_sqrtsd_mask_round (Y, X, \
-     (__v2df) _mm_setzero_pd (), U, R)
- /* Macro forms of the sqrt_round_ss family.  As in the inline versions,
-    the second macro vector argument (Y) is passed to the builtin first.  */
- #define _mm_sqrt_round_ss(X, Y, R) \
-   (__m128) __builtin_ia32_sqrtss_mask_round (Y, X, \
-     (__v4sf) _mm_setzero_ps (), -1, R)
- #define _mm_mask_sqrt_round_ss(W, U, X, Y, R) \
-   (__m128) __builtin_ia32_sqrtss_mask_round (Y, X, W, U, R)
- #define _mm_maskz_sqrt_round_ss(U, X, Y, R) \
-   (__m128) __builtin_ia32_sqrtss_mask_round (Y, X, \
-     (__v4sf) _mm_setzero_ps (), U, R)
- #endif
- /* cvtepi8_epi32 family: wrappers for __builtin_ia32_pmovsxbd512_mask.
-    __A is passed as __v16qi; the second operand / mask are an undefined
-    vector with (__mmask16) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi8_epi32 (__m128i __A)
- {
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovsxbd512_mask ((__v16qi) __A, __undef,
-       (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi8_epi32 (__m512i __W, __mmask16 __U, __m128i __A)
- {
-   const __v16si __merge = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmovsxbd512_mask ((__v16qi) __A, __merge,
-       (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi8_epi32 (__mmask16 __U, __m128i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovsxbd512_mask ((__v16qi) __A, __zero,
-       (__mmask16) __U);
- }
- /* cvtepi8_epi64 family: wrappers for __builtin_ia32_pmovsxbq512_mask.
-    __A is passed as __v16qi; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi8_epi64 (__m128i __A)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovsxbq512_mask ((__v16qi) __A, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi8_epi64 (__m512i __W, __mmask8 __U, __m128i __A)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovsxbq512_mask ((__v16qi) __A, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi8_epi64 (__mmask8 __U, __m128i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovsxbq512_mask ((__v16qi) __A, __zero,
-       (__mmask8) __U);
- }
- /* cvtepi16_epi32 family: wrappers for __builtin_ia32_pmovsxwd512_mask.
-    __A is passed as __v16hi; the second operand / mask are an undefined
-    vector with (__mmask16) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi16_epi32 (__m256i __A)
- {
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovsxwd512_mask ((__v16hi) __A, __undef,
-       (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi16_epi32 (__m512i __W, __mmask16 __U, __m256i __A)
- {
-   const __v16si __merge = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmovsxwd512_mask ((__v16hi) __A, __merge,
-       (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi16_epi32 (__mmask16 __U, __m256i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovsxwd512_mask ((__v16hi) __A, __zero,
-       (__mmask16) __U);
- }
- /* cvtepi16_epi64 family: wrappers for __builtin_ia32_pmovsxwq512_mask.
-    __A is passed as __v8hi; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi16_epi64 (__m128i __A)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovsxwq512_mask ((__v8hi) __A, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi16_epi64 (__m512i __W, __mmask8 __U, __m128i __A)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovsxwq512_mask ((__v8hi) __A, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi16_epi64 (__mmask8 __U, __m128i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovsxwq512_mask ((__v8hi) __A, __zero,
-       (__mmask8) __U);
- }
- /* cvtepi32_epi64 family: wrappers for __builtin_ia32_pmovsxdq512_mask.
-    __X is passed as __v8si; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi32_epi64 (__m256i __X)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovsxdq512_mask ((__v8si) __X, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_epi64 (__m512i __W, __mmask8 __U, __m256i __X)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovsxdq512_mask ((__v8si) __X, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi32_epi64 (__mmask8 __U, __m256i __X)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovsxdq512_mask ((__v8si) __X, __zero,
-       (__mmask8) __U);
- }
- /* cvtepu8_epi32 family: wrappers for __builtin_ia32_pmovzxbd512_mask.
-    __A is passed as __v16qi; the second operand / mask are an undefined
-    vector with (__mmask16) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu8_epi32 (__m128i __A)
- {
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovzxbd512_mask ((__v16qi) __A, __undef,
-       (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu8_epi32 (__m512i __W, __mmask16 __U, __m128i __A)
- {
-   const __v16si __merge = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmovzxbd512_mask ((__v16qi) __A, __merge,
-       (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu8_epi32 (__mmask16 __U, __m128i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovzxbd512_mask ((__v16qi) __A, __zero,
-       (__mmask16) __U);
- }
- /* cvtepu8_epi64 family: wrappers for __builtin_ia32_pmovzxbq512_mask.
-    __A is passed as __v16qi; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu8_epi64 (__m128i __A)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovzxbq512_mask ((__v16qi) __A, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu8_epi64 (__m512i __W, __mmask8 __U, __m128i __A)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovzxbq512_mask ((__v16qi) __A, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu8_epi64 (__mmask8 __U, __m128i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovzxbq512_mask ((__v16qi) __A, __zero,
-       (__mmask8) __U);
- }
- /* cvtepu16_epi32 family: wrappers for __builtin_ia32_pmovzxwd512_mask.
-    __A is passed as __v16hi; the second operand / mask are an undefined
-    vector with (__mmask16) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu16_epi32 (__m256i __A)
- {
-   const __v16si __undef = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovzxwd512_mask ((__v16hi) __A, __undef,
-       (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu16_epi32 (__m512i __W, __mmask16 __U, __m256i __A)
- {
-   const __v16si __merge = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmovzxwd512_mask ((__v16hi) __A, __merge,
-       (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu16_epi32 (__mmask16 __U, __m256i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovzxwd512_mask ((__v16hi) __A, __zero,
-       (__mmask16) __U);
- }
- /* cvtepu16_epi64 family: wrappers for __builtin_ia32_pmovzxwq512_mask.
-    __A is passed as __v8hi; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu16_epi64 (__m128i __A)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovzxwq512_mask ((__v8hi) __A, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu16_epi64 (__m512i __W, __mmask8 __U, __m128i __A)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovzxwq512_mask ((__v8hi) __A, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu16_epi64 (__mmask8 __U, __m128i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovzxwq512_mask ((__v8hi) __A, __zero,
-       (__mmask8) __U);
- }
- /* cvtepu32_epi64 family: wrappers for __builtin_ia32_pmovzxdq512_mask.
-    __X is passed as __v8si; the second operand / mask are an undefined
-    vector with (__mmask8) -1, __W with __U, or a zero vector with __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu32_epi64 (__m256i __X)
- {
-   const __v8di __undef = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pmovzxdq512_mask ((__v8si) __X, __undef,
-       (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu32_epi64 (__m512i __W, __mmask8 __U, __m256i __X)
- {
-   const __v8di __merge = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmovzxdq512_mask ((__v8si) __X, __merge,
-       (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu32_epi64 (__mmask8 __U, __m256i __X)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmovzxdq512_mask ((__v8si) __X, __zero,
-       (__mmask8) __U);
- }
- #ifdef __OPTIMIZE__
- /* add_round_pd family: all three forward __A, __B to
-    __builtin_ia32_addpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_addpd512_mask ((__v8df) __A, (__v8df) __B,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     __m512d __B, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_addpd512_mask ((__v8df) __A, (__v8df) __B,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_addpd512_mask ((__v8df) __A, (__v8df) __B,
-       __zero, (__mmask8) __U, __R);
- }
- /* add_round_ps family: all three forward __A, __B to
-    __builtin_ia32_addps512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask16) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_addps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __undef, (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-     __m512 __B, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_addps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __merge, (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_addps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __zero, (__mmask16) __U, __R);
- }
- /* sub_round_pd family: all three forward __A, __B to
-    __builtin_ia32_subpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_subpd512_mask ((__v8df) __A, (__v8df) __B,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     __m512d __B, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_subpd512_mask ((__v8df) __A, (__v8df) __B,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_subpd512_mask ((__v8df) __A, (__v8df) __B,
-       __zero, (__mmask8) __U, __R);
- }
- /* sub_round_ps family: all three forward __A, __B to
-    __builtin_ia32_subps512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask16) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_subps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __undef, (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-     __m512 __B, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_subps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __merge, (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_subps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __zero, (__mmask16) __U, __R);
- }
- #else
- /* Macro forms of the add_round_pd family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_add_round_pd(X, Y, R) \
-   (__m512d) __builtin_ia32_addpd512_mask (X, Y, \
-     (__v8df) _mm512_undefined_pd (), -1, R)
- #define _mm512_mask_add_round_pd(W, U, X, Y, R) \
-   (__m512d) __builtin_ia32_addpd512_mask (X, Y, W, U, R)
- #define _mm512_maskz_add_round_pd(U, X, Y, R) \
-   (__m512d) __builtin_ia32_addpd512_mask (X, Y, \
-     (__v8df) _mm512_setzero_pd (), U, R)
- /* Macro forms of the add_round_ps family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_add_round_ps(X, Y, R) \
-   (__m512) __builtin_ia32_addps512_mask (X, Y, \
-     (__v16sf) _mm512_undefined_ps (), -1, R)
- #define _mm512_mask_add_round_ps(W, U, X, Y, R) \
-   (__m512) __builtin_ia32_addps512_mask (X, Y, W, U, R)
- #define _mm512_maskz_add_round_ps(U, X, Y, R) \
-   (__m512) __builtin_ia32_addps512_mask (X, Y, \
-     (__v16sf) _mm512_setzero_ps (), U, R)
- /* Macro forms of the sub_round_pd family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_sub_round_pd(X, Y, R) \
-   (__m512d) __builtin_ia32_subpd512_mask (X, Y, \
-     (__v8df) _mm512_undefined_pd (), -1, R)
- #define _mm512_mask_sub_round_pd(W, U, X, Y, R) \
-   (__m512d) __builtin_ia32_subpd512_mask (X, Y, W, U, R)
- #define _mm512_maskz_sub_round_pd(U, X, Y, R) \
-   (__m512d) __builtin_ia32_subpd512_mask (X, Y, \
-     (__v8df) _mm512_setzero_pd (), U, R)
- /* Macro forms of the sub_round_ps family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_sub_round_ps(X, Y, R) \
-   (__m512) __builtin_ia32_subps512_mask (X, Y, \
-     (__v16sf) _mm512_undefined_ps (), -1, R)
- #define _mm512_mask_sub_round_ps(W, U, X, Y, R) \
-   (__m512) __builtin_ia32_subps512_mask (X, Y, W, U, R)
- #define _mm512_maskz_sub_round_ps(U, X, Y, R) \
-   (__m512) __builtin_ia32_subps512_mask (X, Y, \
-     (__v16sf) _mm512_setzero_ps (), U, R)
- #endif
- #ifdef __OPTIMIZE__
- /* mul_round_pd family: all three forward __A, __B to
-    __builtin_ia32_mulpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_mulpd512_mask ((__v8df) __A, (__v8df) __B,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     __m512d __B, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_mulpd512_mask ((__v8df) __A, (__v8df) __B,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_mulpd512_mask ((__v8df) __A, (__v8df) __B,
-       __zero, (__mmask8) __U, __R);
- }
- /* mul_round_ps family: all three forward __A, __B to
-    __builtin_ia32_mulps512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask16) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_mulps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __undef, (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-     __m512 __B, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_mulps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __merge, (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_mulps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __zero, (__mmask16) __U, __R);
- }
- /* div_round_pd family: all three forward __M, __V (in that order) to
-    __builtin_ia32_divpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_div_round_pd (__m512d __M, __m512d __V, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_divpd512_mask ((__v8df) __M, (__v8df) __V,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_div_round_pd (__m512d __W, __mmask8 __U, __m512d __M,
-     __m512d __V, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_divpd512_mask ((__v8df) __M, (__v8df) __V,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_div_round_pd (__mmask8 __U, __m512d __M, __m512d __V,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_divpd512_mask ((__v8df) __M, (__v8df) __V,
-       __zero, (__mmask8) __U, __R);
- }
- /* div_round_ps family: all three forward __A, __B (in that order) to
-    __builtin_ia32_divps512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask16) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_div_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_divps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __undef, (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_div_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-     __m512 __B, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_divps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __merge, (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_div_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_divps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __zero, (__mmask16) __U, __R);
- }
- /* mul_round_sd family.  The plain form calls __builtin_ia32_mulsd_round
-    with (__A, __B, __R); the masked forms call
-    __builtin_ia32_mulsd_mask_round and add a third vector (__W, or zero
-    for maskz) plus the mask __U before __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mul_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __lhs = (__v2df) __A;
-   const __v2df __rhs = (__v2df) __B;
-   return (__m128d) __builtin_ia32_mulsd_round (__lhs, __rhs, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_mul_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
-     __m128d __B, const int __R)
- {
-   const __v2df __merge = (__v2df) __W;
-   return (__m128d) __builtin_ia32_mulsd_mask_round ((__v2df) __A,
-       (__v2df) __B, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_mul_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
-     const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_mulsd_mask_round ((__v2df) __A,
-       (__v2df) __B, __zero, (__mmask8) __U, __R);
- }
- /* mul_round_ss family.  The plain form calls __builtin_ia32_mulss_round
-    with (__A, __B, __R); the masked forms call
-    __builtin_ia32_mulss_mask_round and add a third vector (__W, or zero
-    for maskz) plus the mask __U before __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mul_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __lhs = (__v4sf) __A;
-   const __v4sf __rhs = (__v4sf) __B;
-   return (__m128) __builtin_ia32_mulss_round (__lhs, __rhs, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_mul_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
-     __m128 __B, const int __R)
- {
-   const __v4sf __merge = (__v4sf) __W;
-   return (__m128) __builtin_ia32_mulss_mask_round ((__v4sf) __A,
-       (__v4sf) __B, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_mul_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
-     const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_mulss_mask_round ((__v4sf) __A,
-       (__v4sf) __B, __zero, (__mmask8) __U, __R);
- }
- /* div_round_sd family.  The plain form calls __builtin_ia32_divsd_round
-    with (__A, __B, __R); the masked forms call
-    __builtin_ia32_divsd_mask_round and add a third vector (__W, or zero
-    for maskz) plus the mask __U before __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_div_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __lhs = (__v2df) __A;
-   const __v2df __rhs = (__v2df) __B;
-   return (__m128d) __builtin_ia32_divsd_round (__lhs, __rhs, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_div_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
-     __m128d __B, const int __R)
- {
-   const __v2df __merge = (__v2df) __W;
-   return (__m128d) __builtin_ia32_divsd_mask_round ((__v2df) __A,
-       (__v2df) __B, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_div_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
-     const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_divsd_mask_round ((__v2df) __A,
-       (__v2df) __B, __zero, (__mmask8) __U, __R);
- }
- /* div_round_ss family.  The plain form calls __builtin_ia32_divss_round
-    with (__A, __B, __R); the masked forms call
-    __builtin_ia32_divss_mask_round and add a third vector (__W, or zero
-    for maskz) plus the mask __U before __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_div_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __lhs = (__v4sf) __A;
-   const __v4sf __rhs = (__v4sf) __B;
-   return (__m128) __builtin_ia32_divss_round (__lhs, __rhs, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_div_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
-     __m128 __B, const int __R)
- {
-   const __v4sf __merge = (__v4sf) __W;
-   return (__m128) __builtin_ia32_divss_mask_round ((__v4sf) __A,
-       (__v4sf) __B, __merge, (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_div_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
-     const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_divss_mask_round ((__v4sf) __A,
-       (__v4sf) __B, __zero, (__mmask8) __U, __R);
- }
- #else
- /* Macro forms of the mul_round_pd family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_mul_round_pd(X, Y, R) \
-   (__m512d) __builtin_ia32_mulpd512_mask (X, Y, \
-     (__v8df) _mm512_undefined_pd (), -1, R)
- #define _mm512_mask_mul_round_pd(W, U, X, Y, R) \
-   (__m512d) __builtin_ia32_mulpd512_mask (X, Y, W, U, R)
- #define _mm512_maskz_mul_round_pd(U, X, Y, R) \
-   (__m512d) __builtin_ia32_mulpd512_mask (X, Y, \
-     (__v8df) _mm512_setzero_pd (), U, R)
- /* Macro forms of the mul_round_ps family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_mul_round_ps(X, Y, R) \
-   (__m512) __builtin_ia32_mulps512_mask (X, Y, \
-     (__v16sf) _mm512_undefined_ps (), -1, R)
- #define _mm512_mask_mul_round_ps(W, U, X, Y, R) \
-   (__m512) __builtin_ia32_mulps512_mask (X, Y, W, U, R)
- #define _mm512_maskz_mul_round_ps(U, X, Y, R) \
-   (__m512) __builtin_ia32_mulps512_mask (X, Y, \
-     (__v16sf) _mm512_setzero_ps (), U, R)
- /* Macro forms of the div_round_pd family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_div_round_pd(X, Y, R) \
-   (__m512d) __builtin_ia32_divpd512_mask (X, Y, \
-     (__v8df) _mm512_undefined_pd (), -1, R)
- #define _mm512_mask_div_round_pd(W, U, X, Y, R) \
-   (__m512d) __builtin_ia32_divpd512_mask (X, Y, W, U, R)
- #define _mm512_maskz_div_round_pd(U, X, Y, R) \
-   (__m512d) __builtin_ia32_divpd512_mask (X, Y, \
-     (__v8df) _mm512_setzero_pd (), U, R)
- /* Macro forms of the div_round_ps family (the #else branch of
-    __OPTIMIZE__); R is forwarded as the last builtin operand.  */
- #define _mm512_div_round_ps(X, Y, R) \
-   (__m512) __builtin_ia32_divps512_mask (X, Y, \
-     (__v16sf) _mm512_undefined_ps (), -1, R)
- #define _mm512_mask_div_round_ps(W, U, X, Y, R) \
-   (__m512) __builtin_ia32_divps512_mask (X, Y, W, U, R)
- #define _mm512_maskz_div_round_ps(U, X, Y, R) \
-   (__m512) __builtin_ia32_divps512_mask (X, Y, \
-     (__v16sf) _mm512_setzero_ps (), U, R)
- /* Macro forms of the mul_round_sd family: the plain form maps to
-    __builtin_ia32_mulsd_round, the masked forms to the _mask_round builtin.  */
- #define _mm_mul_round_sd(X, Y, R) \
-   (__m128d) __builtin_ia32_mulsd_round (X, Y, R)
- #define _mm_mask_mul_round_sd(W, U, X, Y, R) \
-   (__m128d) __builtin_ia32_mulsd_mask_round (X, Y, W, U, R)
- #define _mm_maskz_mul_round_sd(U, X, Y, R) \
-   (__m128d) __builtin_ia32_mulsd_mask_round (X, Y, \
-     (__v2df) _mm_setzero_pd (), U, R)
- /* Macro forms of the mul_round_ss family: the plain form maps to
-    __builtin_ia32_mulss_round, the masked forms to the _mask_round builtin.  */
- #define _mm_mul_round_ss(X, Y, R) \
-   (__m128) __builtin_ia32_mulss_round (X, Y, R)
- #define _mm_mask_mul_round_ss(W, U, X, Y, R) \
-   (__m128) __builtin_ia32_mulss_mask_round (X, Y, W, U, R)
- #define _mm_maskz_mul_round_ss(U, X, Y, R) \
-   (__m128) __builtin_ia32_mulss_mask_round (X, Y, \
-     (__v4sf) _mm_setzero_ps (), U, R)
- /* Macro forms of the div_round_sd family: the plain form maps to
-    __builtin_ia32_divsd_round, the masked forms to the _mask_round builtin.  */
- #define _mm_div_round_sd(X, Y, R) \
-   (__m128d) __builtin_ia32_divsd_round (X, Y, R)
- #define _mm_mask_div_round_sd(W, U, X, Y, R) \
-   (__m128d) __builtin_ia32_divsd_mask_round (X, Y, W, U, R)
- #define _mm_maskz_div_round_sd(U, X, Y, R) \
-   (__m128d) __builtin_ia32_divsd_mask_round (X, Y, \
-     (__v2df) _mm_setzero_pd (), U, R)
- /* Macro forms of the div_round_ss family: the plain form maps to
-    __builtin_ia32_divss_round, the masked forms to the _mask_round builtin.  */
- #define _mm_div_round_ss(X, Y, R) \
-   (__m128) __builtin_ia32_divss_round (X, Y, R)
- #define _mm_mask_div_round_ss(W, U, X, Y, R) \
-   (__m128) __builtin_ia32_divss_mask_round (X, Y, W, U, R)
- #define _mm_maskz_div_round_ss(U, X, Y, R) \
-   (__m128) __builtin_ia32_divss_mask_round (X, Y, \
-     (__v4sf) _mm_setzero_ps (), U, R)
- #endif
- #ifdef __OPTIMIZE__
- /* max_round_pd family: all three forward __A, __B to
-    __builtin_ia32_maxpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A, (__v8df) __B,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     __m512d __B, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A, (__v8df) __B,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A, (__v8df) __B,
-       __zero, (__mmask8) __U, __R);
- }
- /* max_round_ps family: all three forward __A, __B to
-    __builtin_ia32_maxps512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask16) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __undef, (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-     __m512 __B, const int __R)
- {
-   const __v16sf __merge = (__v16sf) __W;
-   return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __merge, (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A, (__v16sf) __B,
-       __zero, (__mmask16) __U, __R);
- }
- /* min_round_pd family: all three forward __A, __B to
-    __builtin_ia32_minpd512_mask and pass __R through as the last operand.
-    Third operand / mask: undefined vector with (__mmask8) -1, __W with
-    __U, or a zero vector with __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A, (__v8df) __B,
-       __undef, (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-     __m512d __B, const int __R)
- {
-   const __v8df __merge = (__v8df) __W;
-   return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A, (__v8df) __B,
-       __merge, (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-     const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A, (__v8df) __B,
-       __zero, (__mmask8) __U, __R);
- }
- /* Unmasked form: forwards __A and __B to __builtin_ia32_minps512_mask with
-    _mm512_undefined_ps () as the third operand, mask (__mmask16) -1, __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __fill = (__v16sf) _mm512_undefined_ps ();
-   const __mmask16 __every = (__mmask16) -1;
-   return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                 __fill, __every, __R);
- }
- /* Masked form: forwards __A and __B to __builtin_ia32_minps512_mask with
-    __W as the third vector operand, __U as the mask and __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-                           __m512 __B, const int __R)
- {
-   const __v16sf __src = (__v16sf) __W;
-   const __mmask16 __sel = (__mmask16) __U;
-   return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                 __src, __sel, __R);
- }
- /* Maskz form: forwards __A and __B to __builtin_ia32_minps512_mask with
-    _mm512_setzero_ps () as the third operand, __U as the mask and __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_round_ps (__mmask16 __U, __m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   const __mmask16 __sel = (__mmask16) __U;
-   return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                 __zero, __sel, __R);
- }
- #else
- /* Macro counterparts of the inline max/min *_round_* wrappers (the #else
-    branch of the enclosing conditional).  Each one expands directly to the
-    matching __builtin_ia32_{max,min}{pd,ps}512_mask call.  The whole
-    expansion and every argument are parenthesized so the result behaves as
-    a single primary expression.  _mm512_max_round_ps takes its placeholder
-    operand from _mm512_undefined_ps (), matching the inline version.  */
- #define _mm512_max_round_pd(A, B, R) \
-   ((__m512d)__builtin_ia32_maxpd512_mask((A), (B), (__v8df)_mm512_undefined_pd(), -1, (R)))
- #define _mm512_mask_max_round_pd(W, U, A, B, R) \
-   ((__m512d)__builtin_ia32_maxpd512_mask((A), (B), (W), (U), (R)))
- #define _mm512_maskz_max_round_pd(U, A, B, R) \
-   ((__m512d)__builtin_ia32_maxpd512_mask((A), (B), (__v8df)_mm512_setzero_pd(), (U), (R)))
- #define _mm512_max_round_ps(A, B, R) \
-   ((__m512)__builtin_ia32_maxps512_mask((A), (B), (__v16sf)_mm512_undefined_ps(), -1, (R)))
- #define _mm512_mask_max_round_ps(W, U, A, B, R) \
-   ((__m512)__builtin_ia32_maxps512_mask((A), (B), (W), (U), (R)))
- #define _mm512_maskz_max_round_ps(U, A, B, R) \
-   ((__m512)__builtin_ia32_maxps512_mask((A), (B), (__v16sf)_mm512_setzero_ps(), (U), (R)))
- #define _mm512_min_round_pd(A, B, R) \
-   ((__m512d)__builtin_ia32_minpd512_mask((A), (B), (__v8df)_mm512_undefined_pd(), -1, (R)))
- #define _mm512_mask_min_round_pd(W, U, A, B, R) \
-   ((__m512d)__builtin_ia32_minpd512_mask((A), (B), (W), (U), (R)))
- #define _mm512_maskz_min_round_pd(U, A, B, R) \
-   ((__m512d)__builtin_ia32_minpd512_mask((A), (B), (__v8df)_mm512_setzero_pd(), (U), (R)))
- #define _mm512_min_round_ps(A, B, R) \
-   ((__m512)__builtin_ia32_minps512_mask((A), (B), (__v16sf)_mm512_undefined_ps(), -1, (R)))
- #define _mm512_mask_min_round_ps(W, U, A, B, R) \
-   ((__m512)__builtin_ia32_minps512_mask((A), (B), (W), (U), (R)))
- #define _mm512_maskz_min_round_ps(U, A, B, R) \
-   ((__m512)__builtin_ia32_minps512_mask((A), (B), (__v16sf)_mm512_setzero_ps(), (U), (R)))
- #endif
- #ifdef __OPTIMIZE__
- /* Unmasked form: forwards __A and __B to __builtin_ia32_scalefpd512_mask with
-    _mm512_undefined_pd () as the third operand, mask (__mmask8) -1, __R last.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_scalef_round_pd (__m512d __A, __m512d __B, const int __R)
- {
-   const __v8df __fill = (__v8df) _mm512_undefined_pd ();
-   const __mmask8 __every = (__mmask8) -1;
-   return (__m512d) __builtin_ia32_scalefpd512_mask ((__v8df) __A, (__v8df) __B,
-                                                     __fill, __every, __R);
- }
- /* Masked form: forwards __A and __B to __builtin_ia32_scalefpd512_mask with
-    __W as the third vector operand, __U as the mask and __R last.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_scalef_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
-                              __m512d __B, const int __R)
- {
-   const __v8df __src = (__v8df) __W;
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m512d) __builtin_ia32_scalefpd512_mask ((__v8df) __A, (__v8df) __B,
-                                                     __src, __sel, __R);
- }
- /* Maskz form: forwards __A and __B to __builtin_ia32_scalefpd512_mask with
-    _mm512_setzero_pd () as the third operand, __U as the mask and __R last.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_scalef_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                               const int __R)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m512d) __builtin_ia32_scalefpd512_mask ((__v8df) __A, (__v8df) __B,
-                                                     __zero, __sel, __R);
- }
- /* Unmasked form: forwards __A and __B to __builtin_ia32_scalefps512_mask with
-    _mm512_undefined_ps () as the third operand, mask (__mmask16) -1, __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_scalef_round_ps (__m512 __A, __m512 __B, const int __R)
- {
-   const __v16sf __fill = (__v16sf) _mm512_undefined_ps ();
-   const __mmask16 __every = (__mmask16) -1;
-   return (__m512) __builtin_ia32_scalefps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                    __fill, __every, __R);
- }
- /* Masked form: forwards __A and __B to __builtin_ia32_scalefps512_mask with
-    __W as the third vector operand, __U as the mask and __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_scalef_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
-                              __m512 __B, const int __R)
- {
-   const __v16sf __src = (__v16sf) __W;
-   const __mmask16 __sel = (__mmask16) __U;
-   return (__m512) __builtin_ia32_scalefps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                    __src, __sel, __R);
- }
- /* Maskz form: forwards __A and __B to __builtin_ia32_scalefps512_mask with
-    _mm512_setzero_ps () as the third operand, __U as the mask and __R last.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_scalef_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                               const int __R)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   const __mmask16 __sel = (__mmask16) __U;
-   return (__m512) __builtin_ia32_scalefps512_mask ((__v16sf) __A, (__v16sf) __B,
-                                                    __zero, __sel, __R);
- }
- /* Unmasked form: forwards __A and __B to __builtin_ia32_scalefsd_mask_round
-    with _mm_setzero_pd () as the third operand, mask (__mmask8) -1, __R last.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_scalef_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   const __mmask8 __every = (__mmask8) -1;
-   return (__m128d) __builtin_ia32_scalefsd_mask_round ((__v2df) __A,
-                                                        (__v2df) __B,
-                                                        __zero, __every, __R);
- }
- /* Masked form: forwards __A and __B to __builtin_ia32_scalefsd_mask_round
-    with __W as the third vector operand, __U as the mask and __R last.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_scalef_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B,
-                           const int __R)
- {
-   const __v2df __src = (__v2df) __W;
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m128d) __builtin_ia32_scalefsd_mask_round ((__v2df) __A,
-                                                        (__v2df) __B,
-                                                        __src, __sel, __R);
- }
- /* Maskz form: forwards __A and __B to __builtin_ia32_scalefsd_mask_round
-    with _mm_setzero_pd () as the third operand, __U as the mask, __R last.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_scalef_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
-                            const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m128d) __builtin_ia32_scalefsd_mask_round ((__v2df) __A,
-                                                        (__v2df) __B,
-                                                        __zero, __sel, __R);
- }
- /* Unmasked form: forwards __A and __B to __builtin_ia32_scalefss_mask_round
-    with _mm_setzero_ps () as the third operand, mask (__mmask8) -1, __R last.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_scalef_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   const __mmask8 __every = (__mmask8) -1;
-   return (__m128) __builtin_ia32_scalefss_mask_round ((__v4sf) __A,
-                                                       (__v4sf) __B,
-                                                       __zero, __every, __R);
- }
- /* Masked form: forwards __A and __B to __builtin_ia32_scalefss_mask_round
-    with __W as the third vector operand, __U as the mask and __R last.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_scalef_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B,
-                           const int __R)
- {
-   const __v4sf __src = (__v4sf) __W;
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m128) __builtin_ia32_scalefss_mask_round ((__v4sf) __A,
-                                                       (__v4sf) __B,
-                                                       __src, __sel, __R);
- }
- /* Maskz form: forwards __A and __B to __builtin_ia32_scalefss_mask_round
-    with _mm_setzero_ps () as the third operand, __U as the mask, __R last.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_scalef_round_ss (__mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   const __mmask8 __sel = (__mmask8) __U;
-   return (__m128) __builtin_ia32_scalefss_mask_round ((__v4sf) __A,
-                                                       (__v4sf) __B,
-                                                       __zero, __sel, __R);
- }
- #else
- /* Macro counterparts of the inline scalef *_round_* wrappers, used when
-    __OPTIMIZE__ is not defined.  Each expands directly to the matching
-    __builtin_ia32_scalef* call, with the whole expansion and every argument
-    parenthesized.  The scalar _mm_mask_* / _mm_maskz_* forms are provided
-    here as well, so this branch defines the same names as the inline
-    branch.  */
- #define _mm512_scalef_round_pd(A, B, C) \
-   ((__m512d)__builtin_ia32_scalefpd512_mask((A), (B), (__v8df)_mm512_undefined_pd(), -1, (C)))
- #define _mm512_mask_scalef_round_pd(W, U, A, B, C) \
-   ((__m512d)__builtin_ia32_scalefpd512_mask((A), (B), (W), (U), (C)))
- #define _mm512_maskz_scalef_round_pd(U, A, B, C) \
-   ((__m512d)__builtin_ia32_scalefpd512_mask((A), (B), (__v8df)_mm512_setzero_pd(), (U), (C)))
- #define _mm512_scalef_round_ps(A, B, C) \
-   ((__m512)__builtin_ia32_scalefps512_mask((A), (B), (__v16sf)_mm512_undefined_ps(), -1, (C)))
- #define _mm512_mask_scalef_round_ps(W, U, A, B, C) \
-   ((__m512)__builtin_ia32_scalefps512_mask((A), (B), (W), (U), (C)))
- #define _mm512_maskz_scalef_round_ps(U, A, B, C) \
-   ((__m512)__builtin_ia32_scalefps512_mask((A), (B), (__v16sf)_mm512_setzero_ps(), (U), (C)))
- #define _mm_scalef_round_sd(A, B, C) \
-   ((__m128d)__builtin_ia32_scalefsd_mask_round ((A), (B), \
-     (__v2df)_mm_setzero_pd (), -1, (C)))
- #define _mm_mask_scalef_round_sd(W, U, A, B, C) \
-   ((__m128d)__builtin_ia32_scalefsd_mask_round ((A), (B), (W), (U), (C)))
- #define _mm_maskz_scalef_round_sd(U, A, B, C) \
-   ((__m128d)__builtin_ia32_scalefsd_mask_round ((A), (B), \
-     (__v2df)_mm_setzero_pd (), (U), (C)))
- #define _mm_scalef_round_ss(A, B, C) \
-   ((__m128)__builtin_ia32_scalefss_mask_round ((A), (B), \
-     (__v4sf)_mm_setzero_ps (), -1, (C)))
- #define _mm_mask_scalef_round_ss(W, U, A, B, C) \
-   ((__m128)__builtin_ia32_scalefss_mask_round ((A), (B), (W), (U), (C)))
- #define _mm_maskz_scalef_round_ss(U, A, B, C) \
-   ((__m128)__builtin_ia32_scalefss_mask_round ((A), (B), \
-     (__v4sf)_mm_setzero_ps (), (U), (C)))
- #endif
- #ifdef __OPTIMIZE__
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddpd512_mask with mask
-    (__mmask8) -1 and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmadd_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddpd512_mask (__op1, __op2, __op3,
-                                                     (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddpd512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmadd_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                             __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddpd512_mask (__op1, __op2, __op3,
-                                                     (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddpd512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmadd_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                              __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddpd512_mask3 (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddpd512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmadd_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                              __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddpd512_maskz (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddps512_mask with mask
-    (__mmask16) -1 and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmadd_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddps512_mask (__op1, __op2, __op3,
-                                                    (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddps512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmadd_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                             __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddps512_mask (__op1, __op2, __op3,
-                                                    (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddps512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmadd_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                              __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddps512_mask3 (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddps512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmadd_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                              __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddps512_maskz (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubpd512_mask with mask
-    (__mmask8) -1 and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsub_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmsubpd512_mask (__op1, __op2, __op3,
-                                                     (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubpd512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsub_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                             __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmsubpd512_mask (__op1, __op2, __op3,
-                                                     (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubpd512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsub_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                              __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmsubpd512_mask3 (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubpd512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsub_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                              __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmsubpd512_maskz (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubps512_mask with mask
-    (__mmask16) -1 and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsub_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmsubps512_mask (__op1, __op2, __op3,
-                                                    (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubps512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsub_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                             __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmsubps512_mask (__op1, __op2, __op3,
-                                                    (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubps512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsub_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                              __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmsubps512_mask3 (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmsubps512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsub_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                              __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmsubps512_maskz (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubpd512_mask with mask
-    (__mmask8) -1 and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmaddsub_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__op1, __op2, __op3,
-                                                        (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubpd512_mask with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmaddsub_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                                __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__op1, __op2, __op3,
-                                                        (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubpd512_mask3 with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmaddsub_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                                 __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_mask3 (__op1, __op2, __op3,
-                                                         (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubpd512_maskz with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmaddsub_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                                 __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz (__op1, __op2, __op3,
-                                                         (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubps512_mask with mask
-    (__mmask16) -1 and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmaddsub_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_mask (__op1, __op2, __op3,
-                                                       (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubps512_mask with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmaddsub_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                                __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_mask (__op1, __op2, __op3,
-                                                       (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubps512_mask3 with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmaddsub_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                                 __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_mask3 (__op1, __op2, __op3,
-                                                        (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfmaddsubps512_maskz with __U
-    as the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmaddsub_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                                 __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_maskz (__op1, __op2, __op3,
-                                                        (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubpd512_mask with mask (__mmask8) -1 and __R as the
-    final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsubadd_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __neg3 = -(__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__op1, __op2, __neg3,
-                                                        (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubpd512_mask with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsubadd_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                                __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __neg3 = -(__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__op1, __op2, __neg3,
-                                                        (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C (not negated) to
-    __builtin_ia32_vfmsubaddpd512_mask3 with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsubadd_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                                 __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmsubaddpd512_mask3 (__op1, __op2, __op3,
-                                                         (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubpd512_maskz with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsubadd_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                                 __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __neg3 = -(__v8df) __C;
-   return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz (__op1, __op2, __neg3,
-                                                         (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubps512_mask with mask (__mmask16) -1 and __R as the
-    final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsubadd_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __neg3 = -(__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_mask (__op1, __op2, __neg3,
-                                                       (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubps512_mask with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsubadd_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                                __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __neg3 = -(__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_mask (__op1, __op2, __neg3,
-                                                       (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C (not negated) to
-    __builtin_ia32_vfmsubaddps512_mask3 with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsubadd_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                                 __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmsubaddps512_mask3 (__op1, __op2, __op3,
-                                                        (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and the negation of __C to
-    __builtin_ia32_vfmaddsubps512_maskz with __U as the mask and __R as the
-    final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsubadd_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                                 __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __neg3 = -(__v16sf) __C;
-   return (__m512) __builtin_ia32_vfmaddsubps512_maskz (__op1, __op2, __neg3,
-                                                        (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddpd512_mask with mask
-    (__mmask8) -1 and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmadd_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmaddpd512_mask (__op1, __op2, __op3,
-                                                      (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddpd512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmadd_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                              __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmaddpd512_mask (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddpd512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmadd_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                               __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmaddpd512_mask3 (__op1, __op2, __op3,
-                                                       (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddpd512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmadd_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                               __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmaddpd512_maskz (__op1, __op2, __op3,
-                                                       (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddps512_mask with mask
-    (__mmask16) -1 and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmadd_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmaddps512_mask (__op1, __op2, __op3,
-                                                     (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddps512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmadd_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                              __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmaddps512_mask (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddps512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmadd_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                               __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmaddps512_mask3 (__op1, __op2, __op3,
-                                                      (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmaddps512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmadd_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                               __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmaddps512_maskz (__op1, __op2, __op3,
-                                                      (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubpd512_mask with mask
-    (__mmask8) -1 and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmsub_round_pd (__m512d __A, __m512d __B, __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmsubpd512_mask (__op1, __op2, __op3,
-                                                      (__mmask8) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubpd512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmsub_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
-                              __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmsubpd512_mask (__op1, __op2, __op3,
-                                                      (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubpd512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmsub_round_pd (__m512d __A, __m512d __B, __m512d __C,
-                               __mmask8 __U, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmsubpd512_mask3 (__op1, __op2, __op3,
-                                                       (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubpd512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmsub_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
-                               __m512d __C, const int __R)
- {
-   const __v8df __op1 = (__v8df) __A;
-   const __v8df __op2 = (__v8df) __B;
-   const __v8df __op3 = (__v8df) __C;
-   return (__m512d) __builtin_ia32_vfnmsubpd512_maskz (__op1, __op2, __op3,
-                                                       (__mmask8) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubps512_mask with mask
-    (__mmask16) -1 and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmsub_round_ps (__m512 __A, __m512 __B, __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmsubps512_mask (__op1, __op2, __op3,
-                                                     (__mmask16) -1, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubps512_mask with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmsub_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
-                              __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmsubps512_mask (__op1, __op2, __op3,
-                                                     (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubps512_mask3 with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmsub_round_ps (__m512 __A, __m512 __B, __m512 __C,
-                               __mmask16 __U, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmsubps512_mask3 (__op1, __op2, __op3,
-                                                      (__mmask16) __U, __R);
- }
- /* Forwards __A, __B and __C to __builtin_ia32_vfnmsubps512_maskz with __U as
-    the mask and __R as the final argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmsub_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
-                               __m512 __C, const int __R)
- {
-   const __v16sf __op1 = (__v16sf) __A;
-   const __v16sf __op2 = (__v16sf) __B;
-   const __v16sf __op3 = (__v16sf) __C;
-   return (__m512) __builtin_ia32_vfnmsubps512_maskz (__op1, __op2, __op3,
-                                                      (__mmask16) __U, __R);
- }
- #else
- /* Macro counterparts of the inline FMA *_round_* wrappers, used when
-    __OPTIMIZE__ is not defined.  Each expands directly to the matching
-    __builtin_ia32_vf* call.  The whole expansion and every argument are
-    parenthesized, so the cast covers the complete call result even when the
-    macro is followed by a postfix operator.  The fmsubadd forms negate C and
-    reuse the vfmaddsub builtins, except the mask3 forms, which call the
-    dedicated vfmsubadd*_mask3 builtins.  */
- #define _mm512_fmadd_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddpd512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmadd_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddpd512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmadd_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfmaddpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmadd_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddpd512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmadd_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddps512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmadd_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddps512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmadd_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfmaddps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmadd_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddps512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmsub_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmsubpd512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmsub_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmsubpd512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmsub_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfmsubpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmsub_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmsubpd512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmsub_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmsubps512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmsub_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfmsubps512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmsub_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfmsubps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmsub_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmsubps512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmaddsub_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmaddsub_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmaddsub_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmaddsub_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmaddsub_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fmaddsub_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fmaddsub_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmaddsub_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fmsubadd_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_mask((A), (B), -(C), -1, (R)))
- #define _mm512_mask_fmsubadd_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_mask((A), (B), -(C), (U), (R)))
- #define _mm512_mask3_fmsubadd_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfmsubaddpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmsubadd_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfmaddsubpd512_maskz((A), (B), -(C), (U), (R)))
- #define _mm512_fmsubadd_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_mask((A), (B), -(C), -1, (R)))
- #define _mm512_mask_fmsubadd_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_mask((A), (B), -(C), (U), (R)))
- #define _mm512_mask3_fmsubadd_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfmsubaddps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fmsubadd_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfmaddsubps512_maskz((A), (B), -(C), (U), (R)))
- #define _mm512_fnmadd_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmaddpd512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fnmadd_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmaddpd512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fnmadd_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfnmaddpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fnmadd_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmaddpd512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fnmadd_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmaddps512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fnmadd_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmaddps512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fnmadd_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfnmaddps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fnmadd_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmaddps512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fnmsub_round_pd(A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmsubpd512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fnmsub_round_pd(A, U, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmsubpd512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fnmsub_round_pd(A, B, C, U, R) \
-   ((__m512d)__builtin_ia32_vfnmsubpd512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fnmsub_round_pd(U, A, B, C, R) \
-   ((__m512d)__builtin_ia32_vfnmsubpd512_maskz((A), (B), (C), (U), (R)))
- #define _mm512_fnmsub_round_ps(A, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmsubps512_mask((A), (B), (C), -1, (R)))
- #define _mm512_mask_fnmsub_round_ps(A, U, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmsubps512_mask((A), (B), (C), (U), (R)))
- #define _mm512_mask3_fnmsub_round_ps(A, B, C, U, R) \
-   ((__m512)__builtin_ia32_vfnmsubps512_mask3((A), (B), (C), (U), (R)))
- #define _mm512_maskz_fnmsub_round_ps(U, A, B, C, R) \
-   ((__m512)__builtin_ia32_vfnmsubps512_maskz((A), (B), (C), (U), (R)))
- #endif
- /* Calls __builtin_ia32_pabsq512_mask on __A with _mm512_undefined_epi32 ()
-    as the second operand and mask (__mmask8) -1.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_abs_epi64 (__m512i __A)
- {
-   const __v8di __fill = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pabsq512_mask ((__v8di) __A, __fill,
-                                                  (__mmask8) -1);
- }
- /* Calls __builtin_ia32_pabsq512_mask on __A with __W as the second operand
-    and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_abs_epi64 (__m512i __W, __mmask8 __U, __m512i __A)
- {
-   const __v8di __src = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pabsq512_mask ((__v8di) __A, __src,
-                                                  (__mmask8) __U);
- }
- /* Calls __builtin_ia32_pabsq512_mask on __A with _mm512_setzero_si512 () as
-    the second operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_abs_epi64 (__mmask8 __U, __m512i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pabsq512_mask ((__v8di) __A, __zero,
-                                                  (__mmask8) __U);
- }
- /* Calls __builtin_ia32_pabsd512_mask on __A with _mm512_undefined_epi32 ()
-    as the second operand and mask (__mmask16) -1.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_abs_epi32 (__m512i __A)
- {
-   const __v16si __fill = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pabsd512_mask ((__v16si) __A, __fill,
-                                                  (__mmask16) -1);
- }
- /* Calls __builtin_ia32_pabsd512_mask on __A with __W as the second operand
-    and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_abs_epi32 (__m512i __W, __mmask16 __U, __m512i __A)
- {
-   const __v16si __src = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pabsd512_mask ((__v16si) __A, __src,
-                                                  (__mmask16) __U);
- }
- /* Calls __builtin_ia32_pabsd512_mask on __A with _mm512_setzero_si512 () as
-    the second operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_abs_epi32 (__mmask16 __U, __m512i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pabsd512_mask ((__v16si) __A, __zero,
-                                                  (__mmask16) __U);
- }
- /* Calls __builtin_ia32_broadcastss512 on __A with _mm512_undefined_ps () as
-    the second operand and mask (__mmask16) -1.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcastss_ps (__m128 __A)
- {
-   const __v16sf __fill = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_broadcastss512 ((__v4sf) __A, __fill,
-                                                  (__mmask16) -1);
- }
- /* Calls __builtin_ia32_broadcastss512 on __A with __O as the second operand
-    and __M as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcastss_ps (__m512 __O, __mmask16 __M, __m128 __A)
- {
-   const __v4sf __in = (__v4sf) __A;
-   const __v16sf __src = (__v16sf) __O;
-   return (__m512) __builtin_ia32_broadcastss512 (__in, __src, __M);
- }
- /* Calls __builtin_ia32_broadcastss512 on __A with _mm512_setzero_ps () as
-    the second operand and __M as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcastss_ps (__mmask16 __M, __m128 __A)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_broadcastss512 ((__v4sf) __A, __zero, __M);
- }
- /* Calls __builtin_ia32_broadcastsd512 on __A with _mm512_undefined_pd () as
-    the second operand and mask (__mmask8) -1.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcastsd_pd (__m128d __A)
- {
-   const __v8df __fill = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_broadcastsd512 ((__v2df) __A, __fill,
-                                                   (__mmask8) -1);
- }
- /* Calls __builtin_ia32_broadcastsd512 on __A with __O as the second operand
-    and __M as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcastsd_pd (__m512d __O, __mmask8 __M, __m128d __A)
- {
-   const __v2df __in = (__v2df) __A;
-   const __v8df __src = (__v8df) __O;
-   return (__m512d) __builtin_ia32_broadcastsd512 (__in, __src, __M);
- }
- /* Calls __builtin_ia32_broadcastsd512 on __A with _mm512_setzero_pd () as
-    the second operand and __M as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcastsd_pd (__mmask8 __M, __m128d __A)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_broadcastsd512 ((__v2df) __A, __zero, __M);
- }
- /* Calls __builtin_ia32_pbroadcastd512 on __A with _mm512_undefined_epi32 ()
-    as the second operand and mask (__mmask16) -1.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcastd_epi32 (__m128i __A)
- {
-   const __v16si __fill = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_pbroadcastd512 ((__v4si) __A, __fill,
-                                                   (__mmask16) -1);
- }
- /* Calls __builtin_ia32_pbroadcastd512 on __A with __O as the second operand
-    and __M as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcastd_epi32 (__m512i __O, __mmask16 __M, __m128i __A)
- {
-   const __v4si __in = (__v4si) __A;
-   const __v16si __src = (__v16si) __O;
-   return (__m512i) __builtin_ia32_pbroadcastd512 (__in, __src, __M);
- }
- /* Calls __builtin_ia32_pbroadcastd512 on __A with _mm512_setzero_si512 ()
-    as the second operand and __M as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcastd_epi32 (__mmask16 __M, __m128i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pbroadcastd512 ((__v4si) __A, __zero, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_epi32 (int __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastd512_gpr_mask (__A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16)(-1));
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_set1_epi32 (__m512i __O, __mmask16 __M, int __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastd512_gpr_mask (__A, (__v16si) __O,
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_set1_epi32 (__mmask16 __M, int __A)
- {
- return (__m512i)
- __builtin_ia32_pbroadcastd512_gpr_mask (__A,
- (__v16si) _mm512_setzero_si512 (),
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcastq_epi64 (__m128i __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastq512 ((__v2di) __A,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcastq_epi64 (__m512i __O, __mmask8 __M, __m128i __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastq512 ((__v2di) __A,
- (__v8di) __O, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcastq_epi64 (__mmask8 __M, __m128i __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastq512 ((__v2di) __A,
- (__v8di)
- _mm512_setzero_si512 (),
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_set1_epi64 (long long __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastq512_gpr_mask (__A,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8)(-1));
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_set1_epi64 (__m512i __O, __mmask8 __M, long long __A)
- {
- return (__m512i) __builtin_ia32_pbroadcastq512_gpr_mask (__A, (__v8di) __O,
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_set1_epi64 (__mmask8 __M, long long __A)
- {
- return (__m512i)
- __builtin_ia32_pbroadcastq512_gpr_mask (__A,
- (__v8di) _mm512_setzero_si512 (),
- __M);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcast_f32x4 (__m128 __A)
- {
- return (__m512) __builtin_ia32_broadcastf32x4_512 ((__v4sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcast_f32x4 (__m512 __O, __mmask16 __M, __m128 __A)
- {
- return (__m512) __builtin_ia32_broadcastf32x4_512 ((__v4sf) __A,
- (__v16sf) __O,
- __M);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcast_f32x4 (__mmask16 __M, __m128 __A)
- {
- return (__m512) __builtin_ia32_broadcastf32x4_512 ((__v4sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcast_i32x4 (__m128i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti32x4_512 ((__v4si) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcast_i32x4 (__m512i __O, __mmask16 __M, __m128i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti32x4_512 ((__v4si) __A,
- (__v16si) __O,
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcast_i32x4 (__mmask16 __M, __m128i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti32x4_512 ((__v4si) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- __M);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcast_f64x4 (__m256d __A)
- {
- return (__m512d) __builtin_ia32_broadcastf64x4_512 ((__v4df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcast_f64x4 (__m512d __O, __mmask8 __M, __m256d __A)
- {
- return (__m512d) __builtin_ia32_broadcastf64x4_512 ((__v4df) __A,
- (__v8df) __O,
- __M);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcast_f64x4 (__mmask8 __M, __m256d __A)
- {
- return (__m512d) __builtin_ia32_broadcastf64x4_512 ((__v4df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_broadcast_i64x4 (__m256i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti64x4_512 ((__v4di) __A,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_broadcast_i64x4 (__m512i __O, __mmask8 __M, __m256i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti64x4_512 ((__v4di) __A,
- (__v8di) __O,
- __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_broadcast_i64x4 (__mmask8 __M, __m256i __A)
- {
- return (__m512i) __builtin_ia32_broadcasti64x4_512 ((__v4di) __A,
- (__v8di)
- _mm512_setzero_si512 (),
- __M);
- }
/* Selector constants, used as the selector parameter type of
   _mm512_shuffle_epi32 and its masked forms.

   Each name ends in four letters drawn from A..D.  Reading A=0, B=1,
   C=2, D=3, the letters spell a base-4 number whose leftmost letter is
   the most significant digit, e.g. _MM_PERM_DCBA == 0xE4.

   Layout: one row per leading three letters.  The first constant of a
   row carries the explicit value; the remaining three (last letter B,
   C, D) take the next consecutive values.  */
typedef enum
{
  _MM_PERM_AAAA = 0x00, _MM_PERM_AAAB, _MM_PERM_AAAC, _MM_PERM_AAAD,
  _MM_PERM_AABA = 0x04, _MM_PERM_AABB, _MM_PERM_AABC, _MM_PERM_AABD,
  _MM_PERM_AACA = 0x08, _MM_PERM_AACB, _MM_PERM_AACC, _MM_PERM_AACD,
  _MM_PERM_AADA = 0x0C, _MM_PERM_AADB, _MM_PERM_AADC, _MM_PERM_AADD,
  _MM_PERM_ABAA = 0x10, _MM_PERM_ABAB, _MM_PERM_ABAC, _MM_PERM_ABAD,
  _MM_PERM_ABBA = 0x14, _MM_PERM_ABBB, _MM_PERM_ABBC, _MM_PERM_ABBD,
  _MM_PERM_ABCA = 0x18, _MM_PERM_ABCB, _MM_PERM_ABCC, _MM_PERM_ABCD,
  _MM_PERM_ABDA = 0x1C, _MM_PERM_ABDB, _MM_PERM_ABDC, _MM_PERM_ABDD,
  _MM_PERM_ACAA = 0x20, _MM_PERM_ACAB, _MM_PERM_ACAC, _MM_PERM_ACAD,
  _MM_PERM_ACBA = 0x24, _MM_PERM_ACBB, _MM_PERM_ACBC, _MM_PERM_ACBD,
  _MM_PERM_ACCA = 0x28, _MM_PERM_ACCB, _MM_PERM_ACCC, _MM_PERM_ACCD,
  _MM_PERM_ACDA = 0x2C, _MM_PERM_ACDB, _MM_PERM_ACDC, _MM_PERM_ACDD,
  _MM_PERM_ADAA = 0x30, _MM_PERM_ADAB, _MM_PERM_ADAC, _MM_PERM_ADAD,
  _MM_PERM_ADBA = 0x34, _MM_PERM_ADBB, _MM_PERM_ADBC, _MM_PERM_ADBD,
  _MM_PERM_ADCA = 0x38, _MM_PERM_ADCB, _MM_PERM_ADCC, _MM_PERM_ADCD,
  _MM_PERM_ADDA = 0x3C, _MM_PERM_ADDB, _MM_PERM_ADDC, _MM_PERM_ADDD,
  _MM_PERM_BAAA = 0x40, _MM_PERM_BAAB, _MM_PERM_BAAC, _MM_PERM_BAAD,
  _MM_PERM_BABA = 0x44, _MM_PERM_BABB, _MM_PERM_BABC, _MM_PERM_BABD,
  _MM_PERM_BACA = 0x48, _MM_PERM_BACB, _MM_PERM_BACC, _MM_PERM_BACD,
  _MM_PERM_BADA = 0x4C, _MM_PERM_BADB, _MM_PERM_BADC, _MM_PERM_BADD,
  _MM_PERM_BBAA = 0x50, _MM_PERM_BBAB, _MM_PERM_BBAC, _MM_PERM_BBAD,
  _MM_PERM_BBBA = 0x54, _MM_PERM_BBBB, _MM_PERM_BBBC, _MM_PERM_BBBD,
  _MM_PERM_BBCA = 0x58, _MM_PERM_BBCB, _MM_PERM_BBCC, _MM_PERM_BBCD,
  _MM_PERM_BBDA = 0x5C, _MM_PERM_BBDB, _MM_PERM_BBDC, _MM_PERM_BBDD,
  _MM_PERM_BCAA = 0x60, _MM_PERM_BCAB, _MM_PERM_BCAC, _MM_PERM_BCAD,
  _MM_PERM_BCBA = 0x64, _MM_PERM_BCBB, _MM_PERM_BCBC, _MM_PERM_BCBD,
  _MM_PERM_BCCA = 0x68, _MM_PERM_BCCB, _MM_PERM_BCCC, _MM_PERM_BCCD,
  _MM_PERM_BCDA = 0x6C, _MM_PERM_BCDB, _MM_PERM_BCDC, _MM_PERM_BCDD,
  _MM_PERM_BDAA = 0x70, _MM_PERM_BDAB, _MM_PERM_BDAC, _MM_PERM_BDAD,
  _MM_PERM_BDBA = 0x74, _MM_PERM_BDBB, _MM_PERM_BDBC, _MM_PERM_BDBD,
  _MM_PERM_BDCA = 0x78, _MM_PERM_BDCB, _MM_PERM_BDCC, _MM_PERM_BDCD,
  _MM_PERM_BDDA = 0x7C, _MM_PERM_BDDB, _MM_PERM_BDDC, _MM_PERM_BDDD,
  _MM_PERM_CAAA = 0x80, _MM_PERM_CAAB, _MM_PERM_CAAC, _MM_PERM_CAAD,
  _MM_PERM_CABA = 0x84, _MM_PERM_CABB, _MM_PERM_CABC, _MM_PERM_CABD,
  _MM_PERM_CACA = 0x88, _MM_PERM_CACB, _MM_PERM_CACC, _MM_PERM_CACD,
  _MM_PERM_CADA = 0x8C, _MM_PERM_CADB, _MM_PERM_CADC, _MM_PERM_CADD,
  _MM_PERM_CBAA = 0x90, _MM_PERM_CBAB, _MM_PERM_CBAC, _MM_PERM_CBAD,
  _MM_PERM_CBBA = 0x94, _MM_PERM_CBBB, _MM_PERM_CBBC, _MM_PERM_CBBD,
  _MM_PERM_CBCA = 0x98, _MM_PERM_CBCB, _MM_PERM_CBCC, _MM_PERM_CBCD,
  _MM_PERM_CBDA = 0x9C, _MM_PERM_CBDB, _MM_PERM_CBDC, _MM_PERM_CBDD,
  _MM_PERM_CCAA = 0xA0, _MM_PERM_CCAB, _MM_PERM_CCAC, _MM_PERM_CCAD,
  _MM_PERM_CCBA = 0xA4, _MM_PERM_CCBB, _MM_PERM_CCBC, _MM_PERM_CCBD,
  _MM_PERM_CCCA = 0xA8, _MM_PERM_CCCB, _MM_PERM_CCCC, _MM_PERM_CCCD,
  _MM_PERM_CCDA = 0xAC, _MM_PERM_CCDB, _MM_PERM_CCDC, _MM_PERM_CCDD,
  _MM_PERM_CDAA = 0xB0, _MM_PERM_CDAB, _MM_PERM_CDAC, _MM_PERM_CDAD,
  _MM_PERM_CDBA = 0xB4, _MM_PERM_CDBB, _MM_PERM_CDBC, _MM_PERM_CDBD,
  _MM_PERM_CDCA = 0xB8, _MM_PERM_CDCB, _MM_PERM_CDCC, _MM_PERM_CDCD,
  _MM_PERM_CDDA = 0xBC, _MM_PERM_CDDB, _MM_PERM_CDDC, _MM_PERM_CDDD,
  _MM_PERM_DAAA = 0xC0, _MM_PERM_DAAB, _MM_PERM_DAAC, _MM_PERM_DAAD,
  _MM_PERM_DABA = 0xC4, _MM_PERM_DABB, _MM_PERM_DABC, _MM_PERM_DABD,
  _MM_PERM_DACA = 0xC8, _MM_PERM_DACB, _MM_PERM_DACC, _MM_PERM_DACD,
  _MM_PERM_DADA = 0xCC, _MM_PERM_DADB, _MM_PERM_DADC, _MM_PERM_DADD,
  _MM_PERM_DBAA = 0xD0, _MM_PERM_DBAB, _MM_PERM_DBAC, _MM_PERM_DBAD,
  _MM_PERM_DBBA = 0xD4, _MM_PERM_DBBB, _MM_PERM_DBBC, _MM_PERM_DBBD,
  _MM_PERM_DBCA = 0xD8, _MM_PERM_DBCB, _MM_PERM_DBCC, _MM_PERM_DBCD,
  _MM_PERM_DBDA = 0xDC, _MM_PERM_DBDB, _MM_PERM_DBDC, _MM_PERM_DBDD,
  _MM_PERM_DCAA = 0xE0, _MM_PERM_DCAB, _MM_PERM_DCAC, _MM_PERM_DCAD,
  _MM_PERM_DCBA = 0xE4, _MM_PERM_DCBB, _MM_PERM_DCBC, _MM_PERM_DCBD,
  _MM_PERM_DCCA = 0xE8, _MM_PERM_DCCB, _MM_PERM_DCCC, _MM_PERM_DCCD,
  _MM_PERM_DCDA = 0xEC, _MM_PERM_DCDB, _MM_PERM_DCDC, _MM_PERM_DCDD,
  _MM_PERM_DDAA = 0xF0, _MM_PERM_DDAB, _MM_PERM_DDAC, _MM_PERM_DDAD,
  _MM_PERM_DDBA = 0xF4, _MM_PERM_DDBB, _MM_PERM_DDBC, _MM_PERM_DDBD,
  _MM_PERM_DDCA = 0xF8, _MM_PERM_DDCB, _MM_PERM_DDCC, _MM_PERM_DDCD,
  _MM_PERM_DDDA = 0xFC, _MM_PERM_DDDB, _MM_PERM_DDDC, _MM_PERM_DDDD
} _MM_PERM_ENUM;
- #ifdef __OPTIMIZE__
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_epi32 (__m512i __A, _MM_PERM_ENUM __mask)
- {
- return (__m512i) __builtin_ia32_pshufd512_mask ((__v16si) __A,
- __mask,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
- _MM_PERM_ENUM __mask)
- {
- return (__m512i) __builtin_ia32_pshufd512_mask ((__v16si) __A,
- __mask,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_epi32 (__mmask16 __U, __m512i __A, _MM_PERM_ENUM __mask)
- {
- return (__m512i) __builtin_ia32_pshufd512_mask ((__v16si) __A,
- __mask,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_i64x2 (__m512i __A, __m512i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i64x2_mask ((__v8di) __A,
- (__v8di) __B, __imm,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_i64x2 (__m512i __W, __mmask8 __U, __m512i __A,
- __m512i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i64x2_mask ((__v8di) __A,
- (__v8di) __B, __imm,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_i64x2 (__mmask8 __U, __m512i __A, __m512i __B,
- const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i64x2_mask ((__v8di) __A,
- (__v8di) __B, __imm,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_i32x4 (__m512i __A, __m512i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i32x4_mask ((__v16si) __A,
- (__v16si) __B,
- __imm,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_i32x4 (__m512i __W, __mmask16 __U, __m512i __A,
- __m512i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i32x4_mask ((__v16si) __A,
- (__v16si) __B,
- __imm,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_i32x4 (__mmask16 __U, __m512i __A, __m512i __B,
- const int __imm)
- {
- return (__m512i) __builtin_ia32_shuf_i32x4_mask ((__v16si) __A,
- (__v16si) __B,
- __imm,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_f64x2 (__m512d __A, __m512d __B, const int __imm)
- {
- return (__m512d) __builtin_ia32_shuf_f64x2_mask ((__v8df) __A,
- (__v8df) __B, __imm,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_f64x2 (__m512d __W, __mmask8 __U, __m512d __A,
- __m512d __B, const int __imm)
- {
- return (__m512d) __builtin_ia32_shuf_f64x2_mask ((__v8df) __A,
- (__v8df) __B, __imm,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_f64x2 (__mmask8 __U, __m512d __A, __m512d __B,
- const int __imm)
- {
- return (__m512d) __builtin_ia32_shuf_f64x2_mask ((__v8df) __A,
- (__v8df) __B, __imm,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_f32x4 (__m512 __A, __m512 __B, const int __imm)
- {
- return (__m512) __builtin_ia32_shuf_f32x4_mask ((__v16sf) __A,
- (__v16sf) __B, __imm,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_f32x4 (__m512 __W, __mmask16 __U, __m512 __A,
- __m512 __B, const int __imm)
- {
- return (__m512) __builtin_ia32_shuf_f32x4_mask ((__v16sf) __A,
- (__v16sf) __B, __imm,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_f32x4 (__mmask16 __U, __m512 __A, __m512 __B,
- const int __imm)
- {
- return (__m512) __builtin_ia32_shuf_f32x4_mask ((__v16sf) __A,
- (__v16sf) __B, __imm,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- #else
/* Macro forms of the shuffle intrinsics, selected when __OPTIMIZE__ is
   not defined.  Each one expands to a single builtin call; operands are
   listed one per line in the builtin's argument order: source(s),
   selector, merge source, mask.  */

/* __builtin_ia32_pshufd512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_shuffle_epi32(X, C) \
  ((__m512i) __builtin_ia32_pshufd512_mask ( \
    (__v16si)(__m512i)(X), \
    (int)(C), \
    (__v16si)(__m512i) _mm512_undefined_epi32 (), \
    (__mmask16) -1))
#define _mm512_mask_shuffle_epi32(W, U, X, C) \
  ((__m512i) __builtin_ia32_pshufd512_mask ( \
    (__v16si)(__m512i)(X), \
    (int)(C), \
    (__v16si)(__m512i)(W), \
    (__mmask16)(U)))
#define _mm512_maskz_shuffle_epi32(U, X, C) \
  ((__m512i) __builtin_ia32_pshufd512_mask ( \
    (__v16si)(__m512i)(X), \
    (int)(C), \
    (__v16si)(__m512i) _mm512_setzero_si512 (), \
    (__mmask16)(U)))

/* __builtin_ia32_shuf_i64x2_mask: plain, merge-masked, zero-masked.  */
#define _mm512_shuffle_i64x2(X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i64x2_mask ( \
    (__v8di)(__m512i)(X), \
    (__v8di)(__m512i)(Y), \
    (int)(C), \
    (__v8di)(__m512i) _mm512_undefined_epi32 (), \
    (__mmask8) -1))
#define _mm512_mask_shuffle_i64x2(W, U, X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i64x2_mask ( \
    (__v8di)(__m512i)(X), \
    (__v8di)(__m512i)(Y), \
    (int)(C), \
    (__v8di)(__m512i)(W), \
    (__mmask8)(U)))
#define _mm512_maskz_shuffle_i64x2(U, X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i64x2_mask ( \
    (__v8di)(__m512i)(X), \
    (__v8di)(__m512i)(Y), \
    (int)(C), \
    (__v8di)(__m512i) _mm512_setzero_si512 (), \
    (__mmask8)(U)))

/* __builtin_ia32_shuf_i32x4_mask: plain, merge-masked, zero-masked.  */
#define _mm512_shuffle_i32x4(X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i32x4_mask ( \
    (__v16si)(__m512i)(X), \
    (__v16si)(__m512i)(Y), \
    (int)(C), \
    (__v16si)(__m512i) _mm512_undefined_epi32 (), \
    (__mmask16) -1))
#define _mm512_mask_shuffle_i32x4(W, U, X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i32x4_mask ( \
    (__v16si)(__m512i)(X), \
    (__v16si)(__m512i)(Y), \
    (int)(C), \
    (__v16si)(__m512i)(W), \
    (__mmask16)(U)))
#define _mm512_maskz_shuffle_i32x4(U, X, Y, C) \
  ((__m512i) __builtin_ia32_shuf_i32x4_mask ( \
    (__v16si)(__m512i)(X), \
    (__v16si)(__m512i)(Y), \
    (int)(C), \
    (__v16si)(__m512i) _mm512_setzero_si512 (), \
    (__mmask16)(U)))

/* __builtin_ia32_shuf_f64x2_mask: plain, merge-masked, zero-masked.  */
#define _mm512_shuffle_f64x2(X, Y, C) \
  ((__m512d) __builtin_ia32_shuf_f64x2_mask ( \
    (__v8df)(__m512d)(X), \
    (__v8df)(__m512d)(Y), \
    (int)(C), \
    (__v8df)(__m512d) _mm512_undefined_pd (), \
    (__mmask8) -1))
#define _mm512_mask_shuffle_f64x2(W, U, X, Y, C) \
  ((__m512d) __builtin_ia32_shuf_f64x2_mask ( \
    (__v8df)(__m512d)(X), \
    (__v8df)(__m512d)(Y), \
    (int)(C), \
    (__v8df)(__m512d)(W), \
    (__mmask8)(U)))
#define _mm512_maskz_shuffle_f64x2(U, X, Y, C) \
  ((__m512d) __builtin_ia32_shuf_f64x2_mask ( \
    (__v8df)(__m512d)(X), \
    (__v8df)(__m512d)(Y), \
    (int)(C), \
    (__v8df)(__m512d) _mm512_setzero_pd (), \
    (__mmask8)(U)))

/* __builtin_ia32_shuf_f32x4_mask: plain, merge-masked, zero-masked.  */
#define _mm512_shuffle_f32x4(X, Y, C) \
  ((__m512) __builtin_ia32_shuf_f32x4_mask ( \
    (__v16sf)(__m512)(X), \
    (__v16sf)(__m512)(Y), \
    (int)(C), \
    (__v16sf)(__m512) _mm512_undefined_ps (), \
    (__mmask16) -1))
#define _mm512_mask_shuffle_f32x4(W, U, X, Y, C) \
  ((__m512) __builtin_ia32_shuf_f32x4_mask ( \
    (__v16sf)(__m512)(X), \
    (__v16sf)(__m512)(Y), \
    (int)(C), \
    (__v16sf)(__m512)(W), \
    (__mmask16)(U)))
#define _mm512_maskz_shuffle_f32x4(U, X, Y, C) \
  ((__m512) __builtin_ia32_shuf_f32x4_mask ( \
    (__v16sf)(__m512)(X), \
    (__v16sf)(__m512)(Y), \
    (int)(C), \
    (__v16sf)(__m512) _mm512_setzero_ps (), \
    (__mmask16)(U)))
- #endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rolv_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rolv_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rolv_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rorv_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rorv_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rorv_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rolv_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rolv_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rolv_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prolvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rorv_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rorv_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rorv_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_prorvq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- #ifdef __OPTIMIZE__
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtt_roundpd_epi32 (__m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtt_roundpd_epi32 (__m256i __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtt_roundpd_epi32 (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtt_roundpd_epu32 (__m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtt_roundpd_epu32 (__m256i __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtt_roundpd_epu32 (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U, __R);
- }
- #else
/* Macro forms selected when __OPTIMIZE__ is not defined.  A is the
   source vector and B the trailing argument of the builtin; both are
   passed through exactly as written by the caller.  */

/* __builtin_ia32_cvttpd2dq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvtt_roundpd_epi32(A, B) \
  ((__m256i) __builtin_ia32_cvttpd2dq512_mask ( \
    A, (__v8si) _mm256_undefined_si256 (), -1, B))
#define _mm512_mask_cvtt_roundpd_epi32(W, U, A, B) \
  ((__m256i) __builtin_ia32_cvttpd2dq512_mask ( \
    A, (__v8si)(W), U, B))
#define _mm512_maskz_cvtt_roundpd_epi32(U, A, B) \
  ((__m256i) __builtin_ia32_cvttpd2dq512_mask ( \
    A, (__v8si) _mm256_setzero_si256 (), U, B))

/* __builtin_ia32_cvttpd2udq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvtt_roundpd_epu32(A, B) \
  ((__m256i) __builtin_ia32_cvttpd2udq512_mask ( \
    A, (__v8si) _mm256_undefined_si256 (), -1, B))
#define _mm512_mask_cvtt_roundpd_epu32(W, U, A, B) \
  ((__m256i) __builtin_ia32_cvttpd2udq512_mask ( \
    A, (__v8si)(W), U, B))
#define _mm512_maskz_cvtt_roundpd_epu32(U, A, B) \
  ((__m256i) __builtin_ia32_cvttpd2udq512_mask ( \
    A, (__v8si) _mm256_setzero_si256 (), U, B))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundpd_epi32 (__m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundpd_epi32 (__m256i __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundpd_epi32 (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundpd_epu32 (__m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundpd_epu32 (__m256i __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundpd_epu32 (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U, __R);
- }
- #else
/* Macro forms selected when __OPTIMIZE__ is not defined.  A is the
   source vector and B the trailing argument of the builtin; both are
   passed through exactly as written by the caller.  */

/* __builtin_ia32_cvtpd2dq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvt_roundpd_epi32(A, B) \
  ((__m256i) __builtin_ia32_cvtpd2dq512_mask ( \
    A, (__v8si) _mm256_undefined_si256 (), -1, B))
#define _mm512_mask_cvt_roundpd_epi32(W, U, A, B) \
  ((__m256i) __builtin_ia32_cvtpd2dq512_mask ( \
    A, (__v8si)(W), U, B))
#define _mm512_maskz_cvt_roundpd_epi32(U, A, B) \
  ((__m256i) __builtin_ia32_cvtpd2dq512_mask ( \
    A, (__v8si) _mm256_setzero_si256 (), U, B))

/* __builtin_ia32_cvtpd2udq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvt_roundpd_epu32(A, B) \
  ((__m256i) __builtin_ia32_cvtpd2udq512_mask ( \
    A, (__v8si) _mm256_undefined_si256 (), -1, B))
#define _mm512_mask_cvt_roundpd_epu32(W, U, A, B) \
  ((__m256i) __builtin_ia32_cvtpd2udq512_mask ( \
    A, (__v8si)(W), U, B))
#define _mm512_maskz_cvt_roundpd_epu32(U, A, B) \
  ((__m256i) __builtin_ia32_cvtpd2udq512_mask ( \
    A, (__v8si) _mm256_setzero_si256 (), U, B))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtt_roundps_epi32 (__m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtt_roundps_epi32 (__m512i __W, __mmask16 __U, __m512 __A,
- const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtt_roundps_epi32 (__mmask16 __U, __m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtt_roundps_epu32 (__m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtt_roundps_epu32 (__m512i __W, __mmask16 __U, __m512 __A,
- const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtt_roundps_epu32 (__mmask16 __U, __m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U, __R);
- }
- #else
/* Macro forms selected when __OPTIMIZE__ is not defined.  A is the
   source vector and B the trailing argument of the builtin; both are
   passed through exactly as written by the caller.  */

/* __builtin_ia32_cvttps2dq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvtt_roundps_epi32(A, B) \
  ((__m512i) __builtin_ia32_cvttps2dq512_mask ( \
    A, (__v16si) _mm512_undefined_epi32 (), -1, B))
#define _mm512_mask_cvtt_roundps_epi32(W, U, A, B) \
  ((__m512i) __builtin_ia32_cvttps2dq512_mask ( \
    A, (__v16si)(W), U, B))
#define _mm512_maskz_cvtt_roundps_epi32(U, A, B) \
  ((__m512i) __builtin_ia32_cvttps2dq512_mask ( \
    A, (__v16si) _mm512_setzero_si512 (), U, B))

/* __builtin_ia32_cvttps2udq512_mask: plain, merge-masked, zero-masked.  */
#define _mm512_cvtt_roundps_epu32(A, B) \
  ((__m512i) __builtin_ia32_cvttps2udq512_mask ( \
    A, (__v16si) _mm512_undefined_epi32 (), -1, B))
#define _mm512_mask_cvtt_roundps_epu32(W, U, A, B) \
  ((__m512i) __builtin_ia32_cvttps2udq512_mask ( \
    A, (__v16si)(W), U, B))
#define _mm512_maskz_cvtt_roundps_epu32(U, A, B) \
  ((__m512i) __builtin_ia32_cvttps2udq512_mask ( \
    A, (__v16si) _mm512_setzero_si512 (), U, B))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundps_epi32 (__m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundps_epi32 (__m512i __W, __mmask16 __U, __m512 __A,
- const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundps_epi32 (__mmask16 __U, __m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundps_epu32 (__m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundps_epu32 (__m512i __W, __mmask16 __U, __m512 __A,
- const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundps_epu32 (__mmask16 __U, __m512 __A, const int __R)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U, __R);
- }
- #else
/* Macro forms of the _mm512_{,mask_,maskz_}cvt_roundps_ep{i,u}32 wrappers,
   used when __OPTIMIZE__ is not defined.  Each expands to one call of the
   matching *_mask builtin.  */
#define _mm512_cvt_roundps_epi32(A, B) \
  ((__m512i) __builtin_ia32_cvtps2dq512_mask ( \
      A, (__v16si) _mm512_undefined_epi32 (), -1, B))
#define _mm512_mask_cvt_roundps_epi32(W, U, A, B) \
  ((__m512i) __builtin_ia32_cvtps2dq512_mask ( \
      A, (__v16si) (W), U, B))
#define _mm512_maskz_cvt_roundps_epi32(U, A, B) \
  ((__m512i) __builtin_ia32_cvtps2dq512_mask ( \
      A, (__v16si) _mm512_setzero_si512 (), U, B))
#define _mm512_cvt_roundps_epu32(A, B) \
  ((__m512i) __builtin_ia32_cvtps2udq512_mask ( \
      A, (__v16si) _mm512_undefined_epi32 (), -1, B))
#define _mm512_mask_cvt_roundps_epu32(W, U, A, B) \
  ((__m512i) __builtin_ia32_cvtps2udq512_mask ( \
      A, (__v16si) (W), U, B))
#define _mm512_maskz_cvt_roundps_epu32(U, A, B) \
  ((__m512i) __builtin_ia32_cvtps2udq512_mask ( \
      A, (__v16si) _mm512_setzero_si512 (), U, B))
- #endif
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtu32_sd (__m128d __A, unsigned __B)
- {
- return (__m128d) __builtin_ia32_cvtusi2sd32 ((__v2df) __A, __B);
- }
- #ifdef __x86_64__
- #ifdef __OPTIMIZE__
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundu64_sd (__m128d __A, unsigned long long __B, const int __R)
- {
- return (__m128d) __builtin_ia32_cvtusi2sd64 ((__v2df) __A, __B, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundi64_sd (__m128d __A, long long __B, const int __R)
- {
- return (__m128d) __builtin_ia32_cvtsi2sd64 ((__v2df) __A, __B, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsi64_sd (__m128d __A, long long __B, const int __R)
- {
- return (__m128d) __builtin_ia32_cvtsi2sd64 ((__v2df) __A, __B, __R);
- }
- #else
/* Macro forms of the 64-bit integer -> __m128d wrappers, used when
   __OPTIMIZE__ is not defined.  The whole expansion is parenthesized so
   that the leading cast cannot bind to a following postfix operator, and
   the vector operand gets the same (__v2df) cast the inline forms use.  */
#define _mm_cvt_roundu64_sd(A, B, C) \
  ((__m128d) __builtin_ia32_cvtusi2sd64 ((__v2df)(__m128d) (A), (B), (C)))
#define _mm_cvt_roundi64_sd(A, B, C) \
  ((__m128d) __builtin_ia32_cvtsi2sd64 ((__v2df)(__m128d) (A), (B), (C)))
#define _mm_cvt_roundsi64_sd(A, B, C) \
  ((__m128d) __builtin_ia32_cvtsi2sd64 ((__v2df)(__m128d) (A), (B), (C)))
- #endif
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundu32_ss (__m128 __A, unsigned __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtusi2ss32 ((__v4sf) __A, __B, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsi32_ss (__m128 __A, int __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtsi2ss32 ((__v4sf) __A, __B, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundi32_ss (__m128 __A, int __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtsi2ss32 ((__v4sf) __A, __B, __R);
- }
- #else
/* Macro forms of the 32-bit integer -> __m128 wrappers, used when
   __OPTIMIZE__ is not defined.  The whole expansion is parenthesized so
   that the leading cast cannot bind to a following postfix operator, and
   the vector operand gets the same (__v4sf) cast the inline forms use.  */
#define _mm_cvt_roundu32_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtusi2ss32 ((__v4sf)(__m128) (A), (B), (C)))
#define _mm_cvt_roundi32_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtsi2ss32 ((__v4sf)(__m128) (A), (B), (C)))
#define _mm_cvt_roundsi32_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtsi2ss32 ((__v4sf)(__m128) (A), (B), (C)))
- #endif
- #ifdef __x86_64__
- #ifdef __OPTIMIZE__
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundu64_ss (__m128 __A, unsigned long long __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtusi2ss64 ((__v4sf) __A, __B, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsi64_ss (__m128 __A, long long __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtsi2ss64 ((__v4sf) __A, __B, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundi64_ss (__m128 __A, long long __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtsi2ss64 ((__v4sf) __A, __B, __R);
- }
- #else
/* Macro forms of the 64-bit integer -> __m128 wrappers, used when
   __OPTIMIZE__ is not defined.  The whole expansion is parenthesized so
   that the leading cast cannot bind to a following postfix operator, and
   the vector operand gets the same (__v4sf) cast the inline forms use.  */
#define _mm_cvt_roundu64_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtusi2ss64 ((__v4sf)(__m128) (A), (B), (C)))
#define _mm_cvt_roundi64_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtsi2ss64 ((__v4sf)(__m128) (A), (B), (C)))
#define _mm_cvt_roundsi64_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtsi2ss64 ((__v4sf)(__m128) (A), (B), (C)))
- #endif
- #endif
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi32_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_storeu_epi8 (void * __P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovdb512mem_mask ((__v16qi *) __P, (__v16si) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_epi8 (__m128i __O, __mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovdb512_mask ((__v16si) __A,
- (__v16qi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi32_epi8 (__mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsepi32_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi32_storeu_epi8 (void * __P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovsdb512mem_mask ((__v16qi *) __P, (__v16si) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi32_epi8 (__m128i __O, __mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsdb512_mask ((__v16si) __A,
- (__v16qi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtsepi32_epi8 (__mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtusepi32_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi32_storeu_epi8 (void * __P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovusdb512mem_mask ((__v16qi *) __P, (__v16si) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi32_epi8 (__m128i __O, __mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusdb512_mask ((__v16si) __A,
- (__v16qi) __O,
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtusepi32_epi8 (__mmask16 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusdb512_mask ((__v16si) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi32_epi16 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_undefined_si256 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_storeu_epi16 (void * __P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovdw512mem_mask ((__v16hi *) __P, (__v16si) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_epi16 (__m256i __O, __mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovdw512_mask ((__v16si) __A,
- (__v16hi) __O, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi32_epi16 (__mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsepi32_epi16 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_undefined_si256 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi32_storeu_epi16 (void *__P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovsdw512mem_mask ((__v16hi*) __P, (__v16si) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi32_epi16 (__m256i __O, __mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsdw512_mask ((__v16si) __A,
- (__v16hi) __O, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtsepi32_epi16 (__mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtusepi32_epi16 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_undefined_si256 (),
- (__mmask16) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi32_storeu_epi16 (void *__P, __mmask16 __M, __m512i __A)
- {
- __builtin_ia32_pmovusdw512mem_mask ((__v16hi*) __P, (__v16si) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi32_epi16 (__m256i __O, __mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusdw512_mask ((__v16si) __A,
- (__v16hi) __O,
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtusepi32_epi16 (__mmask16 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusdw512_mask ((__v16si) __A,
- (__v16hi)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi64_epi32 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_storeu_epi32 (void* __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovqd512mem_mask ((__v8si *) __P, (__v8di) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_epi32 (__m256i __O, __mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovqd512_mask ((__v8di) __A,
- (__v8si) __O, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi64_epi32 (__mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsepi64_epi32 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_storeu_epi32 (void *__P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovsqd512mem_mask ((__v8si *) __P, (__v8di) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_epi32 (__m256i __O, __mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsqd512_mask ((__v8di) __A,
- (__v8si) __O, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtsepi64_epi32 (__mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovsqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtusepi64_epi32 (__m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_storeu_epi32 (void* __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovusqd512mem_mask ((__v8si*) __P, (__v8di) __A, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_epi32 (__m256i __O, __mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusqd512_mask ((__v8di) __A,
- (__v8si) __O, __M);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtusepi64_epi32 (__mmask8 __M, __m512i __A)
- {
- return (__m256i) __builtin_ia32_pmovusqd512_mask ((__v8di) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi64_epi16 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_storeu_epi16 (void *__P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovqw512mem_mask ((__v8hi *) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_epi16 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqw512_mask ((__v8di) __A,
- (__v8hi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi64_epi16 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsepi64_epi16 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_storeu_epi16 (void * __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovsqw512mem_mask ((__v8hi *) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_epi16 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqw512_mask ((__v8di) __A,
- (__v8hi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtsepi64_epi16 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtusepi64_epi16 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_storeu_epi16 (void *__P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovusqw512mem_mask ((__v8hi*) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_epi16 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqw512_mask ((__v8di) __A,
- (__v8hi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtusepi64_epi16 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqw512_mask ((__v8di) __A,
- (__v8hi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi64_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_storeu_epi8 (void * __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovqb512mem_mask ((__v16qi *) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi64_epi8 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqb512_mask ((__v8di) __A,
- (__v16qi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi64_epi8 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsepi64_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_storeu_epi8 (void * __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovsqb512mem_mask ((__v16qi *) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtsepi64_epi8 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqb512_mask ((__v8di) __A,
- (__v16qi) __O, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtsepi64_epi8 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovsqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtusepi64_epi8 (__m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_storeu_epi8 (void * __P, __mmask8 __M, __m512i __A)
- {
- __builtin_ia32_pmovusqb512mem_mask ((__v16qi *) __P, (__v8di) __A, __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtusepi64_epi8 (__m128i __O, __mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqb512_mask ((__v8di) __A,
- (__v16qi) __O,
- __M);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtusepi64_epi8 (__mmask8 __M, __m512i __A)
- {
- return (__m128i) __builtin_ia32_pmovusqb512_mask ((__v8di) __A,
- (__v16qi)
- _mm_setzero_si128 (),
- __M);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi32_pd (__m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtdq2pd512_mask ((__v8si) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_pd (__m512d __W, __mmask8 __U, __m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtdq2pd512_mask ((__v8si) __A,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi32_pd (__mmask8 __U, __m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtdq2pd512_mask ((__v8si) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu32_pd (__m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtudq2pd512_mask ((__v8si) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu32_pd (__m512d __W, __mmask8 __U, __m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtudq2pd512_mask ((__v8si) __A,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu32_pd (__mmask8 __U, __m256i __A)
- {
- return (__m512d) __builtin_ia32_cvtudq2pd512_mask ((__v8si) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- #ifdef __OPTIMIZE__
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundepi32_ps (__m512i __A, const int __R)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundepi32_ps (__m512 __W, __mmask16 __U, __m512i __A,
- const int __R)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundepi32_ps (__mmask16 __U, __m512i __A, const int __R)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundepu32_ps (__m512i __A, const int __R)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundepu32_ps (__m512 __W, __mmask16 __U, __m512i __A,
- const int __R)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundepu32_ps (__mmask16 __U, __m512i __A, const int __R)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U, __R);
- }
- #else
/* Macro forms of the _mm512_{,mask_,maskz_}cvt_roundep{i,u}32_ps wrappers,
   used when __OPTIMIZE__ is not defined.  Each expansion is wrapped in
   parentheses so the leading cast cannot bind to a following postfix
   operator, and W / U receive the same casts as in the inline forms.  */
#define _mm512_cvt_roundepi32_ps(A, B) \
  ((__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si)(A), \
      (__v16sf) _mm512_undefined_ps (), (__mmask16) -1, (B)))
#define _mm512_mask_cvt_roundepi32_ps(W, U, A, B) \
  ((__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si)(A), \
      (__v16sf)(__m512) (W), (__mmask16)(U), (B)))
#define _mm512_maskz_cvt_roundepi32_ps(U, A, B) \
  ((__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si)(A), \
      (__v16sf) _mm512_setzero_ps (), (__mmask16)(U), (B)))
#define _mm512_cvt_roundepu32_ps(A, B) \
  ((__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si)(A), \
      (__v16sf) _mm512_undefined_ps (), (__mmask16) -1, (B)))
#define _mm512_mask_cvt_roundepu32_ps(W, U, A, B) \
  ((__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si)(A), \
      (__v16sf)(__m512) (W), (__mmask16)(U), (B)))
#define _mm512_maskz_cvt_roundepu32_ps(U, A, B) \
  ((__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si)(A), \
      (__v16sf) _mm512_setzero_ps (), (__mmask16)(U), (B)))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m256d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_extractf64x4_pd (__m512d __A, const int __imm)
- {
- return (__m256d) __builtin_ia32_extractf64x4_mask ((__v8df) __A,
- __imm,
- (__v4df)
- _mm256_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m256d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_extractf64x4_pd (__m256d __W, __mmask8 __U, __m512d __A,
- const int __imm)
- {
- return (__m256d) __builtin_ia32_extractf64x4_mask ((__v8df) __A,
- __imm,
- (__v4df) __W,
- (__mmask8) __U);
- }
- extern __inline __m256d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_extractf64x4_pd (__mmask8 __U, __m512d __A, const int __imm)
- {
- return (__m256d) __builtin_ia32_extractf64x4_mask ((__v8df) __A,
- __imm,
- (__v4df)
- _mm256_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_extractf32x4_ps (__m512 __A, const int __imm)
- {
- return (__m128) __builtin_ia32_extractf32x4_mask ((__v16sf) __A,
- __imm,
- (__v4sf)
- _mm_undefined_ps (),
- (__mmask8) -1);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_extractf32x4_ps (__m128 __W, __mmask8 __U, __m512 __A,
- const int __imm)
- {
- return (__m128) __builtin_ia32_extractf32x4_mask ((__v16sf) __A,
- __imm,
- (__v4sf) __W,
- (__mmask8) __U);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_extractf32x4_ps (__mmask8 __U, __m512 __A, const int __imm)
- {
- return (__m128) __builtin_ia32_extractf32x4_mask ((__v16sf) __A,
- __imm,
- (__v4sf)
- _mm_setzero_ps (),
- (__mmask8) __U);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_extracti64x4_epi64 (__m512i __A, const int __imm)
- {
- return (__m256i) __builtin_ia32_extracti64x4_mask ((__v8di) __A,
- __imm,
- (__v4di)
- _mm256_undefined_si256 (),
- (__mmask8) -1);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_extracti64x4_epi64 (__m256i __W, __mmask8 __U, __m512i __A,
- const int __imm)
- {
- return (__m256i) __builtin_ia32_extracti64x4_mask ((__v8di) __A,
- __imm,
- (__v4di) __W,
- (__mmask8) __U);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_extracti64x4_epi64 (__mmask8 __U, __m512i __A, const int __imm)
- {
- return (__m256i) __builtin_ia32_extracti64x4_mask ((__v8di) __A,
- __imm,
- (__v4di)
- _mm256_setzero_si256 (),
- (__mmask8) __U);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_extracti32x4_epi32 (__m512i __A, const int __imm)
- {
- return (__m128i) __builtin_ia32_extracti32x4_mask ((__v16si) __A,
- __imm,
- (__v4si)
- _mm_undefined_si128 (),
- (__mmask8) -1);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_extracti32x4_epi32 (__m128i __W, __mmask8 __U, __m512i __A,
- const int __imm)
- {
- return (__m128i) __builtin_ia32_extracti32x4_mask ((__v16si) __A,
- __imm,
- (__v4si) __W,
- (__mmask8) __U);
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_extracti32x4_epi32 (__mmask8 __U, __m512i __A, const int __imm)
- {
- return (__m128i) __builtin_ia32_extracti32x4_mask ((__v16si) __A,
- __imm,
- (__v4si)
- _mm_setzero_si128 (),
- (__mmask8) __U);
- }
- #else
/* Macro forms of the _mm512_{,mask_,maskz_}extract{f,i}{64x4,32x4}
   wrappers, used when __OPTIMIZE__ is not defined.  Each expands to one
   call of the matching *_mask builtin: source X, immediate C, then the
   third operand and the mask.  */
#define _mm512_extractf64x4_pd(X, C) \
  ((__m256d) __builtin_ia32_extractf64x4_mask ( \
      (__v8df)(__m512d) (X), (int) (C), \
      (__v4df)(__m256d)_mm256_undefined_pd(), (__mmask8)-1))
#define _mm512_mask_extractf64x4_pd(W, U, X, C) \
  ((__m256d) __builtin_ia32_extractf64x4_mask ( \
      (__v8df)(__m512d) (X), (int) (C), \
      (__v4df)(__m256d)(W), (__mmask8)(U)))
#define _mm512_maskz_extractf64x4_pd(U, X, C) \
  ((__m256d) __builtin_ia32_extractf64x4_mask ( \
      (__v8df)(__m512d) (X), (int) (C), \
      (__v4df)(__m256d)_mm256_setzero_pd(), (__mmask8)(U)))
#define _mm512_extractf32x4_ps(X, C) \
  ((__m128) __builtin_ia32_extractf32x4_mask ( \
      (__v16sf)(__m512) (X), (int) (C), \
      (__v4sf)(__m128)_mm_undefined_ps(), (__mmask8)-1))
#define _mm512_mask_extractf32x4_ps(W, U, X, C) \
  ((__m128) __builtin_ia32_extractf32x4_mask ( \
      (__v16sf)(__m512) (X), (int) (C), \
      (__v4sf)(__m128)(W), (__mmask8)(U)))
#define _mm512_maskz_extractf32x4_ps(U, X, C) \
  ((__m128) __builtin_ia32_extractf32x4_mask ( \
      (__v16sf)(__m512) (X), (int) (C), \
      (__v4sf)(__m128)_mm_setzero_ps(), (__mmask8)(U)))
#define _mm512_extracti64x4_epi64(X, C) \
  ((__m256i) __builtin_ia32_extracti64x4_mask ( \
      (__v8di)(__m512i) (X), (int) (C), \
      (__v4di)(__m256i)_mm256_undefined_si256 (), (__mmask8)-1))
#define _mm512_mask_extracti64x4_epi64(W, U, X, C) \
  ((__m256i) __builtin_ia32_extracti64x4_mask ( \
      (__v8di)(__m512i) (X), (int) (C), \
      (__v4di)(__m256i)(W), (__mmask8)(U)))
#define _mm512_maskz_extracti64x4_epi64(U, X, C) \
  ((__m256i) __builtin_ia32_extracti64x4_mask ( \
      (__v8di)(__m512i) (X), (int) (C), \
      (__v4di)(__m256i)_mm256_setzero_si256 (), (__mmask8)(U)))
#define _mm512_extracti32x4_epi32(X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_mask ( \
      (__v16si)(__m512i) (X), (int) (C), \
      (__v4si)(__m128i)_mm_undefined_si128 (), (__mmask8)-1))
#define _mm512_mask_extracti32x4_epi32(W, U, X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_mask ( \
      (__v16si)(__m512i) (X), (int) (C), \
      (__v4si)(__m128i)(W), (__mmask8)(U)))
#define _mm512_maskz_extracti32x4_epi32(U, X, C) \
  ((__m128i) __builtin_ia32_extracti32x4_mask ( \
      (__v16si)(__m512i) (X), (int) (C), \
      (__v4si)(__m128i)_mm_setzero_si128 (), (__mmask8)(U)))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_inserti32x4 (__m512i __A, __m128i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_inserti32x4_mask ((__v16si) __A,
- (__v4si) __B,
- __imm,
- (__v16si) __A, -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_insertf32x4 (__m512 __A, __m128 __B, const int __imm)
- {
- return (__m512) __builtin_ia32_insertf32x4_mask ((__v16sf) __A,
- (__v4sf) __B,
- __imm,
- (__v16sf) __A, -1);
- }
/* Unmasked 64x4 integer insert: calls __builtin_ia32_inserti64x4_mask
   with __A, __B and __imm, an undefined fourth operand and an all-ones
   8-bit mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_inserti64x4 (__m512i __A, __m256i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_inserti64x4_mask ((__v8di) __A,
- (__v4di) __B,
- __imm,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
/* Merge-masked variant: same builtin, with __W as the fourth operand and
   __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_inserti64x4 (__m512i __W, __mmask8 __U, __m512i __A,
- __m256i __B, const int __imm)
- {
- return (__m512i) __builtin_ia32_inserti64x4_mask ((__v8di) __A,
- (__v4di) __B,
- __imm,
- (__v8di) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: same builtin, with an all-zero vector as the
   fourth operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_inserti64x4 (__mmask8 __U, __m512i __A, __m256i __B,
- const int __imm)
- {
- return (__m512i) __builtin_ia32_inserti64x4_mask ((__v8di) __A,
- (__v4di) __B,
- __imm,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
/* Unmasked 64x4 double-precision insert: calls
   __builtin_ia32_insertf64x4_mask with __A, __B and __imm, an undefined
   fourth operand and an all-ones 8-bit mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_insertf64x4 (__m512d __A, __m256d __B, const int __imm)
- {
- return (__m512d) __builtin_ia32_insertf64x4_mask ((__v8df) __A,
- (__v4df) __B,
- __imm,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the fourth operand, __U the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_insertf64x4 (__m512d __W, __mmask8 __U, __m512d __A,
- __m256d __B, const int __imm)
- {
- return (__m512d) __builtin_ia32_insertf64x4_mask ((__v8df) __A,
- (__v4df) __B,
- __imm,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: an all-zero vector is the fourth operand, __U the
   mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_insertf64x4 (__mmask8 __U, __m512d __A, __m256d __B,
- const int __imm)
- {
- return (__m512d) __builtin_ia32_insertf64x4_mask ((__v8df) __A,
- (__v4df) __B,
- __imm,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- #else
/* Macro fallbacks (used when __OPTIMIZE__ is not defined) for the
   unmasked 32x4 inserts.  X is expanded twice: once as the source and
   once as the fourth builtin operand, so an argument with side effects
   would be evaluated twice.  The mask is an all-ones __mmask16.  */
- #define _mm512_insertf32x4(X, Y, C) \
- ((__m512) __builtin_ia32_insertf32x4_mask ((__v16sf)(__m512) (X), \
- (__v4sf)(__m128) (Y), (int) (C), (__v16sf)(__m512) (X), (__mmask16)(-1)))
- #define _mm512_inserti32x4(X, Y, C) \
- ((__m512i) __builtin_ia32_inserti32x4_mask ((__v16si)(__m512i) (X), \
- (__v4si)(__m128i) (Y), (int) (C), (__v16si)(__m512i) (X), (__mmask16)(-1)))
/* Macro fallbacks for the 64x4 double-precision insert family, all built
   on __builtin_ia32_insertf64x4_mask (X, Y, C, fourth operand, mask):
   plain   -> undefined vector, all-ones mask;
   mask_   -> W, mask U;
   maskz_  -> zero vector, mask U.  */
- #define _mm512_insertf64x4(X, Y, C) \
- ((__m512d) __builtin_ia32_insertf64x4_mask ((__v8df)(__m512d) (X), \
- (__v4df)(__m256d) (Y), (int) (C), \
- (__v8df)(__m512d)_mm512_undefined_pd(), \
- (__mmask8)-1))
- #define _mm512_mask_insertf64x4(W, U, X, Y, C) \
- ((__m512d) __builtin_ia32_insertf64x4_mask ((__v8df)(__m512d) (X), \
- (__v4df)(__m256d) (Y), (int) (C), \
- (__v8df)(__m512d)(W), \
- (__mmask8)(U)))
- #define _mm512_maskz_insertf64x4(U, X, Y, C) \
- ((__m512d) __builtin_ia32_insertf64x4_mask ((__v8df)(__m512d) (X), \
- (__v4df)(__m256d) (Y), (int) (C), \
- (__v8df)(__m512d)_mm512_setzero_pd(), \
- (__mmask8)(U)))
/* Macro fallbacks for the 64x4 integer insert family, all built on
   __builtin_ia32_inserti64x4_mask (X, Y, C, fourth operand, mask):
   plain   -> undefined vector, all-ones mask;
   mask_   -> W, mask U;
   maskz_  -> zero vector, mask U.  */
- #define _mm512_inserti64x4(X, Y, C) \
- ((__m512i) __builtin_ia32_inserti64x4_mask ((__v8di)(__m512i) (X), \
- (__v4di)(__m256i) (Y), (int) (C), \
- (__v8di)(__m512i)_mm512_undefined_epi32 (), \
- (__mmask8)-1))
- #define _mm512_mask_inserti64x4(W, U, X, Y, C) \
- ((__m512i) __builtin_ia32_inserti64x4_mask ((__v8di)(__m512i) (X), \
- (__v4di)(__m256i) (Y), (int) (C),\
- (__v8di)(__m512i)(W),\
- (__mmask8)(U)))
- #define _mm512_maskz_inserti64x4(U, X, Y, C) \
- ((__m512i) __builtin_ia32_inserti64x4_mask ((__v8di)(__m512i) (X), \
- (__v4di)(__m256i) (Y), (int) (C), \
- (__v8di)(__m512i)_mm512_setzero_si512 (), \
- (__mmask8)(U)))
- #endif
/* Load a __m512d from __P by dereferencing it through the __m512d_u
   pointer type (presumably the unaligned, may-alias variant of __m512d
   -- its typedef is outside this excerpt).  The pointer is only read,
   so the cast keeps the const qualifier of __P instead of dropping it.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_loadu_pd (void const *__P)
- {
- return *(const __m512d_u *) __P;
- }
/* Merge-masked load of doubles: forwards __P (as const double *), __W
   and __U to __builtin_ia32_loadupd512_mask.  __W is presumably the
   source for elements whose mask bit is clear.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_loadu_pd (__m512d __W, __mmask8 __U, void const *__P)
- {
- return (__m512d) __builtin_ia32_loadupd512_mask ((const double *) __P,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked load of doubles: same builtin with an all-zero vector in
   place of __W.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_loadu_pd (__mmask8 __U, void const *__P)
- {
- return (__m512d) __builtin_ia32_loadupd512_mask ((const double *) __P,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
/* Store __A to __P by assigning through a __m512d_u pointer (presumably
   the unaligned vector type; its typedef is outside this excerpt).  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_storeu_pd (void *__P, __m512d __A)
- {
- *(__m512d_u *)__P = __A;
- }
/* Masked store of doubles: forwards __P (as double *), __A and __U to
   __builtin_ia32_storeupd512_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_storeu_pd (void *__P, __mmask8 __U, __m512d __A)
- {
- __builtin_ia32_storeupd512_mask ((double *) __P, (__v8df) __A,
- (__mmask8) __U);
- }
/* Load a __m512 from __P by dereferencing it through the __m512_u
   pointer type (presumably the unaligned, may-alias variant of __m512
   -- its typedef is outside this excerpt).  The pointer is only read,
   so the cast keeps the const qualifier of __P instead of dropping it.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_loadu_ps (void const *__P)
- {
- return *(const __m512_u *) __P;
- }
/* Merge-masked load of floats: forwards __P (as const float *), __W and
   the 16-bit mask __U to __builtin_ia32_loadups512_mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_loadu_ps (__m512 __W, __mmask16 __U, void const *__P)
- {
- return (__m512) __builtin_ia32_loadups512_mask ((const float *) __P,
- (__v16sf) __W,
- (__mmask16) __U);
- }
/* Zero-masked load of floats: same builtin with an all-zero vector in
   place of __W.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_loadu_ps (__mmask16 __U, void const *__P)
- {
- return (__m512) __builtin_ia32_loadups512_mask ((const float *) __P,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
/* Store __A to __P by assigning through a __m512_u pointer (presumably
   the unaligned vector type; its typedef is outside this excerpt).  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_storeu_ps (void *__P, __m512 __A)
- {
- *(__m512_u *)__P = __A;
- }
/* Masked store of floats: forwards __P (as float *), __A and __U to
   __builtin_ia32_storeups512_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_storeu_ps (void *__P, __mmask16 __U, __m512 __A)
- {
- __builtin_ia32_storeups512_mask ((float *) __P, (__v16sf) __A,
- (__mmask16) __U);
- }
/* Merge-masked scalar float load: forwards __P, __W and __U to
   __builtin_ia32_loadss_mask.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_load_ss (__m128 __W, __mmask8 __U, const float *__P)
- {
- return (__m128) __builtin_ia32_loadss_mask (__P, (__v4sf) __W, __U);
- }
/* Zero-masked scalar float load: same builtin with a zero vector in
   place of __W.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_load_ss (__mmask8 __U, const float *__P)
- {
- return (__m128) __builtin_ia32_loadss_mask (__P, (__v4sf) _mm_setzero_ps (),
- __U);
- }
/* Merge-masked scalar double load: forwards __P, __W and __U to
   __builtin_ia32_loadsd_mask.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_load_sd (__m128d __W, __mmask8 __U, const double *__P)
- {
- return (__m128d) __builtin_ia32_loadsd_mask (__P, (__v2df) __W, __U);
- }
/* Zero-masked scalar double load: same builtin with a zero vector in
   place of __W.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_load_sd (__mmask8 __U, const double *__P)
- {
- return (__m128d) __builtin_ia32_loadsd_mask (__P, (__v2df) _mm_setzero_pd (),
- __U);
- }
/* Merge-masked scalar float move: forwards __A, __B, __W and __U, in
   that order, to __builtin_ia32_movess_mask.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_move_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- return (__m128) __builtin_ia32_movess_mask ((__v4sf) __A, (__v4sf) __B,
- (__v4sf) __W, __U);
- }
/* Zero-masked scalar float move: same builtin with a zero vector in
   place of __W.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_move_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- return (__m128) __builtin_ia32_movess_mask ((__v4sf) __A, (__v4sf) __B,
- (__v4sf) _mm_setzero_ps (), __U);
- }
/* Merge-masked scalar double move: forwards __A, __B, __W and __U, in
   that order, to __builtin_ia32_movesd_mask.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_move_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_movesd_mask ((__v2df) __A, (__v2df) __B,
- (__v2df) __W, __U);
- }
/* Zero-masked scalar double move: same builtin with a zero vector in
   place of __W.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_move_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- return (__m128d) __builtin_ia32_movesd_mask ((__v2df) __A, (__v2df) __B,
- (__v2df) _mm_setzero_pd (),
- __U);
- }
/* Masked scalar float store: forwards __P, __A and __U to
   __builtin_ia32_storess_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_store_ss (float *__P, __mmask8 __U, __m128 __A)
- {
- __builtin_ia32_storess_mask (__P, (__v4sf) __A, (__mmask8) __U);
- }
/* Masked scalar double store: forwards __P, __A and __U to
   __builtin_ia32_storesd_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_store_sd (double *__P, __mmask8 __U, __m128d __A)
- {
- __builtin_ia32_storesd_mask (__P, (__v2df) __A, (__mmask8) __U);
- }
/* Merge-masked load of 64-bit integers: forwards __P (as const long
   long *), __W and __U to __builtin_ia32_loaddqudi512_mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_loadu_epi64 (__m512i __W, __mmask8 __U, void const *__P)
- {
- return (__m512i) __builtin_ia32_loaddqudi512_mask ((const long long *) __P,
- (__v8di) __W,
- (__mmask8) __U);
- }
/* Zero-masked load of 64-bit integers: same builtin with a zero vector
   in place of __W.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_loadu_epi64 (__mmask8 __U, void const *__P)
- {
- return (__m512i) __builtin_ia32_loaddqudi512_mask ((const long long *) __P,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
/* Masked store of 64-bit integers: forwards __P (as long long *), __A
   and __U to __builtin_ia32_storedqudi512_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_storeu_epi64 (void *__P, __mmask8 __U, __m512i __A)
- {
- __builtin_ia32_storedqudi512_mask ((long long *) __P, (__v8di) __A,
- (__mmask8) __U);
- }
/* Load a __m512i from __P by dereferencing it through the __m512i_u
   pointer type (presumably the unaligned, may-alias variant of __m512i
   -- its typedef is outside this excerpt).  The pointer is only read,
   so the cast keeps the const qualifier of __P instead of dropping it.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_loadu_si512 (void const *__P)
- {
- return *(const __m512i_u *) __P;
- }
/* Merge-masked load of 32-bit integers: forwards __P (as const int *),
   __W and the 16-bit mask __U to __builtin_ia32_loaddqusi512_mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_loadu_epi32 (__m512i __W, __mmask16 __U, void const *__P)
- {
- return (__m512i) __builtin_ia32_loaddqusi512_mask ((const int *) __P,
- (__v16si) __W,
- (__mmask16) __U);
- }
/* Zero-masked load of 32-bit integers: same builtin with a zero vector
   in place of __W.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_loadu_epi32 (__mmask16 __U, void const *__P)
- {
- return (__m512i) __builtin_ia32_loaddqusi512_mask ((const int *) __P,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
/* Store __A to __P by assigning through a __m512i_u pointer (presumably
   the unaligned vector type; its typedef is outside this excerpt).  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_storeu_si512 (void *__P, __m512i __A)
- {
- *(__m512i_u *)__P = __A;
- }
/* Masked store of 32-bit integers: forwards __P (as int *), __A and __U
   to __builtin_ia32_storedqusi512_mask.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_storeu_epi32 (void *__P, __mmask16 __U, __m512i __A)
- {
- __builtin_ia32_storedqusi512_mask ((int *) __P, (__v16si) __A,
- (__mmask16) __U);
- }
/* Unmasked variable permute of doubles: passes __A and the integer
   vector __C (presumably the per-element control) to
   __builtin_ia32_vpermilvarpd512_mask with an undefined third operand
   and an all-ones mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutevar_pd (__m512d __A, __m512i __C)
- {
- return (__m512d) __builtin_ia32_vpermilvarpd512_mask ((__v8df) __A,
- (__v8di) __C,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutevar_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512i __C)
- {
- return (__m512d) __builtin_ia32_vpermilvarpd512_mask ((__v8df) __A,
- (__v8di) __C,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutevar_pd (__mmask8 __U, __m512d __A, __m512i __C)
- {
- return (__m512d) __builtin_ia32_vpermilvarpd512_mask ((__v8df) __A,
- (__v8di) __C,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
/* Unmasked variable permute of floats: passes __A and the integer
   vector __C (presumably the per-element control) to
   __builtin_ia32_vpermilvarps512_mask with an undefined third operand
   and an all-ones 16-bit mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutevar_ps (__m512 __A, __m512i __C)
- {
- return (__m512) __builtin_ia32_vpermilvarps512_mask ((__v16sf) __A,
- (__v16si) __C,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutevar_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512i __C)
- {
- return (__m512) __builtin_ia32_vpermilvarps512_mask ((__v16sf) __A,
- (__v16si) __C,
- (__v16sf) __W,
- (__mmask16) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutevar_ps (__mmask16 __U, __m512 __A, __m512i __C)
- {
- return (__m512) __builtin_ia32_vpermilvarps512_mask ((__v16sf) __A,
- (__v16si) __C,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
/* Two-source permute of 64-bit integers, unmasked.  Note the operand
   order handed to __builtin_ia32_vpermt2varq512_mask: the index vector
   __I comes first, followed by __A and __B, with an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex2var_epi64 (__m512i __A, __m512i __I, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2varq512_mask ((__v8di) __I
- /* idx */ ,
- (__v8di) __A,
- (__v8di) __B,
- (__mmask8) -1);
- }
/* Masked variant using the same vpermt2var builtin (index first) with
   mask __U.  No separate pass-through vector is supplied.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex2var_epi64 (__m512i __A, __mmask8 __U, __m512i __I,
- __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2varq512_mask ((__v8di) __I
- /* idx */ ,
- (__v8di) __A,
- (__v8di) __B,
- (__mmask8) __U);
- }
/* mask2 variant: uses the vpermi2var builtin instead, which takes __A
   first and the index __I second.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask2_permutex2var_epi64 (__m512i __A, __m512i __I,
- __mmask8 __U, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermi2varq512_mask ((__v8di) __A,
- (__v8di) __I
- /* idx */ ,
- (__v8di) __B,
- (__mmask8) __U);
- }
/* Zero-masked variant: calls the _maskz flavour of the vpermt2var
   builtin (index first) with mask __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex2var_epi64 (__mmask8 __U, __m512i __A,
- __m512i __I, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2varq512_maskz ((__v8di) __I
- /* idx */ ,
- (__v8di) __A,
- (__v8di) __B,
- (__mmask8) __U);
- }
/* Two-source permute of 32-bit integers, unmasked.  The index vector
   __I is passed first to __builtin_ia32_vpermt2vard512_mask, followed by
   __A and __B, with an all-ones 16-bit mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex2var_epi32 (__m512i __A, __m512i __I, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2vard512_mask ((__v16si) __I
- /* idx */ ,
- (__v16si) __A,
- (__v16si) __B,
- (__mmask16) -1);
- }
/* Masked variant using the same vpermt2var builtin (index first) with
   mask __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex2var_epi32 (__m512i __A, __mmask16 __U,
- __m512i __I, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2vard512_mask ((__v16si) __I
- /* idx */ ,
- (__v16si) __A,
- (__v16si) __B,
- (__mmask16) __U);
- }
/* mask2 variant: uses the vpermi2var builtin, which takes __A first and
   the index __I second.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask2_permutex2var_epi32 (__m512i __A, __m512i __I,
- __mmask16 __U, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermi2vard512_mask ((__v16si) __A,
- (__v16si) __I
- /* idx */ ,
- (__v16si) __B,
- (__mmask16) __U);
- }
/* Zero-masked variant: calls the _maskz flavour of the vpermt2var
   builtin (index first) with mask __U.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex2var_epi32 (__mmask16 __U, __m512i __A,
- __m512i __I, __m512i __B)
- {
- return (__m512i) __builtin_ia32_vpermt2vard512_maskz ((__v16si) __I
- /* idx */ ,
- (__v16si) __A,
- (__v16si) __B,
- (__mmask16) __U);
- }
/* Two-source permute of doubles, unmasked.  The integer index vector
   __I is passed first to __builtin_ia32_vpermt2varpd512_mask, followed
   by __A and __B, with an all-ones mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex2var_pd (__m512d __A, __m512i __I, __m512d __B)
- {
- return (__m512d) __builtin_ia32_vpermt2varpd512_mask ((__v8di) __I
- /* idx */ ,
- (__v8df) __A,
- (__v8df) __B,
- (__mmask8) -1);
- }
/* Masked variant using the same vpermt2var builtin (index first) with
   mask __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex2var_pd (__m512d __A, __mmask8 __U, __m512i __I,
- __m512d __B)
- {
- return (__m512d) __builtin_ia32_vpermt2varpd512_mask ((__v8di) __I
- /* idx */ ,
- (__v8df) __A,
- (__v8df) __B,
- (__mmask8) __U);
- }
/* mask2 variant: uses the vpermi2var builtin, which takes __A first and
   the index __I second.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask2_permutex2var_pd (__m512d __A, __m512i __I, __mmask8 __U,
- __m512d __B)
- {
- return (__m512d) __builtin_ia32_vpermi2varpd512_mask ((__v8df) __A,
- (__v8di) __I
- /* idx */ ,
- (__v8df) __B,
- (__mmask8) __U);
- }
/* Zero-masked variant: calls the _maskz flavour of the vpermt2var
   builtin (index first) with mask __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex2var_pd (__mmask8 __U, __m512d __A, __m512i __I,
- __m512d __B)
- {
- return (__m512d) __builtin_ia32_vpermt2varpd512_maskz ((__v8di) __I
- /* idx */ ,
- (__v8df) __A,
- (__v8df) __B,
- (__mmask8) __U);
- }
/* Two-source permute of floats, unmasked.  The integer index vector __I
   is passed first to __builtin_ia32_vpermt2varps512_mask, followed by
   __A and __B, with an all-ones 16-bit mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex2var_ps (__m512 __A, __m512i __I, __m512 __B)
- {
- return (__m512) __builtin_ia32_vpermt2varps512_mask ((__v16si) __I
- /* idx */ ,
- (__v16sf) __A,
- (__v16sf) __B,
- (__mmask16) -1);
- }
/* Masked variant using the same vpermt2var builtin (index first) with
   mask __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex2var_ps (__m512 __A, __mmask16 __U, __m512i __I, __m512 __B)
- {
- return (__m512) __builtin_ia32_vpermt2varps512_mask ((__v16si) __I
- /* idx */ ,
- (__v16sf) __A,
- (__v16sf) __B,
- (__mmask16) __U);
- }
/* mask2 variant: uses the vpermi2var builtin, which takes __A first and
   the index __I second.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask2_permutex2var_ps (__m512 __A, __m512i __I, __mmask16 __U,
- __m512 __B)
- {
- return (__m512) __builtin_ia32_vpermi2varps512_mask ((__v16sf) __A,
- (__v16si) __I
- /* idx */ ,
- (__v16sf) __B,
- (__mmask16) __U);
- }
/* Zero-masked variant: calls the _maskz flavour of the vpermt2var
   builtin (index first) with mask __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex2var_ps (__mmask16 __U, __m512 __A, __m512i __I,
- __m512 __B)
- {
- return (__m512) __builtin_ia32_vpermt2varps512_maskz ((__v16si) __I
- /* idx */ ,
- (__v16sf) __A,
- (__v16sf) __B,
- (__mmask16) __U);
- }
- #ifdef __OPTIMIZE__
/* Immediate-controlled permute of doubles, unmasked: passes __X and the
   immediate __C to __builtin_ia32_vpermilpd512_mask with an undefined
   third operand and an all-ones mask.  This inline form is only
   compiled when __OPTIMIZE__ is defined.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permute_pd (__m512d __X, const int __C)
- {
- return (__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df) __X, __C,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permute_pd (__m512d __W, __mmask8 __U, __m512d __X, const int __C)
- {
- return (__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df) __X, __C,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permute_pd (__mmask8 __U, __m512d __X, const int __C)
- {
- return (__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df) __X, __C,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
/* Immediate-controlled permute of floats, unmasked: passes __X and the
   immediate __C to __builtin_ia32_vpermilps512_mask with an undefined
   third operand and an all-ones 16-bit mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permute_ps (__m512 __X, const int __C)
- {
- return (__m512) __builtin_ia32_vpermilps512_mask ((__v16sf) __X, __C,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permute_ps (__m512 __W, __mmask16 __U, __m512 __X, const int __C)
- {
- return (__m512) __builtin_ia32_vpermilps512_mask ((__v16sf) __X, __C,
- (__v16sf) __W,
- (__mmask16) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permute_ps (__mmask16 __U, __m512 __X, const int __C)
- {
- return (__m512) __builtin_ia32_vpermilps512_mask ((__v16sf) __X, __C,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- #else
/* Macro fallbacks (no __OPTIMIZE__) for the immediate permute of
   doubles.  Each expands to __builtin_ia32_vpermilpd512_mask (X, C,
   third operand, mask): undefined / W / zero vector respectively, with
   an all-ones mask for the plain form and U otherwise.  */
- #define _mm512_permute_pd(X, C) \
- ((__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df)(__m512d)(X), (int)(C), \
- (__v8df)(__m512d)_mm512_undefined_pd(),\
- (__mmask8)(-1)))
- #define _mm512_mask_permute_pd(W, U, X, C) \
- ((__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df)(__m512d)(X), (int)(C), \
- (__v8df)(__m512d)(W), \
- (__mmask8)(U)))
- #define _mm512_maskz_permute_pd(U, X, C) \
- ((__m512d) __builtin_ia32_vpermilpd512_mask ((__v8df)(__m512d)(X), (int)(C), \
- (__v8df)(__m512d)_mm512_setzero_pd(), \
- (__mmask8)(U)))
/* Macro fallbacks (no __OPTIMIZE__) for the immediate permute of floats.
   Each expands to __builtin_ia32_vpermilps512_mask (X, C, third operand,
   mask): undefined / W / zero vector respectively, with an all-ones
   16-bit mask for the plain form and U otherwise.  */
- #define _mm512_permute_ps(X, C) \
- ((__m512) __builtin_ia32_vpermilps512_mask ((__v16sf)(__m512)(X), (int)(C), \
- (__v16sf)(__m512)_mm512_undefined_ps(),\
- (__mmask16)(-1)))
- #define _mm512_mask_permute_ps(W, U, X, C) \
- ((__m512) __builtin_ia32_vpermilps512_mask ((__v16sf)(__m512)(X), (int)(C), \
- (__v16sf)(__m512)(W), \
- (__mmask16)(U)))
- #define _mm512_maskz_permute_ps(U, X, C) \
- ((__m512) __builtin_ia32_vpermilps512_mask ((__v16sf)(__m512)(X), (int)(C), \
- (__v16sf)(__m512)_mm512_setzero_ps(), \
- (__mmask16)(U)))
- #endif
- #ifdef __OPTIMIZE__
/* Immediate-controlled permutex of 64-bit integers, unmasked: passes
   __X and the immediate __I to __builtin_ia32_permdi512_mask with an
   undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex_epi64 (__m512i __X, const int __I)
- {
- return (__m512i) __builtin_ia32_permdi512_mask ((__v8di) __X, __I,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) (-1));
- }
/* Merge-masked variant: __W is the third operand, __M the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex_epi64 (__m512i __W, __mmask8 __M,
- __m512i __X, const int __I)
- {
- return (__m512i) __builtin_ia32_permdi512_mask ((__v8di) __X, __I,
- (__v8di) __W,
- (__mmask8) __M);
- }
/* Zero-masked variant: a zero vector is the third operand, __M the
   mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex_epi64 (__mmask8 __M, __m512i __X, const int __I)
- {
- return (__m512i) __builtin_ia32_permdi512_mask ((__v8di) __X, __I,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __M);
- }
/* Immediate-controlled permutex of doubles, unmasked.  Here __M is the
   integer immediate (not a mask); it is passed with __X to
   __builtin_ia32_permdf512_mask together with an undefined third
   operand and an all-ones mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutex_pd (__m512d __X, const int __M)
- {
- return (__m512d) __builtin_ia32_permdf512_mask ((__v8df) __X, __M,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask, __M the
   immediate.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutex_pd (__m512d __W, __mmask8 __U, __m512d __X, const int __M)
- {
- return (__m512d) __builtin_ia32_permdf512_mask ((__v8df) __X, __M,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask, __M the immediate.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutex_pd (__mmask8 __U, __m512d __X, const int __M)
- {
- return (__m512d) __builtin_ia32_permdf512_mask ((__v8df) __X, __M,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- #else
/* Macro fallbacks (no __OPTIMIZE__) for permutex on doubles.  M is the
   integer immediate.  Each expands to __builtin_ia32_permdf512_mask
   (X, M, third operand, mask): undefined / W / zero vector, with an
   all-ones mask for the plain form and U otherwise.  */
- #define _mm512_permutex_pd(X, M) \
- ((__m512d) __builtin_ia32_permdf512_mask ((__v8df)(__m512d)(X), (int)(M), \
- (__v8df)(__m512d)_mm512_undefined_pd(),\
- (__mmask8)-1))
- #define _mm512_mask_permutex_pd(W, U, X, M) \
- ((__m512d) __builtin_ia32_permdf512_mask ((__v8df)(__m512d)(X), (int)(M), \
- (__v8df)(__m512d)(W), (__mmask8)(U)))
- #define _mm512_maskz_permutex_pd(U, X, M) \
- ((__m512d) __builtin_ia32_permdf512_mask ((__v8df)(__m512d)(X), (int)(M), \
- (__v8df)(__m512d)_mm512_setzero_pd(),\
- (__mmask8)(U)))
/* Macro fallbacks (no __OPTIMIZE__) for permutex on 64-bit integers.
   I is the integer immediate and M the mask.  Each expands to
   __builtin_ia32_permdi512_mask (X, I, third operand, mask): undefined
   vector with all-ones mask, zero vector with M, or W with M.  */
- #define _mm512_permutex_epi64(X, I) \
- ((__m512i) __builtin_ia32_permdi512_mask ((__v8di)(__m512i)(X), \
- (int)(I), \
- (__v8di)(__m512i) \
- (_mm512_undefined_epi32 ()),\
- (__mmask8)(-1)))
- #define _mm512_maskz_permutex_epi64(M, X, I) \
- ((__m512i) __builtin_ia32_permdi512_mask ((__v8di)(__m512i)(X), \
- (int)(I), \
- (__v8di)(__m512i) \
- (_mm512_setzero_si512 ()),\
- (__mmask8)(M)))
- #define _mm512_mask_permutex_epi64(W, M, X, I) \
- ((__m512i) __builtin_ia32_permdi512_mask ((__v8di)(__m512i)(X), \
- (int)(I), \
- (__v8di)(__m512i)(W), \
- (__mmask8)(M)))
- #endif
/* Zero-masked variable permutex of 64-bit integers.  Note the swap when
   calling __builtin_ia32_permvardi512_mask: __Y is passed first and __X
   second (presumably data then index -- confirm against the builtin).
   A zero vector is the third operand and __M the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutexvar_epi64 (__mmask8 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvardi512_mask ((__v8di) __Y,
- (__v8di) __X,
- (__v8di)
- _mm512_setzero_si512 (),
- __M);
- }
/* Unmasked variant: same operand order, undefined third operand,
   all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutexvar_epi64 (__m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvardi512_mask ((__v8di) __Y,
- (__v8di) __X,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
/* Merge-masked variant: same operand order, __W as the third operand,
   __M as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutexvar_epi64 (__m512i __W, __mmask8 __M, __m512i __X,
- __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvardi512_mask ((__v8di) __Y,
- (__v8di) __X,
- (__v8di) __W,
- __M);
- }
/* Zero-masked variable permutex of 32-bit integers.  __Y is passed
   first and __X second to __builtin_ia32_permvarsi512_mask (presumably
   data then index -- confirm against the builtin); a zero vector is the
   third operand and __M the 16-bit mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutexvar_epi32 (__mmask16 __M, __m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvarsi512_mask ((__v16si) __Y,
- (__v16si) __X,
- (__v16si)
- _mm512_setzero_si512 (),
- __M);
- }
/* Unmasked variant: same operand order, undefined third operand,
   all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutexvar_epi32 (__m512i __X, __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvarsi512_mask ((__v16si) __Y,
- (__v16si) __X,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
/* Merge-masked variant: same operand order, __W as the third operand,
   __M as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutexvar_epi32 (__m512i __W, __mmask16 __M, __m512i __X,
- __m512i __Y)
- {
- return (__m512i) __builtin_ia32_permvarsi512_mask ((__v16si) __Y,
- (__v16si) __X,
- (__v16si) __W,
- __M);
- }
/* Unmasked variable permutex of doubles.  The double vector __Y is
   passed first and the integer vector __X second to
   __builtin_ia32_permvardf512_mask, with an undefined third operand and
   an all-ones mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutexvar_pd (__m512i __X, __m512d __Y)
- {
- return (__m512d) __builtin_ia32_permvardf512_mask ((__v8df) __Y,
- (__v8di) __X,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutexvar_pd (__m512d __W, __mmask8 __U, __m512i __X, __m512d __Y)
- {
- return (__m512d) __builtin_ia32_permvardf512_mask ((__v8df) __Y,
- (__v8di) __X,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutexvar_pd (__mmask8 __U, __m512i __X, __m512d __Y)
- {
- return (__m512d) __builtin_ia32_permvardf512_mask ((__v8df) __Y,
- (__v8di) __X,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
/* Unmasked variable permutex of floats.  The float vector __Y is passed
   first and the integer vector __X second to
   __builtin_ia32_permvarsf512_mask, with an undefined third operand and
   an all-ones 16-bit mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_permutexvar_ps (__m512i __X, __m512 __Y)
- {
- return (__m512) __builtin_ia32_permvarsf512_mask ((__v16sf) __Y,
- (__v16si) __X,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
/* Merge-masked variant: __W is the third operand, __U the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_permutexvar_ps (__m512 __W, __mmask16 __U, __m512i __X, __m512 __Y)
- {
- return (__m512) __builtin_ia32_permvarsf512_mask ((__v16sf) __Y,
- (__v16si) __X,
- (__v16sf) __W,
- (__mmask16) __U);
- }
/* Zero-masked variant: a zero vector is the third operand, __U the
   mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_permutexvar_ps (__mmask16 __U, __m512i __X, __m512 __Y)
- {
- return (__m512) __builtin_ia32_permvarsf512_mask ((__v16sf) __Y,
- (__v16si) __X,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- #ifdef __OPTIMIZE__
/* Immediate-controlled two-source shuffle of floats, unmasked.  Here
   __M and __V are the two source vectors (not masks); they are passed
   with __imm to __builtin_ia32_shufps512_mask along with an undefined
   fourth operand and an all-ones 16-bit mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_ps (__m512 __M, __m512 __V, const int __imm)
- {
- return (__m512) __builtin_ia32_shufps512_mask ((__v16sf) __M,
- (__v16sf) __V, __imm,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
/* Merge-masked variant: __W is the fourth operand, __U the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_ps (__m512 __W, __mmask16 __U, __m512 __M,
- __m512 __V, const int __imm)
- {
- return (__m512) __builtin_ia32_shufps512_mask ((__v16sf) __M,
- (__v16sf) __V, __imm,
- (__v16sf) __W,
- (__mmask16) __U);
- }
/* Zero-masked variant: a zero vector is the fourth operand, __U the
   mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_ps (__mmask16 __U, __m512 __M, __m512 __V, const int __imm)
- {
- return (__m512) __builtin_ia32_shufps512_mask ((__v16sf) __M,
- (__v16sf) __V, __imm,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
/* Immediate-controlled two-source shuffle of doubles, unmasked.  __M
   and __V are the two source vectors (not masks); they are passed with
   __imm to __builtin_ia32_shufpd512_mask along with an undefined fourth
   operand and an all-ones mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_shuffle_pd (__m512d __M, __m512d __V, const int __imm)
- {
- return (__m512d) __builtin_ia32_shufpd512_mask ((__v8df) __M,
- (__v8df) __V, __imm,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
/* Merge-masked variant: __W is the fourth operand, __U the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_shuffle_pd (__m512d __W, __mmask8 __U, __m512d __M,
- __m512d __V, const int __imm)
- {
- return (__m512d) __builtin_ia32_shufpd512_mask ((__v8df) __M,
- (__v8df) __V, __imm,
- (__v8df) __W,
- (__mmask8) __U);
- }
/* Zero-masked variant: a zero vector is the fourth operand, __U the
   mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_shuffle_pd (__mmask8 __U, __m512d __M, __m512d __V,
- const int __imm)
- {
- return (__m512d) __builtin_ia32_shufpd512_mask ((__v8df) __M,
- (__v8df) __V, __imm,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
/* Fixupimm on packed doubles, unmasked: forwards __A, __B, the integer
   vector __C, the immediate __imm, an all-ones mask and __R to
   __builtin_ia32_fixupimmpd512_mask.  __R is presumably the
   rounding/exception control -- confirm against the builtin.  There is
   no separate pass-through operand.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fixupimm_round_pd (__m512d __A, __m512d __B, __m512i __C,
- const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) -1, __R);
- }
/* Masked variant: same _mask builtin with __U as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fixupimm_round_pd (__m512d __A, __mmask8 __U, __m512d __B,
- __m512i __C, const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) __U, __R);
- }
/* Zero-masked variant: calls the _maskz builtin with mask __U.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fixupimm_round_pd (__mmask8 __U, __m512d __A, __m512d __B,
- __m512i __C, const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_maskz ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) __U, __R);
- }
/* Fixupimm on packed floats, unmasked: forwards __A, __B, the integer
   vector __C, the immediate __imm, an all-ones 16-bit mask and __R to
   __builtin_ia32_fixupimmps512_mask.  __R is presumably the
   rounding/exception control -- confirm against the builtin.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fixupimm_round_ps (__m512 __A, __m512 __B, __m512i __C,
- const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_fixupimmps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) -1, __R);
- }
/* Masked variant: same _mask builtin with __U as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fixupimm_round_ps (__m512 __A, __mmask16 __U, __m512 __B,
- __m512i __C, const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_fixupimmps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) __U, __R);
- }
/* Zero-masked variant: calls the _maskz builtin with mask __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fixupimm_round_ps (__mmask16 __U, __m512 __A, __m512 __B,
- __m512i __C, const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_fixupimmps512_maskz ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) __U, __R);
- }
/* Fixupimm on a scalar double, unmasked: forwards __A, __B, the integer
   vector __C, the immediate __imm, an all-ones mask and __R to
   __builtin_ia32_fixupimmsd_mask.  __R is presumably the
   rounding/exception control -- confirm against the builtin.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fixupimm_round_sd (__m128d __A, __m128d __B, __m128i __C,
- const int __imm, const int __R)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_mask ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C, __imm,
- (__mmask8) -1, __R);
- }
/* Masked variant: same _mask builtin with __U as the mask.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fixupimm_round_sd (__m128d __A, __mmask8 __U, __m128d __B,
- __m128i __C, const int __imm, const int __R)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_mask ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C, __imm,
- (__mmask8) __U, __R);
- }
/* Zero-masked variant: calls the _maskz builtin with mask __U.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fixupimm_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
- __m128i __C, const int __imm, const int __R)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_maskz ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C,
- __imm,
- (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fixupimm_round_ss (__m128 __A, __m128 __B, __m128i __C,
- const int __imm, const int __R)
- {
- return (__m128) __builtin_ia32_fixupimmss_mask ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) -1, __R);
- }
- /* Masked scalar-float fixupimm wrapper: same builtin as the unmasked form
-    (__builtin_ia32_fixupimmss_mask) but with the caller's mask __U.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fixupimm_round_ss (__m128 __A, __mmask8 __U, __m128 __B,
- __m128i __C, const int __imm, const int __R)
- {
- return (__m128) __builtin_ia32_fixupimmss_mask ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) __U, __R);
- }
- /* maskz scalar-float fixupimm wrapper: forwards all operands, __imm, the
-    mask __U and __R to __builtin_ia32_fixupimmss_maskz.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fixupimm_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
- __m128i __C, const int __imm, const int __R)
- {
- return (__m128) __builtin_ia32_fixupimmss_maskz ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) __U, __R);
- }
- #else
- /* Macro forms of the 8 x double shuffle intrinsics.  All three expand to
-    __builtin_ia32_shufpd512_mask with (int)(C) as the third argument and
-    differ only in the last two arguments: undefined vector with an all-ones
-    mask, W with mask U, or a zero vector with mask U.  */
- #define _mm512_shuffle_pd(X, Y, C) \
- ((__m512d)__builtin_ia32_shufpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (int)(C),\
- (__v8df)(__m512d)_mm512_undefined_pd(),\
- (__mmask8)-1))
- #define _mm512_mask_shuffle_pd(W, U, X, Y, C) \
- ((__m512d)__builtin_ia32_shufpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (int)(C),\
- (__v8df)(__m512d)(W),\
- (__mmask8)(U)))
- #define _mm512_maskz_shuffle_pd(U, X, Y, C) \
- ((__m512d)__builtin_ia32_shufpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (int)(C),\
- (__v8df)(__m512d)_mm512_setzero_pd(),\
- (__mmask8)(U)))
- /* Macro forms of the 16 x float shuffle intrinsics.  All three expand to
-    __builtin_ia32_shufps512_mask with (int)(C) as the third argument and
-    differ only in the last two arguments: undefined vector with an all-ones
-    mask, W with mask U, or a zero vector with mask U.  */
- #define _mm512_shuffle_ps(X, Y, C) \
- ((__m512)__builtin_ia32_shufps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (int)(C),\
- (__v16sf)(__m512)_mm512_undefined_ps(),\
- (__mmask16)-1))
- #define _mm512_mask_shuffle_ps(W, U, X, Y, C) \
- ((__m512)__builtin_ia32_shufps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (int)(C),\
- (__v16sf)(__m512)(W),\
- (__mmask16)(U)))
- #define _mm512_maskz_shuffle_ps(U, X, Y, C) \
- ((__m512)__builtin_ia32_shufps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (int)(C),\
- (__v16sf)(__m512)_mm512_setzero_ps(),\
- (__mmask16)(U)))
- /* Macro forms of the 8 x double fixupimm intrinsics.  The plain and mask
-    variants expand to __builtin_ia32_fixupimmpd512_mask (all-ones mask or
-    U); the maskz variant expands to __builtin_ia32_fixupimmpd512_maskz.
-    C is cast to int; R is passed through as written.  */
- #define _mm512_fixupimm_round_pd(X, Y, Z, C, R) \
- ((__m512d)__builtin_ia32_fixupimmpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(-1), (R)))
- #define _mm512_mask_fixupimm_round_pd(X, U, Y, Z, C, R) \
- ((__m512d)__builtin_ia32_fixupimmpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- #define _mm512_maskz_fixupimm_round_pd(U, X, Y, Z, C, R) \
- ((__m512d)__builtin_ia32_fixupimmpd512_maskz ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- /* Macro forms of the 16 x float fixupimm intrinsics.  The plain and mask
-    variants expand to __builtin_ia32_fixupimmps512_mask (all-ones mask or
-    U); the maskz variant expands to __builtin_ia32_fixupimmps512_maskz.
-    C is cast to int; R is passed through as written.  */
- #define _mm512_fixupimm_round_ps(X, Y, Z, C, R) \
- ((__m512)__builtin_ia32_fixupimmps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(-1), (R)))
- #define _mm512_mask_fixupimm_round_ps(X, U, Y, Z, C, R) \
- ((__m512)__builtin_ia32_fixupimmps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(U), (R)))
- #define _mm512_maskz_fixupimm_round_ps(U, X, Y, Z, C, R) \
- ((__m512)__builtin_ia32_fixupimmps512_maskz ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(U), (R)))
- /* Macro forms of the scalar-double fixupimm intrinsics.  The plain and mask
-    variants expand to __builtin_ia32_fixupimmsd_mask (all-ones mask or U);
-    the maskz variant expands to __builtin_ia32_fixupimmsd_maskz.  */
- #define _mm_fixupimm_round_sd(X, Y, Z, C, R) \
- ((__m128d)__builtin_ia32_fixupimmsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(-1), (R)))
- #define _mm_mask_fixupimm_round_sd(X, U, Y, Z, C, R) \
- ((__m128d)__builtin_ia32_fixupimmsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- #define _mm_maskz_fixupimm_round_sd(U, X, Y, Z, C, R) \
- ((__m128d)__builtin_ia32_fixupimmsd_maskz ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- /* Macro forms of the scalar-float fixupimm intrinsics.  The plain and mask
-    variants expand to __builtin_ia32_fixupimmss_mask (all-ones mask or U);
-    the maskz variant expands to __builtin_ia32_fixupimmss_maskz.  */
- #define _mm_fixupimm_round_ss(X, Y, Z, C, R) \
- ((__m128)__builtin_ia32_fixupimmss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(-1), (R)))
- #define _mm_mask_fixupimm_round_ss(X, U, Y, Z, C, R) \
- ((__m128)__builtin_ia32_fixupimmss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- #define _mm_maskz_fixupimm_round_ss(U, X, Y, Z, C, R) \
- ((__m128)__builtin_ia32_fixupimmss_maskz ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), (R)))
- #endif
- /* Unmasked wrapper around __builtin_ia32_movshdup512_mask: passes __A with
-    an undefined third operand and an all-ones mask.  Presumably duplicates
-    the odd-indexed floats (VMOVSHDUP) -- confirm against the ISA reference.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_movehdup_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_movshdup512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_movshdup512_mask on __A with __W as the
-    third operand and __U as the mask (presumably lanes whose mask bit is
-    clear keep __W's value).  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_movehdup_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_movshdup512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_movshdup512_mask on __A with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_movehdup_ps (__mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_movshdup512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_movsldup512_mask: passes __A with
-    an undefined third operand and an all-ones mask.  Presumably duplicates
-    the even-indexed floats (VMOVSLDUP) -- confirm against the ISA reference.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_moveldup_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_movsldup512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_movsldup512_mask on __A with __W as the
-    third operand and __U as the mask (presumably lanes whose mask bit is
-    clear keep __W's value).  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_moveldup_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_movsldup512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_movsldup512_mask on __A with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_moveldup_ps (__mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_movsldup512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- /* Bitwise OR of two 512-bit integer vectors.  Both operands are
-    reinterpreted as __v16su, OR-ed with the vector `|' operator, and the
-    result is cast back to __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_or_si512 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs | __rhs);
- }
- /* Bitwise OR of __A and __B, computed on their __v16su views with the
-    vector `|' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_or_epi32 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs | __rhs);
- }
- /* Masked OR: calls __builtin_ia32_pord512_mask on __A and __B with __W as
-    the third operand and __U as the mask (presumably lanes whose mask bit
-    is clear keep __W's value).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_or_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pord512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz OR: calls __builtin_ia32_pord512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_or_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pord512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Bitwise OR of __A and __B, computed on their __v8du views with the
-    vector `|' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_or_epi64 (__m512i __A, __m512i __B)
- {
- const __v8du __lhs = (__v8du) __A;
- const __v8du __rhs = (__v8du) __B;
- return (__m512i) (__lhs | __rhs);
- }
- /* Masked OR: calls __builtin_ia32_porq512_mask on __A and __B with __W as
-    the third operand and __U as the mask (presumably lanes whose mask bit
-    is clear keep __W's value).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_or_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_porq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz OR: calls __builtin_ia32_porq512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_or_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_porq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- /* Bitwise XOR of two 512-bit integer vectors.  Both operands are
-    reinterpreted as __v16su, combined with the vector `^' operator, and the
-    result is cast back to __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_xor_si512 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs ^ __rhs);
- }
- /* Bitwise XOR of __A and __B, computed on their __v16su views with the
-    vector `^' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_xor_epi32 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs ^ __rhs);
- }
- /* Masked XOR: calls __builtin_ia32_pxord512_mask on __A and __B with __W as
-    the third operand and __U as the mask (presumably lanes whose mask bit
-    is clear keep __W's value).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_xor_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pxord512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz XOR: calls __builtin_ia32_pxord512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_xor_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pxord512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Bitwise XOR of __A and __B, computed on their __v8du views with the
-    vector `^' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_xor_epi64 (__m512i __A, __m512i __B)
- {
- const __v8du __lhs = (__v8du) __A;
- const __v8du __rhs = (__v8du) __B;
- return (__m512i) (__lhs ^ __rhs);
- }
- /* Masked XOR: calls __builtin_ia32_pxorq512_mask on __A and __B with __W as
-    the third operand and __U as the mask (presumably lanes whose mask bit
-    is clear keep __W's value).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_xor_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pxorq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz XOR: calls __builtin_ia32_pxorq512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_xor_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pxorq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- #ifdef __OPTIMIZE__
- /* Unmasked wrapper around __builtin_ia32_prold512_mask: passes __A and the
-    count __B with an undefined third operand and an all-ones mask.  Inline
-    form, compiled only when __OPTIMIZE__ is defined.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rol_epi32 (__m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prold512_mask ((__v16si) __A, __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_prold512_mask on __A and __B with __W
-    as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rol_epi32 (__m512i __W, __mmask16 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prold512_mask ((__v16si) __A, __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_prold512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rol_epi32 (__mmask16 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prold512_mask ((__v16si) __A, __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_prord512_mask: passes __A and the
-    count __B with an undefined third operand and an all-ones mask.  Inline
-    form, compiled only when __OPTIMIZE__ is defined.  __B is declared
-    const int so the signature matches _mm512_rol_epi32; it is forwarded
-    directly to the builtin.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_ror_epi32 (__m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prord512_mask ((__v16si) __A, __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_prord512_mask on __A and __B with __W
-    as the third operand and __U as the mask.  __B is declared const int so
-    the signature matches _mm512_mask_rol_epi32.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_ror_epi32 (__m512i __W, __mmask16 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prord512_mask ((__v16si) __A, __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_prord512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask.  __B is declared
-    const int so the signature matches _mm512_maskz_rol_epi32.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_ror_epi32 (__mmask16 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prord512_mask ((__v16si) __A, __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_prolq512_mask: passes __A and the
-    count __B with an undefined third operand (obtained from
-    _mm512_undefined_epi32 and cast to __v8di) and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_rol_epi64 (__m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prolq512_mask ((__v8di) __A, __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* Masked form: calls __builtin_ia32_prolq512_mask on __A and __B with __W
-    as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_rol_epi64 (__m512i __W, __mmask8 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prolq512_mask ((__v8di) __A, __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz form: calls __builtin_ia32_prolq512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_rol_epi64 (__mmask8 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prolq512_mask ((__v8di) __A, __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_prorq512_mask: passes __A and the
-    count __B with an undefined third operand and an all-ones mask.  __B is
-    declared const int so the signature matches _mm512_rol_epi64; it is
-    forwarded directly to the builtin.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_ror_epi64 (__m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prorq512_mask ((__v8di) __A, __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* Masked form: calls __builtin_ia32_prorq512_mask on __A and __B with __W
-    as the third operand and __U as the mask.  __B is declared const int so
-    the signature matches _mm512_mask_rol_epi64.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_ror_epi64 (__m512i __W, __mmask8 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prorq512_mask ((__v8di) __A, __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz form: calls __builtin_ia32_prorq512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask.  __B is declared
-    const int so the signature matches _mm512_maskz_rol_epi64.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_ror_epi64 (__mmask8 __U, __m512i __A, const int __B)
- {
- return (__m512i) __builtin_ia32_prorq512_mask ((__v8di) __A, __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- #else
- /* Macro forms of the 32-bit rotate-left intrinsics, used when __OPTIMIZE__
-    is not defined.  Each expands to __builtin_ia32_prold512_mask with
-    (int)(B) as the count; they differ only in the third operand and mask:
-    undefined with all-ones, W with U, or zero with U.  */
- #define _mm512_rol_epi32(A, B) \
- ((__m512i)__builtin_ia32_prold512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)_mm512_undefined_epi32 (), \
- (__mmask16)(-1)))
- #define _mm512_mask_rol_epi32(W, U, A, B) \
- ((__m512i)__builtin_ia32_prold512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)(__m512i)(W), \
- (__mmask16)(U)))
- #define _mm512_maskz_rol_epi32(U, A, B) \
- ((__m512i)__builtin_ia32_prold512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)_mm512_setzero_si512 (), \
- (__mmask16)(U)))
- /* Macro forms of the 32-bit rotate-right intrinsics, used when __OPTIMIZE__
-    is not defined.  Each expands to __builtin_ia32_prord512_mask with
-    (int)(B) as the count; they differ only in the third operand and mask:
-    undefined with all-ones, W with U, or zero with U.  */
- #define _mm512_ror_epi32(A, B) \
- ((__m512i)__builtin_ia32_prord512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)_mm512_undefined_epi32 (), \
- (__mmask16)(-1)))
- #define _mm512_mask_ror_epi32(W, U, A, B) \
- ((__m512i)__builtin_ia32_prord512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)(__m512i)(W), \
- (__mmask16)(U)))
- #define _mm512_maskz_ror_epi32(U, A, B) \
- ((__m512i)__builtin_ia32_prord512_mask ((__v16si)(__m512i)(A), \
- (int)(B), \
- (__v16si)_mm512_setzero_si512 (), \
- (__mmask16)(U)))
- /* Macro forms of the 64-bit rotate-left intrinsics, used when __OPTIMIZE__
-    is not defined.  Each expands to __builtin_ia32_prolq512_mask with
-    (int)(B) as the count; they differ only in the third operand and mask:
-    undefined with all-ones, W with U, or zero with U.  */
- #define _mm512_rol_epi64(A, B) \
- ((__m512i)__builtin_ia32_prolq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)_mm512_undefined_epi32 (), \
- (__mmask8)(-1)))
- #define _mm512_mask_rol_epi64(W, U, A, B) \
- ((__m512i)__builtin_ia32_prolq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)(__m512i)(W), \
- (__mmask8)(U)))
- #define _mm512_maskz_rol_epi64(U, A, B) \
- ((__m512i)__builtin_ia32_prolq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)_mm512_setzero_si512 (), \
- (__mmask8)(U)))
- /* Macro forms of the 64-bit rotate-right intrinsics, used when __OPTIMIZE__
-    is not defined.  Each expands to __builtin_ia32_prorq512_mask with
-    (int)(B) as the count; they differ only in the third operand and mask:
-    undefined with all-ones, W with U, or zero with U.  */
- #define _mm512_ror_epi64(A, B) \
- ((__m512i)__builtin_ia32_prorq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)_mm512_undefined_epi32 (), \
- (__mmask8)(-1)))
- #define _mm512_mask_ror_epi64(W, U, A, B) \
- ((__m512i)__builtin_ia32_prorq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)(__m512i)(W), \
- (__mmask8)(U)))
- #define _mm512_maskz_ror_epi64(U, A, B) \
- ((__m512i)__builtin_ia32_prorq512_mask ((__v8di)(__m512i)(A), \
- (int)(B), \
- (__v8di)_mm512_setzero_si512 (), \
- (__mmask8)(U)))
- #endif
- /* Bitwise AND of two 512-bit integer vectors.  Both operands are
-    reinterpreted as __v16su, combined with the vector `&' operator, and the
-    result is cast back to __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_and_si512 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs & __rhs);
- }
- /* Bitwise AND of __A and __B, computed on their __v16su views with the
-    vector `&' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_and_epi32 (__m512i __A, __m512i __B)
- {
- const __v16su __lhs = (__v16su) __A;
- const __v16su __rhs = (__v16su) __B;
- return (__m512i) (__lhs & __rhs);
- }
- /* Masked AND: calls __builtin_ia32_pandd512_mask on __A and __B with __W as
-    the third operand and __U as the mask (presumably lanes whose mask bit
-    is clear keep __W's value).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_and_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz AND: calls __builtin_ia32_pandd512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_and_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Bitwise AND of __A and __B, computed on their __v8du views with the
-    vector `&' operator and returned as __m512i.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_and_epi64 (__m512i __A, __m512i __B)
- {
- const __v8du __lhs = (__v8du) __A;
- const __v8du __rhs = (__v8du) __B;
- return (__m512i) (__lhs & __rhs);
- }
- /* Masked AND: calls __builtin_ia32_pandq512_mask on __A and __B with __W as
-    the third operand and __U (passed without an explicit cast) as the
-    mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_and_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W, __U);
- }
- /* maskz AND: calls __builtin_ia32_pandq512_mask on __A and __B with a zero
-    vector as the third operand and __U as the mask (presumably lanes whose
-    mask bit is clear become zero).  The zero vector comes from
-    _mm512_setzero_si512, the integer zero constructor used by the other
-    integer maskz wrappers, rather than from a double-precision zero that is
-    then reinterpreted; the bits passed to the builtin are the same.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_and_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_pandnd512_mask: passes __A and __B
-    with an undefined third operand and an all-ones mask.  Presumably
-    computes (~__A) & __B -- confirm operand order against the ISA
-    reference.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_andnot_si512 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Unmasked wrapper around __builtin_ia32_pandnd512_mask; the body is the
-    same call as _mm512_andnot_si512 (undefined third operand, all-ones
-    mask).  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_andnot_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_pandnd512_mask on __A and __B with __W
-    as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_andnot_epi32 (__m512i __W, __mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_pandnd512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_andnot_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_pandnq512_mask: passes __A and __B
-    with an undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_andnot_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* Masked form: calls __builtin_ia32_pandnq512_mask on __A and __B with __W
-    as the third operand and __U (passed without an explicit cast) as the
-    mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_andnot_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W, __U);
- }
- /* maskz form: calls __builtin_ia32_pandnq512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask (presumably lanes
-    whose mask bit is clear become zero).  The zero vector comes from
-    _mm512_setzero_si512, the integer zero constructor used by the other
-    integer maskz wrappers, rather than from a double-precision zero that is
-    then reinterpreted; the bits passed to the builtin are the same.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_andnot_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pandnq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- /* Returns the __mmask16 produced by __builtin_ia32_ptestmd512 on __A and
-    __B with an all-ones input mask.  Presumably bit i is set when lane i of
-    (__A & __B) is non-zero -- confirm against the ISA reference.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_test_epi32_mask (__m512i __A, __m512i __B)
- {
- return (__mmask16) __builtin_ia32_ptestmd512 ((__v16si) __A,
- (__v16si) __B,
- (__mmask16) -1);
- }
- /* Masked form: returns the __mmask16 produced by __builtin_ia32_ptestmd512
-    on __A and __B with __U as the input mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_test_epi32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__mmask16) __builtin_ia32_ptestmd512 ((__v16si) __A,
- (__v16si) __B, __U);
- }
- /* Returns the __mmask8 produced by __builtin_ia32_ptestmq512 on __A and __B
-    with an all-ones input mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_test_epi64_mask (__m512i __A, __m512i __B)
- {
- return (__mmask8) __builtin_ia32_ptestmq512 ((__v8di) __A,
- (__v8di) __B,
- (__mmask8) -1);
- }
- /* Masked form: returns the __mmask8 produced by __builtin_ia32_ptestmq512
-    on __A and __B with __U as the input mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_test_epi64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__mmask8) __builtin_ia32_ptestmq512 ((__v8di) __A, (__v8di) __B, __U);
- }
- /* Returns the __mmask16 produced by __builtin_ia32_ptestnmd512 on __A and
-    __B with an all-ones input mask.  Presumably bit i is set when lane i of
-    (__A & __B) is zero -- confirm against the ISA reference.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_testn_epi32_mask (__m512i __A, __m512i __B)
- {
- return (__mmask16) __builtin_ia32_ptestnmd512 ((__v16si) __A,
- (__v16si) __B,
- (__mmask16) -1);
- }
- /* Masked form: returns the __mmask16 produced by __builtin_ia32_ptestnmd512
-    on __A and __B with __U as the input mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_testn_epi32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__mmask16) __builtin_ia32_ptestnmd512 ((__v16si) __A,
- (__v16si) __B, __U);
- }
- /* Returns the __mmask8 produced by __builtin_ia32_ptestnmq512 on __A and
-    __B with an all-ones input mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_testn_epi64_mask (__m512i __A, __m512i __B)
- {
- return (__mmask8) __builtin_ia32_ptestnmq512 ((__v8di) __A,
- (__v8di) __B,
- (__mmask8) -1);
- }
- /* Masked form: returns the __mmask8 produced by __builtin_ia32_ptestnmq512
-    on __A and __B with __U as the input mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_testn_epi64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__mmask8) __builtin_ia32_ptestnmq512 ((__v8di) __A,
- (__v8di) __B, __U);
- }
- /* Absolute value of each float lane, done as an integer AND: the bits of
-    __A are AND-ed (via _mm512_and_epi32) with _mm512_set1_epi32 (0x7fffffff).
-    0x7fffffff has every bit set except bit 31, so the AND clears bit 31 of
-    each 32-bit lane (presumably the constant is broadcast to all lanes).  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_abs_ps (__m512 __A)
- {
- const __m512i __keep_magnitude = _mm512_set1_epi32 (0x7fffffff);
- const __m512i __bits = (__m512i) __A;
- return (__m512) _mm512_and_epi32 (__bits, __keep_magnitude);
- }
- /* Masked absolute value of float lanes: forwards __W, __U and the bits of
-    __A to _mm512_mask_and_epi32 together with
-    _mm512_set1_epi32 (0x7fffffff), a constant with every bit set except
-    bit 31.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_abs_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- const __m512i __keep_magnitude = _mm512_set1_epi32 (0x7fffffff);
- const __m512i __merged = _mm512_mask_and_epi32 ((__m512i) __W, __U,
- (__m512i) __A,
- __keep_magnitude);
- return (__m512) __merged;
- }
- /* Absolute value of each double lane, done as an integer AND: the bits of
-    __A are AND-ed (via _mm512_and_epi64) with
-    _mm512_set1_epi64 (0x7fffffffffffffffLL).  That constant has every bit
-    set except bit 63, so the AND clears bit 63 of each 64-bit lane
-    (presumably the constant is broadcast to all lanes).  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_abs_pd (__m512d __A)
- {
- const __m512i __keep_magnitude = _mm512_set1_epi64 (0x7fffffffffffffffLL);
- const __m512i __bits = (__m512i) __A;
- return (__m512d) _mm512_and_epi64 (__bits, __keep_magnitude);
- }
- /* Masked absolute value of double lanes: forwards __W, __U and the bits of
-    __A to _mm512_mask_and_epi64 together with
-    _mm512_set1_epi64 (0x7fffffffffffffffLL), a constant with every bit set
-    except bit 63.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_abs_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- const __m512i __keep_magnitude = _mm512_set1_epi64 (0x7fffffffffffffffLL);
- const __m512i __merged = _mm512_mask_and_epi64 ((__m512i) __W, __U,
- (__m512i) __A,
- __keep_magnitude);
- return (__m512d) __merged;
- }
- /* Unmasked wrapper around __builtin_ia32_punpckhdq512_mask: passes __A and
-    __B with an undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpackhi_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhdq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_punpckhdq512_mask on __A and __B with
-    __W as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpackhi_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
- __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhdq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_punpckhdq512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpackhi_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhdq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_punpckhqdq512_mask: passes __A and
-    __B with an undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpackhi_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* Masked form: calls __builtin_ia32_punpckhqdq512_mask on __A and __B with
-    __W as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpackhi_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz form: calls __builtin_ia32_punpckhqdq512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpackhi_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckhqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_punpckldq512_mask: passes __A and
-    __B with an undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpacklo_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckldq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* Masked form: calls __builtin_ia32_punpckldq512_mask on __A and __B with
-    __W as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpacklo_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
- __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckldq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si) __W,
- (__mmask16) __U);
- }
- /* maskz form: calls __builtin_ia32_punpckldq512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpacklo_epi32 (__mmask16 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpckldq512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U);
- }
- /* Unmasked wrapper around __builtin_ia32_punpcklqdq512_mask: passes __A and
-    __B with an undefined third operand and an all-ones mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpacklo_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpcklqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* Masked form: calls __builtin_ia32_punpcklqdq512_mask on __A and __B with
-    __W as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpacklo_epi64 (__m512i __W, __mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpcklqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di) __W,
- (__mmask8) __U);
- }
- /* maskz form: calls __builtin_ia32_punpcklqdq512_mask on __A and __B with a
-    zero vector as the third operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpacklo_epi64 (__mmask8 __U, __m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_punpcklqdq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_setzero_si512 (),
- (__mmask8) __U);
- }
- #ifdef __x86_64__
- #ifdef __OPTIMIZE__
- /* Returns __builtin_ia32_vcvtss2usi64 (__A, __R) as unsigned long long.
-    Defined only under __x86_64__ and __OPTIMIZE__.  __R is presumably the
-    rounding control -- confirm against the builtin's documentation.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_u64 (__m128 __A, const int __R)
- {
- return (unsigned long long) __builtin_ia32_vcvtss2usi64 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtss2si64 (__A, __R) as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_si64 (__m128 __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvtss2si64 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtss2si64 (__A, __R) as long long; the body is
-    the same call as _mm_cvt_roundss_si64.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_i64 (__m128 __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvtss2si64 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2usi64 (__A, __R) as unsigned long long
-    (the "tt" builtin is presumably the truncating conversion).  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_u64 (__m128 __A, const int __R)
- {
- return (unsigned long long) __builtin_ia32_vcvttss2usi64 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2si64 (__A, __R) as long long; the body is
-    the same call as _mm_cvtt_roundss_si64.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_i64 (__m128 __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvttss2si64 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2si64 (__A, __R) as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_si64 (__m128 __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvttss2si64 ((__v4sf) __A, __R);
- }
- #else
- /* Macro forms of the float -> 64-bit integer conversions, used under
-    __x86_64__ when __OPTIMIZE__ is not defined.  Each expands to the
-    corresponding builtin and casts the result.
-    NOTE(review): unlike the inline versions, A and B are passed to the
-    builtin without casts or extra parentheses.  */
- #define _mm_cvt_roundss_u64(A, B) \
- ((unsigned long long)__builtin_ia32_vcvtss2usi64(A, B))
- #define _mm_cvt_roundss_si64(A, B) \
- ((long long)__builtin_ia32_vcvtss2si64(A, B))
- #define _mm_cvt_roundss_i64(A, B) \
- ((long long)__builtin_ia32_vcvtss2si64(A, B))
- #define _mm_cvtt_roundss_u64(A, B) \
- ((unsigned long long)__builtin_ia32_vcvttss2usi64(A, B))
- #define _mm_cvtt_roundss_i64(A, B) \
- ((long long)__builtin_ia32_vcvttss2si64(A, B))
- #define _mm_cvtt_roundss_si64(A, B) \
- ((long long)__builtin_ia32_vcvttss2si64(A, B))
- #endif
- #endif
- #ifdef __OPTIMIZE__
- /* Returns __builtin_ia32_vcvtss2usi32 (__A, __R) as unsigned.  Inline form,
-    compiled only when __OPTIMIZE__ is defined.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_u32 (__m128 __A, const int __R)
- {
- return (unsigned) __builtin_ia32_vcvtss2usi32 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtss2si32 (__A, __R) as int.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_si32 (__m128 __A, const int __R)
- {
- return (int) __builtin_ia32_vcvtss2si32 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtss2si32 (__A, __R) as int; the body is the
-    same call as _mm_cvt_roundss_si32.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_i32 (__m128 __A, const int __R)
- {
- return (int) __builtin_ia32_vcvtss2si32 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2usi32 (__A, __R) as unsigned (the "tt"
-    builtin is presumably the truncating conversion).  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_u32 (__m128 __A, const int __R)
- {
- return (unsigned) __builtin_ia32_vcvttss2usi32 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2si32 (__A, __R) as int; the body is the
-    same call as _mm_cvtt_roundss_si32.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_i32 (__m128 __A, const int __R)
- {
- return (int) __builtin_ia32_vcvttss2si32 ((__v4sf) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttss2si32 (__A, __R) as int.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundss_si32 (__m128 __A, const int __R)
- {
- return (int) __builtin_ia32_vcvttss2si32 ((__v4sf) __A, __R);
- }
- #else
- /* Macro forms of the float -> 32-bit integer conversions, used when
-    __OPTIMIZE__ is not defined.  Each expands to the corresponding builtin
-    and casts the result.
-    NOTE(review): unlike the inline versions, A and B are passed to the
-    builtin without casts or extra parentheses.  */
- #define _mm_cvt_roundss_u32(A, B) \
- ((unsigned)__builtin_ia32_vcvtss2usi32(A, B))
- #define _mm_cvt_roundss_si32(A, B) \
- ((int)__builtin_ia32_vcvtss2si32(A, B))
- #define _mm_cvt_roundss_i32(A, B) \
- ((int)__builtin_ia32_vcvtss2si32(A, B))
- #define _mm_cvtt_roundss_u32(A, B) \
- ((unsigned)__builtin_ia32_vcvttss2usi32(A, B))
- #define _mm_cvtt_roundss_si32(A, B) \
- ((int)__builtin_ia32_vcvttss2si32(A, B))
- #define _mm_cvtt_roundss_i32(A, B) \
- ((int)__builtin_ia32_vcvttss2si32(A, B))
- #endif
- #ifdef __x86_64__
- #ifdef __OPTIMIZE__
- /* Returns __builtin_ia32_vcvtsd2usi64 (__A, __R) as unsigned long long.
-    Defined only under __x86_64__ and __OPTIMIZE__.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_u64 (__m128d __A, const int __R)
- {
- return (unsigned long long) __builtin_ia32_vcvtsd2usi64 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtsd2si64 (__A, __R) as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_si64 (__m128d __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvtsd2si64 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtsd2si64 (__A, __R) as long long; the body is
-    the same call as _mm_cvt_roundsd_si64.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_i64 (__m128d __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvtsd2si64 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttsd2usi64 (__A, __R) as unsigned long long
-    (the "tt" builtin is presumably the truncating conversion).  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_u64 (__m128d __A, const int __R)
- {
- return (unsigned long long) __builtin_ia32_vcvttsd2usi64 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttsd2si64 (__A, __R) as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_si64 (__m128d __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvttsd2si64 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvttsd2si64 (__A, __R) as long long; the body is
-    the same call as _mm_cvtt_roundsd_si64.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_i64 (__m128d __A, const int __R)
- {
- return (long long) __builtin_ia32_vcvttsd2si64 ((__v2df) __A, __R);
- }
- #else
- /* Macro forms of the double -> 64-bit integer conversions, used under
-    __x86_64__ when __OPTIMIZE__ is not defined.  Each expands to the
-    corresponding builtin and casts the result.
-    NOTE(review): unlike the inline versions, A and B are passed to the
-    builtin without casts or extra parentheses.  */
- #define _mm_cvt_roundsd_u64(A, B) \
- ((unsigned long long)__builtin_ia32_vcvtsd2usi64(A, B))
- #define _mm_cvt_roundsd_si64(A, B) \
- ((long long)__builtin_ia32_vcvtsd2si64(A, B))
- #define _mm_cvt_roundsd_i64(A, B) \
- ((long long)__builtin_ia32_vcvtsd2si64(A, B))
- #define _mm_cvtt_roundsd_u64(A, B) \
- ((unsigned long long)__builtin_ia32_vcvttsd2usi64(A, B))
- #define _mm_cvtt_roundsd_si64(A, B) \
- ((long long)__builtin_ia32_vcvttsd2si64(A, B))
- #define _mm_cvtt_roundsd_i64(A, B) \
- ((long long)__builtin_ia32_vcvttsd2si64(A, B))
- #endif
- #endif
- #ifdef __OPTIMIZE__
- /* Returns __builtin_ia32_vcvtsd2usi32 (__A, __R) as unsigned.  Inline form,
-    compiled only when __OPTIMIZE__ is defined.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_u32 (__m128d __A, const int __R)
- {
- return (unsigned) __builtin_ia32_vcvtsd2usi32 ((__v2df) __A, __R);
- }
- /* Returns __builtin_ia32_vcvtsd2si32 (__A, __R) as int.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_si32 (__m128d __A, const int __R)
- {
- return (int) __builtin_ia32_vcvtsd2si32 ((__v2df) __A, __R);
- }
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_i32 (__m128d __A, const int __R)
- {
- return (int) __builtin_ia32_vcvtsd2si32 ((__v2df) __A, __R);
- }
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_u32 (__m128d __A, const int __R)
- {
- return (unsigned) __builtin_ia32_vcvttsd2usi32 ((__v2df) __A, __R);
- }
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_i32 (__m128d __A, const int __R)
- {
- return (int) __builtin_ia32_vcvttsd2si32 ((__v2df) __A, __R);
- }
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtt_roundsd_si32 (__m128d __A, const int __R)
- {
- return (int) __builtin_ia32_vcvttsd2si32 ((__v2df) __A, __R);
- }
- #else
/* Macro forms of the 32-bit scalar double conversions, selected when
   __OPTIMIZE__ is not defined.  Both arguments are forwarded to the builtin
   untouched; the _i32 spellings expand to the same builtin calls as the
   _si32 ones.  */
#define _mm_cvt_roundsd_u32(A, B) \
  ((unsigned)__builtin_ia32_vcvtsd2usi32(A, B))
#define _mm_cvtt_roundsd_u32(A, B) \
  ((unsigned)__builtin_ia32_vcvttsd2usi32(A, B))

#define _mm_cvt_roundsd_si32(A, B) \
  ((int)__builtin_ia32_vcvtsd2si32(A, B))
#define _mm_cvt_roundsd_i32(A, B) \
  ((int)__builtin_ia32_vcvtsd2si32(A, B))

#define _mm_cvtt_roundsd_si32(A, B) \
  ((int)__builtin_ia32_vcvttsd2si32(A, B))
#define _mm_cvtt_roundsd_i32(A, B) \
  ((int)__builtin_ia32_vcvttsd2si32(A, B))
- #endif
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_movedup_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_movddup512_mask ((__v8df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_movedup_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_movddup512_mask ((__v8df) __A,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_movedup_pd (__mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_movddup512_mask ((__v8df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpacklo_pd (__m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpcklpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpacklo_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpcklpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpacklo_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpcklpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpackhi_pd (__m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpckhpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpackhi_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpckhpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df) __W,
- (__mmask8) __U);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpackhi_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- return (__m512d) __builtin_ia32_unpckhpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpackhi_ps (__m512 __A, __m512 __B)
- {
- return (__m512) __builtin_ia32_unpckhps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpackhi_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- return (__m512) __builtin_ia32_unpckhps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16sf) __W,
- (__mmask16) __U);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpackhi_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- return (__m512) __builtin_ia32_unpckhps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U);
- }
- #ifdef __OPTIMIZE__
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundps_pd (__m256 __A, const int __R)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundps_pd (__m512d __W, __mmask8 __U, __m256 __A,
- const int __R)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundps_pd (__mmask8 __U, __m256 __A, const int __R)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundph_ps (__m256i __A, const int __R)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundph_ps (__m512 __W, __mmask16 __U, __m256i __A,
- const int __R)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundph_ps (__mmask16 __U, __m256i __A, const int __R)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U, __R);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundps_ph (__m512 __A, const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi)
- _mm256_undefined_si256 (),
- -1);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtps_ph (__m512 __A, const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi)
- _mm256_undefined_si256 (),
- -1);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundps_ph (__m256i __U, __mmask16 __W, __m512 __A,
- const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi) __U,
- (__mmask16) __W);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtps_ph (__m256i __U, __mmask16 __W, __m512 __A, const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi) __U,
- (__mmask16) __W);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundps_ph (__mmask16 __W, __m512 __A, const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi)
- _mm256_setzero_si256 (),
- (__mmask16) __W);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtps_ph (__mmask16 __W, __m512 __A, const int __I)
- {
- return (__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf) __A,
- __I,
- (__v16hi)
- _mm256_setzero_si256 (),
- (__mmask16) __W);
- }
- #else
/* Macro forms of the ps->pd and ph->ps conversions, selected when
   __OPTIMIZE__ is not defined.

   Each expansion is wrapped in an outer pair of parentheses.  Without them
   the expansion is a bare "(type) call (...)", so a postfix operator or
   sizeof applied to the macro would bind to the call rather than to the
   cast result.  Arguments are parenthesized and cast the same way the
   inline-function forms cast their parameters.  */
#define _mm512_cvt_roundps_pd(A, B) \
  ((__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf)(__m256)(A), \
     (__v8df) _mm512_undefined_pd (), (__mmask8) -1, (B)))
#define _mm512_mask_cvt_roundps_pd(W, U, A, B) \
  ((__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf)(__m256)(A), \
     (__v8df)(__m512d)(W), (__mmask8)(U), (B)))
#define _mm512_maskz_cvt_roundps_pd(U, A, B) \
  ((__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf)(__m256)(A), \
     (__v8df) _mm512_setzero_pd (), (__mmask8)(U), (B)))
#define _mm512_cvt_roundph_ps(A, B) \
  ((__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi)(__m256i)(A), \
     (__v16sf) _mm512_undefined_ps (), (__mmask16) -1, (B)))
#define _mm512_mask_cvt_roundph_ps(W, U, A, B) \
  ((__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi)(__m256i)(A), \
     (__v16sf)(__m512)(W), (__mmask16)(U), (B)))
#define _mm512_maskz_cvt_roundph_ps(U, A, B) \
  ((__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi)(__m256i)(A), \
     (__v16sf) _mm512_setzero_ps (), (__mmask16)(U), (B)))
/* Macro forms of the ps->ph conversions, selected when __OPTIMIZE__ is not
   defined.  The _cvtps_ph spellings expand to the same builtin calls as the
   _cvt_roundps_ph ones.

   The source argument is written as (A) after the casts: with a bare A the
   cast would bind only to the first operand of a compound argument such as
   "c ? x : y".  In the mask forms U is the pass-through vector and W the
   mask, matching the inline-function parameter names.  */
#define _mm512_cvt_roundps_ph(A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi) _mm256_undefined_si256 (), -1))
#define _mm512_cvtps_ph(A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi) _mm256_undefined_si256 (), -1))
#define _mm512_mask_cvt_roundps_ph(U, W, A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi)(__m256i)(U), (__mmask16) (W)))
#define _mm512_mask_cvtps_ph(U, W, A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi)(__m256i)(U), (__mmask16) (W)))
#define _mm512_maskz_cvt_roundps_ph(W, A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi) _mm256_setzero_si256 (), (__mmask16) (W)))
#define _mm512_maskz_cvtps_ph(W, A, I) \
  ((__m256i) __builtin_ia32_vcvtps2ph512_mask ((__v16sf)(__m512)(A), \
     (int) (I), (__v16hi) _mm256_setzero_si256 (), (__mmask16) (W)))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvt_roundpd_ps (__m512d __A, const int __R)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf)
- _mm256_undefined_ps (),
- (__mmask8) -1, __R);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvt_roundpd_ps (__m256 __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvt_roundpd_ps (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf)
- _mm256_setzero_ps (),
- (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundsd_ss (__m128 __A, __m128d __B, const int __R)
- {
- return (__m128) __builtin_ia32_cvtsd2ss_round ((__v4sf) __A,
- (__v2df) __B,
- __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvt_roundss_sd (__m128d __A, __m128 __B, const int __R)
- {
- return (__m128d) __builtin_ia32_cvtss2sd_round ((__v2df) __A,
- (__v4sf) __B,
- __R);
- }
- #else
/* Macro forms of the pd->ps and scalar sd<->ss conversions, selected when
   __OPTIMIZE__ is not defined.

   Each expansion is wrapped in an outer pair of parentheses.  Without them
   the expansion is a bare "(type) call (...)", so a postfix operator or
   sizeof applied to the macro would bind to the call rather than to the
   cast result.  Arguments are parenthesized and cast the same way the
   inline-function forms cast their parameters.  */
#define _mm512_cvt_roundpd_ps(A, B) \
  ((__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df)(__m512d)(A), \
     (__v8sf) _mm256_undefined_ps (), (__mmask8) -1, (B)))
#define _mm512_mask_cvt_roundpd_ps(W, U, A, B) \
  ((__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df)(__m512d)(A), \
     (__v8sf)(__m256)(W), (__mmask8)(U), (B)))
#define _mm512_maskz_cvt_roundpd_ps(U, A, B) \
  ((__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df)(__m512d)(A), \
     (__v8sf) _mm256_setzero_ps (), (__mmask8)(U), (B)))
#define _mm_cvt_roundsd_ss(A, B, C) \
  ((__m128) __builtin_ia32_cvtsd2ss_round ((__v4sf)(__m128)(A), \
     (__v2df)(__m128d)(B), (C)))
#define _mm_cvt_roundss_sd(A, B, C) \
  ((__m128d) __builtin_ia32_cvtss2sd_round ((__v2df)(__m128d)(A), \
     (__v4sf)(__m128)(B), (C)))
- #endif
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_stream_si512 (__m512i * __P, __m512i __A)
- {
- __builtin_ia32_movntdq512 ((__v8di *) __P, (__v8di) __A);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_stream_ps (float *__P, __m512 __A)
- {
- __builtin_ia32_movntps512 (__P, (__v16sf) __A);
- }
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_stream_pd (double *__P, __m512d __A)
- {
- __builtin_ia32_movntpd512 (__P, (__v8df) __A);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_stream_load_si512 (void *__P)
- {
- return __builtin_ia32_movntdqa512 ((__v8di *)__P);
- }
- /* Constants for mantissa extraction */
/* Normalization-interval selector.  The getmant wrappers in this file
   combine it with the sign selector as (sign << 2) | norm.  */
typedef enum
{
  _MM_MANT_NORM_1_2 = 0,      /* interval [1, 2) */
  _MM_MANT_NORM_p5_2 = 1,     /* interval [0.5, 2) */
  _MM_MANT_NORM_p5_1 = 2,     /* interval [0.5, 1) */
  _MM_MANT_NORM_p75_1p5 = 3   /* interval [0.75, 1.5) */
} _MM_MANTISSA_NORM_ENUM;
/* Sign-control selector.  The getmant wrappers in this file shift it left
   by two before OR-ing it with the normalization selector.  */
typedef enum
{
  _MM_MANT_SIGN_src = 0,    /* sign = sign(SRC) */
  _MM_MANT_SIGN_zero = 1,   /* sign = 0 */
  _MM_MANT_SIGN_nan = 2     /* DEST = NaN if sign(SRC) = 1 */
} _MM_MANTISSA_SIGN_ENUM;
- #ifdef __OPTIMIZE__
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getexp_round_ss (__m128 __A, __m128 __B, const int __R)
- {
- return (__m128) __builtin_ia32_getexpss128_round ((__v4sf) __A,
- (__v4sf) __B,
- __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getexp_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
- __m128 __B, const int __R)
- {
- return (__m128) __builtin_ia32_getexpss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__v4sf) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getexp_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
- const int __R)
- {
- return (__m128) __builtin_ia32_getexpss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__v4sf)
- _mm_setzero_ps (),
- (__mmask8) __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getexp_round_sd (__m128d __A, __m128d __B, const int __R)
- {
- return (__m128d) __builtin_ia32_getexpsd128_round ((__v2df) __A,
- (__v2df) __B,
- __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getexp_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
- __m128d __B, const int __R)
- {
- return (__m128d) __builtin_ia32_getexpsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__v2df) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getexp_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
- const int __R)
- {
- return (__m128d) __builtin_ia32_getexpsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__v2df)
- _mm_setzero_pd (),
- (__mmask8) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getexp_round_ps (__m512 __A, const int __R)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getexp_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
- const int __R)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getexp_round_ps (__mmask16 __U, __m512 __A, const int __R)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getexp_round_pd (__m512d __A, const int __R)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getexp_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
- const int __R)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df) __W,
- (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getexp_round_pd (__mmask8 __U, __m512d __A, const int __R)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getmant_round_pd (__m512d __A, _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- _mm512_undefined_pd (),
- (__mmask8) -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getmant_round_pd (__m512d __W, __mmask8 __U, __m512d __A,
- _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- (__v8df) __W, __U,
- __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getmant_round_pd (__mmask8 __U, __m512d __A,
- _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- (__v8df)
- _mm512_setzero_pd (),
- __U, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getmant_round_ps (__m512 __A, _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- _mm512_undefined_ps (),
- (__mmask16) -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getmant_round_ps (__m512 __W, __mmask16 __U, __m512 __A,
- _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- (__v16sf) __W, __U,
- __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getmant_round_ps (__mmask16 __U, __m512 __A,
- _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C, const int __R)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- (__v16sf)
- _mm512_setzero_ps (),
- __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getmant_round_sd (__m128d __A, __m128d __B,
- _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128d) __builtin_ia32_getmantsd_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getmant_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
- __m128d __B, _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128d) __builtin_ia32_getmantsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- (__v2df) __W,
- __U, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getmant_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
- _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128d) __builtin_ia32_getmantsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- (__v2df)
- _mm_setzero_pd(),
- __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getmant_round_ss (__m128 __A, __m128 __B,
- _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128) __builtin_ia32_getmantss_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getmant_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
- __m128 __B, _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128) __builtin_ia32_getmantss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- (__v4sf) __W,
- __U, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getmant_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
- _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D, const int __R)
- {
- return (__m128) __builtin_ia32_getmantss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- (__v4sf)
- _mm_setzero_ps(),
- __U, __R);
- }
- #else
/* Macro forms of the 512-bit double-precision getmant wrappers, selected
   when __OPTIMIZE__ is not defined.  B (norm) and C (sign) are packed into
   a single immediate as ((C) << 2) | (B).  */
#define _mm512_getmant_round_pd(X, B, C, R) \
  ((__m512d)__builtin_ia32_getmantpd512_mask ( \
     (__v8df)(__m512d)(X), (int)(((C)<<2) | (B)), \
     (__v8df)(__m512d)_mm512_undefined_pd(), (__mmask8)-1, (R)))
#define _mm512_mask_getmant_round_pd(W, U, X, B, C, R) \
  ((__m512d)__builtin_ia32_getmantpd512_mask ( \
     (__v8df)(__m512d)(X), (int)(((C)<<2) | (B)), \
     (__v8df)(__m512d)(W), (__mmask8)(U), (R)))
#define _mm512_maskz_getmant_round_pd(U, X, B, C, R) \
  ((__m512d)__builtin_ia32_getmantpd512_mask ( \
     (__v8df)(__m512d)(X), (int)(((C)<<2) | (B)), \
     (__v8df)(__m512d)_mm512_setzero_pd(), (__mmask8)(U), (R)))
/* Macro forms of the 512-bit single-precision getmant wrappers.  B (norm)
   and C (sign) are packed into a single immediate as ((C) << 2) | (B).  */
#define _mm512_getmant_round_ps(X, B, C, R) \
  ((__m512)__builtin_ia32_getmantps512_mask ( \
     (__v16sf)(__m512)(X), (int)(((C)<<2) | (B)), \
     (__v16sf)(__m512)_mm512_undefined_ps(), (__mmask16)-1, (R)))
#define _mm512_mask_getmant_round_ps(W, U, X, B, C, R) \
  ((__m512)__builtin_ia32_getmantps512_mask ( \
     (__v16sf)(__m512)(X), (int)(((C)<<2) | (B)), \
     (__v16sf)(__m512)(W), (__mmask16)(U), (R)))
#define _mm512_maskz_getmant_round_ps(U, X, B, C, R) \
  ((__m512)__builtin_ia32_getmantps512_mask ( \
     (__v16sf)(__m512)(X), (int)(((C)<<2) | (B)), \
     (__v16sf)(__m512)_mm512_setzero_ps(), (__mmask16)(U), (R)))
/* Macro forms of the scalar double-precision getmant wrappers.  C (norm)
   and D (sign) are packed into a single immediate as ((D) << 2) | (C).  */
#define _mm_getmant_round_sd(X, Y, C, D, R) \
  ((__m128d)__builtin_ia32_getmantsd_round ( \
     (__v2df)(__m128d)(X), (__v2df)(__m128d)(Y), \
     (int)(((D)<<2) | (C)), (R)))
#define _mm_mask_getmant_round_sd(W, U, X, Y, C, D, R) \
  ((__m128d)__builtin_ia32_getmantsd_mask_round ( \
     (__v2df)(__m128d)(X), (__v2df)(__m128d)(Y), \
     (int)(((D)<<2) | (C)), \
     (__v2df)(__m128d)(W), (__mmask8)(U), (R)))
#define _mm_maskz_getmant_round_sd(U, X, Y, C, D, R) \
  ((__m128d)__builtin_ia32_getmantsd_mask_round ( \
     (__v2df)(__m128d)(X), (__v2df)(__m128d)(Y), \
     (int)(((D)<<2) | (C)), \
     (__v2df)(__m128d)_mm_setzero_pd(), (__mmask8)(U), (R)))
/* Macro forms of the scalar single-precision getmant wrappers.  C (norm)
   and D (sign) are packed into a single immediate as ((D) << 2) | (C).  */
#define _mm_getmant_round_ss(X, Y, C, D, R) \
  ((__m128)__builtin_ia32_getmantss_round ( \
     (__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), \
     (int)(((D)<<2) | (C)), (R)))
#define _mm_mask_getmant_round_ss(W, U, X, Y, C, D, R) \
  ((__m128)__builtin_ia32_getmantss_mask_round ( \
     (__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), \
     (int)(((D)<<2) | (C)), \
     (__v4sf)(__m128)(W), (__mmask8)(U), (R)))
#define _mm_maskz_getmant_round_ss(U, X, Y, C, D, R) \
  ((__m128)__builtin_ia32_getmantss_mask_round ( \
     (__v4sf)(__m128)(X), (__v4sf)(__m128)(Y), \
     (int)(((D)<<2) | (C)), \
     (__v4sf)(__m128)_mm_setzero_ps(), (__mmask8)(U), (R)))
/* Macro forms of the scalar getexp wrappers.

   All six expansions are fully parenthesized and cast their vector
   arguments.  The mask/maskz forms previously expanded to a bare
   "(type) call (...)" with uncast arguments, unlike the unmasked forms
   next to them; a postfix operator or sizeof applied to such an expansion
   binds to the call rather than to the cast result.  */
#define _mm_getexp_round_ss(A, B, R) \
  ((__m128) __builtin_ia32_getexpss128_round ((__v4sf)(__m128)(A), \
     (__v4sf)(__m128)(B), (R)))
#define _mm_mask_getexp_round_ss(W, U, A, B, C) \
  ((__m128) __builtin_ia32_getexpss_mask_round ((__v4sf)(__m128)(A), \
     (__v4sf)(__m128)(B), (__v4sf)(__m128)(W), (__mmask8)(U), (C)))
#define _mm_maskz_getexp_round_ss(U, A, B, C) \
  ((__m128) __builtin_ia32_getexpss_mask_round ((__v4sf)(__m128)(A), \
     (__v4sf)(__m128)(B), (__v4sf) _mm_setzero_ps (), (__mmask8)(U), (C)))
#define _mm_getexp_round_sd(A, B, R) \
  ((__m128d) __builtin_ia32_getexpsd128_round ((__v2df)(__m128d)(A), \
     (__v2df)(__m128d)(B), (R)))
#define _mm_mask_getexp_round_sd(W, U, A, B, C) \
  ((__m128d) __builtin_ia32_getexpsd_mask_round ((__v2df)(__m128d)(A), \
     (__v2df)(__m128d)(B), (__v2df)(__m128d)(W), (__mmask8)(U), (C)))
#define _mm_maskz_getexp_round_sd(U, A, B, C) \
  ((__m128d) __builtin_ia32_getexpsd_mask_round ((__v2df)(__m128d)(A), \
     (__v2df)(__m128d)(B), (__v2df) _mm_setzero_pd (), (__mmask8)(U), (C)))
/* Macro forms of the 512-bit single-precision getexp wrappers: unmasked
   (all-ones mask, undefined pass-through), merge-masking (W) and
   zero-masking.  */
#define _mm512_getexp_round_ps(A, R) \
  ((__m512)__builtin_ia32_getexpps512_mask( \
     (__v16sf)(__m512)(A), \
     (__v16sf)_mm512_undefined_ps(), (__mmask16)-1, R))
#define _mm512_mask_getexp_round_ps(W, U, A, R) \
  ((__m512)__builtin_ia32_getexpps512_mask( \
     (__v16sf)(__m512)(A), \
     (__v16sf)(__m512)(W), (__mmask16)(U), R))
#define _mm512_maskz_getexp_round_ps(U, A, R) \
  ((__m512)__builtin_ia32_getexpps512_mask( \
     (__v16sf)(__m512)(A), \
     (__v16sf)_mm512_setzero_ps(), (__mmask16)(U), R))
/* Macro forms of the 512-bit double-precision getexp wrappers: unmasked
   (all-ones mask, undefined pass-through), merge-masking (W) and
   zero-masking.  */
#define _mm512_getexp_round_pd(A, R) \
  ((__m512d)__builtin_ia32_getexppd512_mask( \
     (__v8df)(__m512d)(A), \
     (__v8df)_mm512_undefined_pd(), (__mmask8)-1, R))
#define _mm512_mask_getexp_round_pd(W, U, A, R) \
  ((__m512d)__builtin_ia32_getexppd512_mask( \
     (__v8df)(__m512d)(A), \
     (__v8df)(__m512d)(W), (__mmask8)(U), R))
#define _mm512_maskz_getexp_round_pd(U, A, R) \
  ((__m512d)__builtin_ia32_getexppd512_mask( \
     (__v8df)(__m512d)(A), \
     (__v8df)_mm512_setzero_pd(), (__mmask8)(U), R))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_roundscale_round_ps (__m512 __A, const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A, __imm,
- (__v16sf)
- _mm512_undefined_ps (),
- -1, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_roundscale_round_ps (__m512 __A, __mmask16 __B, __m512 __C,
- const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __C, __imm,
- (__v16sf) __A,
- (__mmask16) __B, __R);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_roundscale_round_ps (__mmask16 __A, __m512 __B,
- const int __imm, const int __R)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __B,
- __imm,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __A, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_roundscale_round_pd (__m512d __A, const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A, __imm,
- (__v8df)
- _mm512_undefined_pd (),
- -1, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_roundscale_round_pd (__m512d __A, __mmask8 __B,
- __m512d __C, const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __C, __imm,
- (__v8df) __A,
- (__mmask8) __B, __R);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_roundscale_round_pd (__mmask8 __A, __m512d __B,
- const int __imm, const int __R)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __B,
- __imm,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __A, __R);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_roundscale_round_ss (__m128 __A, __m128 __B, const int __imm, const int __R)
- {
- return (__m128) __builtin_ia32_rndscaless_round ((__v4sf) __A,
- (__v4sf) __B, __imm, __R);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_roundscale_round_sd (__m128d __A, __m128d __B, const int __imm,
- const int __R)
- {
- return (__m128d) __builtin_ia32_rndscalesd_round ((__v2df) __A,
- (__v2df) __B, __imm, __R);
- }
- #else
/* Macro forms of the 512-bit single-precision roundscale wrappers, selected
   when __OPTIMIZE__ is not defined.  In the mask form A is the pass-through
   operand, B the mask and C the source; in the maskz form A is the mask and
   B the source.  */
#define _mm512_roundscale_round_ps(A, B, R) \
  ((__m512) __builtin_ia32_rndscaleps_mask ( \
     (__v16sf)(__m512)(A), (int)(B), \
     (__v16sf)_mm512_undefined_ps(), (__mmask16)(-1), R))
#define _mm512_mask_roundscale_round_ps(A, B, C, D, R) \
  ((__m512) __builtin_ia32_rndscaleps_mask ( \
     (__v16sf)(__m512)(C), (int)(D), \
     (__v16sf)(__m512)(A), (__mmask16)(B), R))
#define _mm512_maskz_roundscale_round_ps(A, B, C, R) \
  ((__m512) __builtin_ia32_rndscaleps_mask ( \
     (__v16sf)(__m512)(B), (int)(C), \
     (__v16sf)_mm512_setzero_ps(), (__mmask16)(A), R))
/* Macro forms of the 512-bit double-precision roundscale wrappers.  In the
   mask form A is the pass-through operand, B the mask and C the source; in
   the maskz form A is the mask and B the source.  */
#define _mm512_roundscale_round_pd(A, B, R) \
  ((__m512d) __builtin_ia32_rndscalepd_mask ( \
     (__v8df)(__m512d)(A), (int)(B), \
     (__v8df)_mm512_undefined_pd(), (__mmask8)(-1), R))
#define _mm512_mask_roundscale_round_pd(A, B, C, D, R) \
  ((__m512d) __builtin_ia32_rndscalepd_mask ( \
     (__v8df)(__m512d)(C), (int)(D), \
     (__v8df)(__m512d)(A), (__mmask8)(B), R))
#define _mm512_maskz_roundscale_round_pd(A, B, C, R) \
  ((__m512d) __builtin_ia32_rndscalepd_mask ( \
     (__v8df)(__m512d)(B), (int)(C), \
     (__v8df)_mm512_setzero_pd(), (__mmask8)(A), R))
/* Macro forms of the scalar roundscale wrappers: both vector operands are
   cast, C is converted to int, and R is forwarded as written.  */
#define _mm_roundscale_round_ss(A, B, C, R) \
  ((__m128) __builtin_ia32_rndscaless_round ( \
     (__v4sf)(__m128)(A), (__v4sf)(__m128)(B), (int)(C), R))
#define _mm_roundscale_round_sd(A, B, C, R) \
  ((__m128d) __builtin_ia32_rndscalesd_round ( \
     (__v2df)(__m128d)(A), (__v2df)(__m128d)(B), (int)(C), R))
- #endif
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_floor_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
- _MM_FROUND_FLOOR,
- (__v16sf) __A, -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_floor_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A,
- _MM_FROUND_FLOOR,
- (__v8df) __A, -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_ceil_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
- _MM_FROUND_CEIL,
- (__v16sf) __A, -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_ceil_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A,
- _MM_FROUND_CEIL,
- (__v8df) __A, -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_floor_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
- _MM_FROUND_FLOOR,
- (__v16sf) __W, __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_floor_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_rndscalepd_mask ((__v8df) __A,
- _MM_FROUND_FLOOR,
- (__v8df) __W, __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_ceil_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_rndscaleps_mask ((__v16sf) __A,
- _MM_FROUND_CEIL,
- (__v16sf) __W, __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Masked packed-double ceil: rndscalepd builtin with _MM_FROUND_CEIL, __W as
-    the pass-through operand and __U as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_ceil_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __pass = (__v8df) __W;
-   return (__m512d) __builtin_ia32_rndscalepd_mask (__src, _MM_FROUND_CEIL,
-                                                   __pass, __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- #ifdef __OPTIMIZE__
- /* Unmasked alignr on 32-bit elements: alignd512 builtin on __A, __B and __imm,
-    with an undefined pass-through vector and mask -1.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_alignr_epi32 (__m512i __A, __m512i __B, const int __imm)
- {
-   const __v16si __pass = (__v16si) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_alignd512_mask ((__v16si) __A, (__v16si) __B,
-                                                  __imm, __pass,
-                                                  (__mmask16) -1);
- }
- /* Masked alignr on 32-bit elements: alignd512 builtin on __A, __B and __imm,
-    with __W as the pass-through vector and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_alignr_epi32 (__m512i __W, __mmask16 __U, __m512i __A,
-                           __m512i __B, const int __imm)
- {
-   const __v16si __pass = (__v16si) __W;
-   return (__m512i) __builtin_ia32_alignd512_mask ((__v16si) __A, (__v16si) __B,
-                                                  __imm, __pass,
-                                                  (__mmask16) __U);
- }
- /* Zero-masked alignr on 32-bit elements: alignd512 builtin on __A, __B and
-    __imm, with a zero vector as pass-through and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_alignr_epi32 (__mmask16 __U, __m512i __A, __m512i __B,
-                            const int __imm)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_alignd512_mask ((__v16si) __A, (__v16si) __B,
-                                                  __imm, __zero,
-                                                  (__mmask16) __U);
- }
- /* Unmasked alignr on 64-bit elements: alignq512 builtin on __A, __B and __imm,
-    with an undefined pass-through vector and mask -1.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_alignr_epi64 (__m512i __A, __m512i __B, const int __imm)
- {
-   const __v8di __pass = (__v8di) _mm512_undefined_epi32 ();
-   return (__m512i) __builtin_ia32_alignq512_mask ((__v8di) __A, (__v8di) __B,
-                                                  __imm, __pass,
-                                                  (__mmask8) -1);
- }
- /* Masked alignr on 64-bit elements: alignq512 builtin on __A, __B and __imm,
-    with __W as the pass-through vector and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_alignr_epi64 (__m512i __W, __mmask8 __U, __m512i __A,
-                           __m512i __B, const int __imm)
- {
-   const __v8di __pass = (__v8di) __W;
-   return (__m512i) __builtin_ia32_alignq512_mask ((__v8di) __A, (__v8di) __B,
-                                                  __imm, __pass,
-                                                  (__mmask8) __U);
- }
- /* Zero-masked alignr on 64-bit elements: alignq512 builtin on __A, __B and
-    __imm, with a zero vector as pass-through and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_alignr_epi64 (__mmask8 __U, __m512i __A, __m512i __B,
-                            const int __imm)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_alignq512_mask ((__v8di) __A, (__v8di) __B,
-                                                  __imm, __zero,
-                                                  (__mmask8) __U);
- }
- #else
- /* Macro form (used when __OPTIMIZE__ is not defined): alignd512 builtin with
-    an undefined pass-through vector and mask -1.  */
- #define _mm512_alignr_epi32(X, Y, C) \
-   ((__m512i) __builtin_ia32_alignd512_mask ( \
-      (__v16si) (__m512i) (X), \
-      (__v16si) (__m512i) (Y), \
-      (int) (C), \
-      (__v16si) _mm512_undefined_epi32 (), \
-      (__mmask16) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): alignd512 builtin with
-    W as the pass-through vector and U as the mask.  */
- #define _mm512_mask_alignr_epi32(W, U, X, Y, C) \
-   ((__m512i) __builtin_ia32_alignd512_mask ( \
-      (__v16si) (__m512i) (X), \
-      (__v16si) (__m512i) (Y), \
-      (int) (C), \
-      (__v16si) (__m512i) (W), \
-      (__mmask16) (U)))
- /* Macro form (used when __OPTIMIZE__ is not defined): alignd512 builtin with
-    a zero vector as pass-through and U as the mask.  */
- #define _mm512_maskz_alignr_epi32(U, X, Y, C) \
-   ((__m512i) __builtin_ia32_alignd512_mask ( \
-      (__v16si) (__m512i) (X), \
-      (__v16si) (__m512i) (Y), \
-      (int) (C), \
-      (__v16si) _mm512_setzero_si512 (), \
-      (__mmask16) (U)))
- /* Macro form (used when __OPTIMIZE__ is not defined): alignq512 builtin with
-    an undefined pass-through vector and mask -1.  */
- #define _mm512_alignr_epi64(X, Y, C) \
-   ((__m512i) __builtin_ia32_alignq512_mask ( \
-      (__v8di) (__m512i) (X), \
-      (__v8di) (__m512i) (Y), \
-      (int) (C), \
-      (__v8di) _mm512_undefined_epi32 (), \
-      (__mmask8) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): alignq512 builtin with
-    W as the pass-through vector and U as the mask.  */
- #define _mm512_mask_alignr_epi64(W, U, X, Y, C) \
-   ((__m512i) __builtin_ia32_alignq512_mask ( \
-      (__v8di) (__m512i) (X), \
-      (__v8di) (__m512i) (Y), \
-      (int) (C), \
-      (__v8di) (__m512i) (W), \
-      (__mmask8) (U)))
- /* Macro form (used when __OPTIMIZE__ is not defined): alignq512 builtin with
-    a zero vector as pass-through and U as the mask.  */
- #define _mm512_maskz_alignr_epi64(U, X, Y, C) \
-   ((__m512i) __builtin_ia32_alignq512_mask ( \
-      (__v8di) (__m512i) (X), \
-      (__v8di) (__m512i) (Y), \
-      (int) (C), \
-      (__v8di) _mm512_setzero_si512 (), \
-      (__mmask8) (U)))
- #endif
- /* cmpeq on epi32 lanes: pcmpeqd512 builtin on __A and __B with mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_epi32_mask (__m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_pcmpeqd512_mask (__lhs, __rhs,
-                                                     (__mmask16) -1);
- }
- /* Masked cmpeq on epi32 lanes: pcmpeqd512 builtin on __A and __B with __U as
-    the mask operand.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_epi32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_pcmpeqd512_mask (__lhs, __rhs, __U);
- }
- /* Masked cmpeq on epi64 lanes: pcmpeqq512 builtin on __A and __B with __U as
-    the mask operand.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_epi64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_pcmpeqq512_mask (__lhs, __rhs, __U);
- }
- /* cmpeq on epi64 lanes: pcmpeqq512 builtin on __A and __B with mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_epi64_mask (__m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_pcmpeqq512_mask (__lhs, __rhs,
-                                                    (__mmask8) -1);
- }
- /* cmpgt on epi32 lanes: pcmpgtd512 builtin on __A and __B with mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpgt_epi32_mask (__m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_pcmpgtd512_mask (__lhs, __rhs,
-                                                     (__mmask16) -1);
- }
- /* Masked cmpgt on epi32 lanes: pcmpgtd512 builtin on __A and __B with __U as
-    the mask operand.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpgt_epi32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_pcmpgtd512_mask (__lhs, __rhs, __U);
- }
- /* Masked cmpgt on epi64 lanes: pcmpgtq512 builtin on __A and __B with __U as
-    the mask operand.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpgt_epi64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_pcmpgtq512_mask (__lhs, __rhs, __U);
- }
- /* cmpgt on epi64 lanes: pcmpgtq512 builtin on __A and __B with mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpgt_epi64_mask (__m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_pcmpgtq512_mask (__lhs, __rhs,
-                                                    (__mmask8) -1);
- }
- /* cmpge on epi32 lanes: cmpd512 builtin with predicate 5 (the value defined
-    later in this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpge_epi32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 5,
-                                                  (__mmask16) -1);
- }
- /* Masked cmpge on epi32 lanes: cmpd512 builtin with predicate 5 (defined later
-    in this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpge_epi32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 5,
-                                                  (__mmask16) __M);
- }
- /* Masked cmpge on epu32 lanes: ucmpd512 builtin with predicate 5 (defined
-    later in this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpge_epu32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 5,
-                                                   (__mmask16) __M);
- }
- /* cmpge on epu32 lanes: ucmpd512 builtin with predicate 5 (defined later in
-    this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpge_epu32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 5,
-                                                   (__mmask16) -1);
- }
- /* Masked cmpge on epi64 lanes: cmpq512 builtin with predicate 5 (defined later
-    in this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpge_epi64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 5,
-                                                 (__mmask8) __M);
- }
- /* cmpge on epi64 lanes: cmpq512 builtin with predicate 5 (defined later in
-    this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpge_epi64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 5,
-                                                 (__mmask8) -1);
- }
- /* Masked cmpge on epu64 lanes: ucmpq512 builtin with predicate 5 (defined
-    later in this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpge_epu64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 5,
-                                                  (__mmask8) __M);
- }
- /* cmpge on epu64 lanes: ucmpq512 builtin with predicate 5 (defined later in
-    this file as _MM_CMPINT_NLT / _MM_CMPINT_GE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpge_epu64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 5,
-                                                  (__mmask8) -1);
- }
- /* Masked cmple on epi32 lanes: cmpd512 builtin with predicate 2 (defined later
-    in this file as _MM_CMPINT_LE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_epi32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 2,
-                                                  (__mmask16) __M);
- }
- /* cmple on epi32 lanes: cmpd512 builtin with predicate 2 (defined later in
-    this file as _MM_CMPINT_LE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_epi32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 2,
-                                                  (__mmask16) -1);
- }
- /* Masked cmple on epu32 lanes: ucmpd512 builtin with predicate 2 (defined
-    later in this file as _MM_CMPINT_LE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_epu32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 2,
-                                                   (__mmask16) __M);
- }
- /* cmple on epu32 lanes: ucmpd512 builtin with predicate 2 (defined later in
-    this file as _MM_CMPINT_LE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_epu32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 2,
-                                                   (__mmask16) -1);
- }
- /* Masked cmple on epi64 lanes: cmpq512 builtin with predicate 2 (defined later
-    in this file as _MM_CMPINT_LE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_epi64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 2,
-                                                 (__mmask8) __M);
- }
- /* cmple on epi64 lanes: cmpq512 builtin with predicate 2 (defined later in
-    this file as _MM_CMPINT_LE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_epi64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 2,
-                                                 (__mmask8) -1);
- }
- /* Masked cmple on epu64 lanes: ucmpq512 builtin with predicate 2 (defined
-    later in this file as _MM_CMPINT_LE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_epu64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 2,
-                                                  (__mmask8) __M);
- }
- /* cmple on epu64 lanes: ucmpq512 builtin with predicate 2 (defined later in
-    this file as _MM_CMPINT_LE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_epu64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 2,
-                                                  (__mmask8) -1);
- }
- /* Masked cmplt on epi32 lanes: cmpd512 builtin with predicate 1 (defined later
-    in this file as _MM_CMPINT_LT) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_epi32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 1,
-                                                  (__mmask16) __M);
- }
- /* cmplt on epi32 lanes: cmpd512 builtin with predicate 1 (defined later in
-    this file as _MM_CMPINT_LT) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_epi32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 1,
-                                                  (__mmask16) -1);
- }
- /* Masked cmplt on epu32 lanes: ucmpd512 builtin with predicate 1 (defined
-    later in this file as _MM_CMPINT_LT) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_epu32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 1,
-                                                   (__mmask16) __M);
- }
- /* cmplt on epu32 lanes: ucmpd512 builtin with predicate 1 (defined later in
-    this file as _MM_CMPINT_LT) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_epu32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 1,
-                                                   (__mmask16) -1);
- }
- /* Masked cmplt on epi64 lanes: cmpq512 builtin with predicate 1 (defined later
-    in this file as _MM_CMPINT_LT) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_epi64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 1,
-                                                 (__mmask8) __M);
- }
- /* cmplt on epi64 lanes: cmpq512 builtin with predicate 1 (defined later in
-    this file as _MM_CMPINT_LT) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_epi64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 1,
-                                                 (__mmask8) -1);
- }
- /* Masked cmplt on epu64 lanes: ucmpq512 builtin with predicate 1 (defined
-    later in this file as _MM_CMPINT_LT) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_epu64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 1,
-                                                  (__mmask8) __M);
- }
- /* cmplt on epu64 lanes: ucmpq512 builtin with predicate 1 (defined later in
-    this file as _MM_CMPINT_LT) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_epu64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 1,
-                                                  (__mmask8) -1);
- }
- /* cmpneq on epi32 lanes: cmpd512 builtin with predicate 4 (defined later in
-    this file as _MM_CMPINT_NE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_epi32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 4,
-                                                  (__mmask16) -1);
- }
- /* Masked cmpneq on epi32 lanes: cmpd512 builtin with predicate 4 (defined
-    later in this file as _MM_CMPINT_NE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_epi32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, 4,
-                                                  (__mmask16) __M);
- }
- /* Masked cmpneq on epu32 lanes: ucmpd512 builtin with predicate 4 (defined
-    later in this file as _MM_CMPINT_NE) and __M as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_epu32_mask (__mmask16 __M, __m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 4,
-                                                   (__mmask16) __M);
- }
- /* cmpneq on epu32 lanes: ucmpd512 builtin with predicate 4 (defined later in
-    this file as _MM_CMPINT_NE) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_epu32_mask (__m512i __X, __m512i __Y)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 4,
-                                                   (__mmask16) -1);
- }
- /* Masked cmpneq on epi64 lanes: cmpq512 builtin with predicate 4 (defined
-    later in this file as _MM_CMPINT_NE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_epi64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 4,
-                                                 (__mmask8) __M);
- }
- /* cmpneq on epi64 lanes: cmpq512 builtin with predicate 4 (defined later in
-    this file as _MM_CMPINT_NE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_epi64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, 4,
-                                                 (__mmask8) -1);
- }
- /* Masked cmpneq on epu64 lanes: ucmpq512 builtin with predicate 4 (defined
-    later in this file as _MM_CMPINT_NE) and __M as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_epu64_mask (__mmask8 __M, __m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 4,
-                                                  (__mmask8) __M);
- }
- /* cmpneq on epu64 lanes: ucmpq512 builtin with predicate 4 (defined later in
-    this file as _MM_CMPINT_NE) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_epu64_mask (__m512i __X, __m512i __Y)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 4,
-                                                  (__mmask8) -1);
- }
- /* Named predicate codes for the integer compare builtins.  The fixed-predicate
-    wrappers earlier in this file pass the same numbers as literals: 1 (cmplt),
-    2 (cmple), 4 (cmpneq) and 5 (cmpge).  Presumably these names are meant for
-    the P argument of the _mm512_cmp_ep{i,u}{32,64}_mask family below -- confirm
-    against the intrinsics documentation.
-    NLT/GE share the value 0x5 and NLE/GT share 0x6; 0x3 is labelled UNUSED.  */
- #define _MM_CMPINT_EQ 0x0
- #define _MM_CMPINT_LT 0x1
- #define _MM_CMPINT_LE 0x2
- #define _MM_CMPINT_UNUSED 0x3
- #define _MM_CMPINT_NE 0x4
- #define _MM_CMPINT_NLT 0x5
- #define _MM_CMPINT_GE 0x5
- #define _MM_CMPINT_NLE 0x6
- #define _MM_CMPINT_GT 0x6
- #ifdef __OPTIMIZE__
- /* Hands __A and __B (narrowed to __mmask8) to the kshiftlihi builtin and
-    returns its result as a __mmask16.  __B is passed straight through rather
-    than via a local.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kshiftli_mask16 (__mmask16 __A, unsigned int __B)
- {
-   return (__mmask16)
-     __builtin_ia32_kshiftlihi ((__mmask16) __A, (__mmask8) __B);
- }
- /* Hands __A and __B (narrowed to __mmask8) to the kshiftrihi builtin and
-    returns its result as a __mmask16.  __B is passed straight through rather
-    than via a local.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kshiftri_mask16 (__mmask16 __A, unsigned int __B)
- {
-   return (__mmask16)
-     __builtin_ia32_kshiftrihi ((__mmask16) __A, (__mmask8) __B);
- }
- /* Generic epi64 compare: cmpq512 builtin with caller-supplied predicate __P
-    (forwarded untouched) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_epi64_mask (__m512i __X, __m512i __Y, const int __P)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, __P,
-                                                 (__mmask8) -1);
- }
- /* Generic epi32 compare: cmpd512 builtin with caller-supplied predicate __P
-    (forwarded untouched) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_epi32_mask (__m512i __X, __m512i __Y, const int __P)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, __P,
-                                                  (__mmask16) -1);
- }
- /* Generic epu64 compare: ucmpq512 builtin with caller-supplied predicate __P
-    (forwarded untouched) and mask -1.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_epu64_mask (__m512i __X, __m512i __Y, const int __P)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, __P,
-                                                  (__mmask8) -1);
- }
- /* Generic epu32 compare: ucmpd512 builtin with caller-supplied predicate __P
-    (forwarded untouched) and mask -1.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_epu32_mask (__m512i __X, __m512i __Y, const int __P)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, __P,
-                                                   (__mmask16) -1);
- }
- /* Packed-double compare: cmppd512 builtin with predicate __P, mask -1 and the
-    extra __R operand, both forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_round_pd_mask (__m512d __X, __m512d __Y, const int __P,
-                           const int __R)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, __P,
-                                                  (__mmask8) -1, __R);
- }
- /* Packed-float compare: cmpps512 builtin with predicate __P, mask -1 and the
-    extra __R operand, both forwarded untouched.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_round_ps_mask (__m512 __X, __m512 __Y, const int __P, const int __R)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, __P,
-                                                   (__mmask16) -1, __R);
- }
- /* Masked generic epi64 compare: cmpq512 builtin with predicate __P (forwarded
-    untouched) and __U as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_epi64_mask (__mmask8 __U, __m512i __X, __m512i __Y,
-                             const int __P)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_cmpq512_mask (__lhs, __rhs, __P,
-                                                 (__mmask8) __U);
- }
- /* Masked generic epi32 compare: cmpd512 builtin with predicate __P (forwarded
-    untouched) and __U as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_epi32_mask (__mmask16 __U, __m512i __X, __m512i __Y,
-                             const int __P)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_cmpd512_mask (__lhs, __rhs, __P,
-                                                  (__mmask16) __U);
- }
- /* Masked generic epu64 compare: ucmpq512 builtin with predicate __P (forwarded
-    untouched) and __U as the mask.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_epu64_mask (__mmask8 __U, __m512i __X, __m512i __Y,
-                             const int __P)
- {
-   const __v8di __lhs = (__v8di) __X;
-   const __v8di __rhs = (__v8di) __Y;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, __P,
-                                                  (__mmask8) __U);
- }
- /* Masked generic epu32 compare: ucmpd512 builtin with predicate __P (forwarded
-    untouched) and __U as the mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_epu32_mask (__mmask16 __U, __m512i __X, __m512i __Y,
-                             const int __P)
- {
-   const __v16si __lhs = (__v16si) __X;
-   const __v16si __rhs = (__v16si) __Y;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, __P,
-                                                   (__mmask16) __U);
- }
- /* Masked packed-double compare: cmppd512 builtin with predicate __P, mask __U
-    and the extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_round_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y,
-                                const int __P, const int __R)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, __P,
-                                                  (__mmask8) __U, __R);
- }
- /* Masked packed-float compare: cmpps512 builtin with predicate __P, mask __U
-    and the extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_round_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y,
-                                const int __P, const int __R)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, __P,
-                                                   (__mmask16) __U, __R);
- }
- /* 128-bit double compare via the cmpsd builtin: predicate __P, mask -1 and the
-    extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cmp_round_sd_mask (__m128d __X, __m128d __Y, const int __P, const int __R)
- {
-   const __v2df __lhs = (__v2df) __X;
-   const __v2df __rhs = (__v2df) __Y;
-   return (__mmask8) __builtin_ia32_cmpsd_mask (__lhs, __rhs, __P,
-                                               (__mmask8) -1, __R);
- }
- /* Masked 128-bit double compare via the cmpsd builtin: predicate __P, mask __M
-    and the extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_cmp_round_sd_mask (__mmask8 __M, __m128d __X, __m128d __Y,
-                             const int __P, const int __R)
- {
-   const __v2df __lhs = (__v2df) __X;
-   const __v2df __rhs = (__v2df) __Y;
-   return (__mmask8) __builtin_ia32_cmpsd_mask (__lhs, __rhs, __P,
-                                               (__mmask8) __M, __R);
- }
- /* 128-bit float compare via the cmpss builtin: predicate __P, mask -1 and the
-    extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cmp_round_ss_mask (__m128 __X, __m128 __Y, const int __P, const int __R)
- {
-   const __v4sf __lhs = (__v4sf) __X;
-   const __v4sf __rhs = (__v4sf) __Y;
-   return (__mmask8) __builtin_ia32_cmpss_mask (__lhs, __rhs, __P,
-                                               (__mmask8) -1, __R);
- }
- /* Masked 128-bit float compare via the cmpss builtin: predicate __P, mask __M
-    and the extra __R operand; __P and __R are forwarded untouched.  */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_cmp_round_ss_mask (__mmask8 __M, __m128 __X, __m128 __Y,
-                             const int __P, const int __R)
- {
-   const __v4sf __lhs = (__v4sf) __X;
-   const __v4sf __rhs = (__v4sf) __Y;
-   return (__mmask8) __builtin_ia32_cmpss_mask (__lhs, __rhs, __P,
-                                               (__mmask8) __M, __R);
- }
- #else
- /* Macro form (used when __OPTIMIZE__ is not defined): kshiftlihi builtin on X
-    and Y, with Y narrowed to __mmask8.  */
- #define _kshiftli_mask16(X, Y) \
-   ((__mmask16) __builtin_ia32_kshiftlihi ( \
-      (__mmask16) (X), \
-      (__mmask8) (Y)))
- /* Macro form (used when __OPTIMIZE__ is not defined): kshiftrihi builtin on X
-    and Y, with Y narrowed to __mmask8.  */
- #define _kshiftri_mask16(X, Y) \
-   ((__mmask16) __builtin_ia32_kshiftrihi ( \
-      (__mmask16) (X), \
-      (__mmask8) (Y)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpq512 builtin with
-    predicate P and mask -1.  */
- #define _mm512_cmp_epi64_mask(X, Y, P) \
-   ((__mmask8) __builtin_ia32_cmpq512_mask ( \
-      (__v8di) (__m512i) (X), \
-      (__v8di) (__m512i) (Y), \
-      (int) (P), \
-      (__mmask8) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpd512 builtin with
-    predicate P and mask -1.  */
- #define _mm512_cmp_epi32_mask(X, Y, P) \
-   ((__mmask16) __builtin_ia32_cmpd512_mask ( \
-      (__v16si) (__m512i) (X), \
-      (__v16si) (__m512i) (Y), \
-      (int) (P), \
-      (__mmask16) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): ucmpq512 builtin with
-    predicate P and mask -1.  */
- #define _mm512_cmp_epu64_mask(X, Y, P) \
-   ((__mmask8) __builtin_ia32_ucmpq512_mask ( \
-      (__v8di) (__m512i) (X), \
-      (__v8di) (__m512i) (Y), \
-      (int) (P), \
-      (__mmask8) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): ucmpd512 builtin with
-    predicate P and mask -1.  */
- #define _mm512_cmp_epu32_mask(X, Y, P) \
-   ((__mmask16) __builtin_ia32_ucmpd512_mask ( \
-      (__v16si) (__m512i) (X), \
-      (__v16si) (__m512i) (Y), \
-      (int) (P), \
-      (__mmask16) -1))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmppd512 builtin with
-    predicate P, mask -1 and the extra operand R.  R is parenthesized like every
-    other macro argument so the expansion does not depend on how the caller
-    spells it.  */
- #define _mm512_cmp_round_pd_mask(X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmppd512_mask ((__v8df)(__m512d)(X), \
-                                            (__v8df)(__m512d)(Y), (int)(P), \
-                                            (__mmask8)-1, (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpps512 builtin with
-    predicate P, mask -1 and the extra operand R.  R is parenthesized like every
-    other macro argument so the expansion does not depend on how the caller
-    spells it.  */
- #define _mm512_cmp_round_ps_mask(X, Y, P, R) \
-   ((__mmask16) __builtin_ia32_cmpps512_mask ((__v16sf)(__m512)(X), \
-                                             (__v16sf)(__m512)(Y), (int)(P), \
-                                             (__mmask16)-1, (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpq512 builtin with
-    predicate P and mask M.  M is parenthesized before the cast: a bare
-    "(__mmask8)M" would cast only the first operand of an expression argument
-    such as "c ? a : b".  */
- #define _mm512_mask_cmp_epi64_mask(M, X, Y, P) \
-   ((__mmask8) __builtin_ia32_cmpq512_mask ((__v8di)(__m512i)(X), \
-                                           (__v8di)(__m512i)(Y), (int)(P), \
-                                           (__mmask8)(M)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpd512 builtin with
-    predicate P and mask M.  M is parenthesized before the cast: a bare
-    "(__mmask16)M" would cast only the first operand of an expression argument
-    such as "c ? a : b".  */
- #define _mm512_mask_cmp_epi32_mask(M, X, Y, P) \
-   ((__mmask16) __builtin_ia32_cmpd512_mask ((__v16si)(__m512i)(X), \
-                                            (__v16si)(__m512i)(Y), (int)(P), \
-                                            (__mmask16)(M)))
- /* Macro form (used when __OPTIMIZE__ is not defined): ucmpq512 builtin with
-    predicate P and mask M.  M is parenthesized before the cast: a bare
-    "(__mmask8)M" would cast only the first operand of an expression argument
-    such as "c ? a : b".  */
- #define _mm512_mask_cmp_epu64_mask(M, X, Y, P) \
-   ((__mmask8) __builtin_ia32_ucmpq512_mask ((__v8di)(__m512i)(X), \
-                                            (__v8di)(__m512i)(Y), (int)(P), \
-                                            (__mmask8)(M)))
- /* Macro form (used when __OPTIMIZE__ is not defined): ucmpd512 builtin with
-    predicate P and mask M.  M is parenthesized before the cast: a bare
-    "(__mmask16)M" would cast only the first operand of an expression argument
-    such as "c ? a : b".  */
- #define _mm512_mask_cmp_epu32_mask(M, X, Y, P) \
-   ((__mmask16) __builtin_ia32_ucmpd512_mask ((__v16si)(__m512i)(X), \
-                                             (__v16si)(__m512i)(Y), (int)(P), \
-                                             (__mmask16)(M)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmppd512 builtin with
-    predicate P, mask M and the extra operand R.  M is parenthesized before the
-    cast (a bare "(__mmask8)M" would cast only the first operand of an
-    expression argument such as "c ? a : b"); R is parenthesized too.  */
- #define _mm512_mask_cmp_round_pd_mask(M, X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmppd512_mask ((__v8df)(__m512d)(X), \
-                                            (__v8df)(__m512d)(Y), (int)(P), \
-                                            (__mmask8)(M), (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpps512 builtin with
-    predicate P, mask M and the extra operand R.  M is parenthesized before the
-    cast (a bare "(__mmask16)M" would cast only the first operand of an
-    expression argument such as "c ? a : b"); R is parenthesized too.  */
- #define _mm512_mask_cmp_round_ps_mask(M, X, Y, P, R) \
-   ((__mmask16) __builtin_ia32_cmpps512_mask ((__v16sf)(__m512)(X), \
-                                             (__v16sf)(__m512)(Y), (int)(P), \
-                                             (__mmask16)(M), (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpsd builtin with
-    predicate P, mask -1 and the extra operand R.  R is parenthesized like every
-    other macro argument.  */
- #define _mm_cmp_round_sd_mask(X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmpsd_mask ((__v2df)(__m128d)(X), \
-                                         (__v2df)(__m128d)(Y), (int)(P), \
-                                         (__mmask8)-1, (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpsd builtin with
-    predicate P, mask M and the extra operand R.  M gets the same __mmask8 cast
-    the inline-function form of this intrinsic applies, and R is parenthesized
-    like every other macro argument.  */
- #define _mm_mask_cmp_round_sd_mask(M, X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmpsd_mask ((__v2df)(__m128d)(X), \
-                                         (__v2df)(__m128d)(Y), (int)(P), \
-                                         (__mmask8)(M), (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpss builtin with
-    predicate P, mask -1 and the extra operand R.  R is parenthesized like every
-    other macro argument.  */
- #define _mm_cmp_round_ss_mask(X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmpss_mask ((__v4sf)(__m128)(X), \
-                                         (__v4sf)(__m128)(Y), (int)(P), \
-                                         (__mmask8)-1, (R)))
- /* Macro form (used when __OPTIMIZE__ is not defined): cmpss builtin with
-    predicate P, mask M and the extra operand R.  M gets the same __mmask8 cast
-    the inline-function form of this intrinsic applies, and R is parenthesized
-    like every other macro argument.  */
- #define _mm_mask_cmp_round_ss_mask(M, X, Y, P, R) \
-   ((__mmask8) __builtin_ia32_cmpss_mask ((__v4sf)(__m128)(X), \
-                                         (__v4sf)(__m128)(Y), (int)(P), \
-                                         (__mmask8)(M), (R)))
- #endif
- #ifdef __OPTIMIZE__
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32gather_ps (__m512i __index, void const *__addr, int __scale)
- {
- __m512 __v1_old = _mm512_undefined_ps ();
- __mmask16 __mask = 0xFFFF;
- return (__m512) __builtin_ia32_gathersiv16sf ((__v16sf) __v1_old,
- __addr,
- (__v16si) __index,
- __mask, __scale);
- }
- /* Masked gather via the gathersiv16sf builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32gather_ps (__m512 __v1_old, __mmask16 __mask,
-                           __m512i __index, void const *__addr, int __scale)
- {
-   const __v16sf __pass = (__v16sf) __v1_old;
-   const __v16si __idx = (__v16si) __index;
-   return (__m512) __builtin_ia32_gathersiv16sf (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32gather_pd (__m256i __index, void const *__addr, int __scale)
- {
- __m512d __v1_old = _mm512_undefined_pd ();
- __mmask8 __mask = 0xFF;
- return (__m512d) __builtin_ia32_gathersiv8df ((__v8df) __v1_old,
- __addr,
- (__v8si) __index, __mask,
- __scale);
- }
- /* Masked gather via the gathersiv8df builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32gather_pd (__m512d __v1_old, __mmask8 __mask,
-                           __m256i __index, void const *__addr, int __scale)
- {
-   const __v8df __pass = (__v8df) __v1_old;
-   const __v8si __idx = (__v8si) __index;
-   return (__m512d) __builtin_ia32_gathersiv8df (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64gather_ps (__m512i __index, void const *__addr, int __scale)
- {
- __m256 __v1_old = _mm256_undefined_ps ();
- __mmask8 __mask = 0xFF;
- return (__m256) __builtin_ia32_gatherdiv16sf ((__v8sf) __v1_old,
- __addr,
- (__v8di) __index, __mask,
- __scale);
- }
- /* Masked gather via the gatherdiv16sf builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64gather_ps (__m256 __v1_old, __mmask8 __mask,
-                           __m512i __index, void const *__addr, int __scale)
- {
-   const __v8sf __pass = (__v8sf) __v1_old;
-   const __v8di __idx = (__v8di) __index;
-   return (__m256) __builtin_ia32_gatherdiv16sf (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64gather_pd (__m512i __index, void const *__addr, int __scale)
- {
- __m512d __v1_old = _mm512_undefined_pd ();
- __mmask8 __mask = 0xFF;
- return (__m512d) __builtin_ia32_gatherdiv8df ((__v8df) __v1_old,
- __addr,
- (__v8di) __index, __mask,
- __scale);
- }
- /* Masked gather via the gatherdiv8df builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64gather_pd (__m512d __v1_old, __mmask8 __mask,
-                           __m512i __index, void const *__addr, int __scale)
- {
-   const __v8df __pass = (__v8df) __v1_old;
-   const __v8di __idx = (__v8di) __index;
-   return (__m512d) __builtin_ia32_gatherdiv8df (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32gather_epi32 (__m512i __index, void const *__addr, int __scale)
- {
- __m512i __v1_old = _mm512_undefined_epi32 ();
- __mmask16 __mask = 0xFFFF;
- return (__m512i) __builtin_ia32_gathersiv16si ((__v16si) __v1_old,
- __addr,
- (__v16si) __index,
- __mask, __scale);
- }
- /* Masked gather via the gathersiv16si builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32gather_epi32 (__m512i __v1_old, __mmask16 __mask,
-                              __m512i __index, void const *__addr, int __scale)
- {
-   const __v16si __pass = (__v16si) __v1_old;
-   const __v16si __idx = (__v16si) __index;
-   return (__m512i) __builtin_ia32_gathersiv16si (__pass, __addr, __idx,
-                                                 __mask, __scale);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32gather_epi64 (__m256i __index, void const *__addr, int __scale)
- {
- __m512i __v1_old = _mm512_undefined_epi32 ();
- __mmask8 __mask = 0xFF;
- return (__m512i) __builtin_ia32_gathersiv8di ((__v8di) __v1_old,
- __addr,
- (__v8si) __index, __mask,
- __scale);
- }
- /* Masked gather via the gathersiv8di builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32gather_epi64 (__m512i __v1_old, __mmask8 __mask,
-                              __m256i __index, void const *__addr,
-                              int __scale)
- {
-   const __v8di __pass = (__v8di) __v1_old;
-   const __v8si __idx = (__v8si) __index;
-   return (__m512i) __builtin_ia32_gathersiv8di (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64gather_epi32 (__m512i __index, void const *__addr, int __scale)
- {
- __m256i __v1_old = _mm256_undefined_si256 ();
- __mmask8 __mask = 0xFF;
- return (__m256i) __builtin_ia32_gatherdiv16si ((__v8si) __v1_old,
- __addr,
- (__v8di) __index,
- __mask, __scale);
- }
- /* Masked gather via the gatherdiv16si builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64gather_epi32 (__m256i __v1_old, __mmask8 __mask,
-                              __m512i __index, void const *__addr, int __scale)
- {
-   const __v8si __pass = (__v8si) __v1_old;
-   const __v8di __idx = (__v8di) __index;
-   return (__m256i) __builtin_ia32_gatherdiv16si (__pass, __addr, __idx,
-                                                 __mask, __scale);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64gather_epi64 (__m512i __index, void const *__addr, int __scale)
- {
- __m512i __v1_old = _mm512_undefined_epi32 ();
- __mmask8 __mask = 0xFF;
- return (__m512i) __builtin_ia32_gatherdiv8di ((__v8di) __v1_old,
- __addr,
- (__v8di) __index, __mask,
- __scale);
- }
- /* Masked gather via the gatherdiv8di builtin: __v1_old is the pass-through
-    vector and __mask the mask; __addr, __index and __scale are forwarded.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64gather_epi64 (__m512i __v1_old, __mmask8 __mask,
-                              __m512i __index, void const *__addr,
-                              int __scale)
- {
-   const __v8di __pass = (__v8di) __v1_old;
-   const __v8di __idx = (__v8di) __index;
-   return (__m512i) __builtin_ia32_gatherdiv8di (__pass, __addr, __idx,
-                                                __mask, __scale);
- }
- /* Unmasked scatter via the scattersiv16sf builtin: mask 0xFFFF, with __addr,
-    __index, __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32scatter_ps (void *__addr, __m512i __index, __m512 __v1, int __scale)
- {
-   const __v16si __idx = (__v16si) __index;
-   const __v16sf __data = (__v16sf) __v1;
-   __builtin_ia32_scattersiv16sf (__addr, (__mmask16) 0xFFFF, __idx, __data,
-                                  __scale);
- }
- /* Masked scatter via the scattersiv16sf builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32scatter_ps (void *__addr, __mmask16 __mask,
-                            __m512i __index, __m512 __v1, int __scale)
- {
-   const __v16si __idx = (__v16si) __index;
-   const __v16sf __data = (__v16sf) __v1;
-   __builtin_ia32_scattersiv16sf (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scattersiv8df builtin: mask 0xFF, with __addr,
-    __index (as __v8si), __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32scatter_pd (void *__addr, __m256i __index, __m512d __v1,
-                       int __scale)
- {
-   const __v8si __idx = (__v8si) __index;
-   const __v8df __data = (__v8df) __v1;
-   __builtin_ia32_scattersiv8df (__addr, (__mmask8) 0xFF, __idx, __data,
-                                 __scale);
- }
- /* Masked scatter via the scattersiv8df builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32scatter_pd (void *__addr, __mmask8 __mask,
-                            __m256i __index, __m512d __v1, int __scale)
- {
-   const __v8si __idx = (__v8si) __index;
-   const __v8df __data = (__v8df) __v1;
-   __builtin_ia32_scattersiv8df (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scatterdiv16sf builtin: mask 0xFF, with __addr,
-    __index, the 256-bit __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64scatter_ps (void *__addr, __m512i __index, __m256 __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8sf __data = (__v8sf) __v1;
-   __builtin_ia32_scatterdiv16sf (__addr, (__mmask8) 0xFF, __idx, __data,
-                                  __scale);
- }
- /* Masked scatter via the scatterdiv16sf builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64scatter_ps (void *__addr, __mmask8 __mask,
-                            __m512i __index, __m256 __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8sf __data = (__v8sf) __v1;
-   __builtin_ia32_scatterdiv16sf (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scatterdiv8df builtin: mask 0xFF, with __addr,
-    __index, __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64scatter_pd (void *__addr, __m512i __index, __m512d __v1,
-                       int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8df __data = (__v8df) __v1;
-   __builtin_ia32_scatterdiv8df (__addr, (__mmask8) 0xFF, __idx, __data,
-                                 __scale);
- }
- /* Masked scatter via the scatterdiv8df builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64scatter_pd (void *__addr, __mmask8 __mask,
-                            __m512i __index, __m512d __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8df __data = (__v8df) __v1;
-   __builtin_ia32_scatterdiv8df (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scattersiv16si builtin: mask 0xFFFF, with __addr,
-    __index, __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32scatter_epi32 (void *__addr, __m512i __index,
-                          __m512i __v1, int __scale)
- {
-   const __v16si __idx = (__v16si) __index;
-   const __v16si __data = (__v16si) __v1;
-   __builtin_ia32_scattersiv16si (__addr, (__mmask16) 0xFFFF, __idx, __data,
-                                  __scale);
- }
- /* Masked scatter via the scattersiv16si builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32scatter_epi32 (void *__addr, __mmask16 __mask,
-                               __m512i __index, __m512i __v1, int __scale)
- {
-   const __v16si __idx = (__v16si) __index;
-   const __v16si __data = (__v16si) __v1;
-   __builtin_ia32_scattersiv16si (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scattersiv8di builtin: mask 0xFF, with __addr,
-    __index (as __v8si), __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i32scatter_epi64 (void *__addr, __m256i __index,
-                          __m512i __v1, int __scale)
- {
-   const __v8si __idx = (__v8si) __index;
-   const __v8di __data = (__v8di) __v1;
-   __builtin_ia32_scattersiv8di (__addr, (__mmask8) 0xFF, __idx, __data,
-                                 __scale);
- }
- /* Masked scatter via the scattersiv8di builtin: __mask is the mask; __addr,
-    __index, __v1 and __scale are forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i32scatter_epi64 (void *__addr, __mmask8 __mask,
-                               __m256i __index, __m512i __v1, int __scale)
- {
-   const __v8si __idx = (__v8si) __index;
-   const __v8di __data = (__v8di) __v1;
-   __builtin_ia32_scattersiv8di (__addr, __mask, __idx, __data, __scale);
- }
- /* Unmasked scatter via the scatterdiv16si builtin: mask 0xFF, with __addr,
-    __index, the 256-bit __v1 and __scale forwarded.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64scatter_epi32 (void *__addr, __m512i __index,
-                          __m256i __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8si __data = (__v8si) __v1;
-   __builtin_ia32_scatterdiv16si (__addr, (__mmask8) 0xFF, __idx, __data,
-                                  __scale);
- }
- /* Masked form: passes the caller's __mask to the scatterdiv16si builtin.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64scatter_epi32 (void *__addr, __mmask8 __mask,
-                               __m512i __index, __m256i __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8si __val = (__v8si) __v1;
-   __builtin_ia32_scatterdiv16si (__addr, __mask, __idx, __val, __scale);
- }
- /* Unmasked form: calls the scatterdiv8di builtin with all 8 mask bits set.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_i64scatter_epi64 (void *__addr, __m512i __index,
-                          __m512i __v1, int __scale)
- {
-   const __mmask8 __all = (__mmask8) 0xFF;
-   __builtin_ia32_scatterdiv8di (__addr, __all, (__v8di) __index,
-                                 (__v8di) __v1, __scale);
- }
- /* Masked form: passes the caller's __mask to the scatterdiv8di builtin.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_i64scatter_epi64 (void *__addr, __mmask8 __mask,
-                               __m512i __index, __m512i __v1, int __scale)
- {
-   const __v8di __idx = (__v8di) __index;
-   const __v8di __val = (__v8di) __v1;
-   __builtin_ia32_scatterdiv8di (__addr, __mask, __idx, __val, __scale);
- }
- #else
- /* Macro forms of the gathersiv16sf gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i32gather_ps(INDEX, ADDR, SCALE) \
-   ((__m512) __builtin_ia32_gathersiv16sf ((__v16sf) _mm512_undefined_ps (), \
-     (void const *) (ADDR), \
-     (__v16si)(__m512i) (INDEX), \
-     (__mmask16) 0xFFFF, (int) (SCALE)))
- #define _mm512_mask_i32gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512) __builtin_ia32_gathersiv16sf ((__v16sf)(__m512) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v16si)(__m512i) (INDEX), \
-     (__mmask16) (MASK), (int) (SCALE)))
- /* Macro forms of the gathersiv8df gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i32gather_pd(INDEX, ADDR, SCALE) \
-   ((__m512d) __builtin_ia32_gathersiv8df ((__v8df) _mm512_undefined_pd (), \
-     (void const *) (ADDR), \
-     (__v8si)(__m256i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i32gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512d) __builtin_ia32_gathersiv8df ((__v8df)(__m512d) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8si)(__m256i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the gatherdiv16sf gathers (256-bit result).  Each argument
-    and the whole expansion are parenthesized so compound argument
-    expressions and surrounding operators cannot regroup the casts.  */
- #define _mm512_i64gather_ps(INDEX, ADDR, SCALE) \
-   ((__m256) __builtin_ia32_gatherdiv16sf ((__v8sf) _mm256_undefined_ps (), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i64gather_ps(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m256) __builtin_ia32_gatherdiv16sf ((__v8sf)(__m256) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the gatherdiv8df gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i64gather_pd(INDEX, ADDR, SCALE) \
-   ((__m512d) __builtin_ia32_gatherdiv8df ((__v8df) _mm512_undefined_pd (), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i64gather_pd(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512d) __builtin_ia32_gatherdiv8df ((__v8df)(__m512d) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the gathersiv16si gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i32gather_epi32(INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gathersiv16si ((__v16si) _mm512_undefined_epi32 (), \
-     (void const *) (ADDR), \
-     (__v16si)(__m512i) (INDEX), \
-     (__mmask16) 0xFFFF, (int) (SCALE)))
- #define _mm512_mask_i32gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gathersiv16si ((__v16si)(__m512i) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v16si)(__m512i) (INDEX), \
-     (__mmask16) (MASK), (int) (SCALE)))
- /* Macro forms of the gathersiv8di gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i32gather_epi64(INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gathersiv8di ((__v8di) _mm512_undefined_epi32 (), \
-     (void const *) (ADDR), \
-     (__v8si)(__m256i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i32gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gathersiv8di ((__v8di)(__m512i) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8si)(__m256i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the gatherdiv16si gathers (256-bit result).  Each argument
-    and the whole expansion are parenthesized so compound argument
-    expressions and surrounding operators cannot regroup the casts.  */
- #define _mm512_i64gather_epi32(INDEX, ADDR, SCALE) \
-   ((__m256i) __builtin_ia32_gatherdiv16si ((__v8si) _mm256_undefined_si256 (), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i64gather_epi32(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m256i) __builtin_ia32_gatherdiv16si ((__v8si)(__m256i) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the gatherdiv8di gathers.  Each argument and the whole
-    expansion are parenthesized so compound argument expressions and
-    surrounding operators cannot regroup the casts.  */
- #define _mm512_i64gather_epi64(INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gatherdiv8di ((__v8di) _mm512_undefined_epi32 (), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) 0xFF, (int) (SCALE)))
- #define _mm512_mask_i64gather_epi64(V1OLD, MASK, INDEX, ADDR, SCALE) \
-   ((__m512i) __builtin_ia32_gatherdiv8di ((__v8di)(__m512i) (V1OLD), \
-     (void const *) (ADDR), \
-     (__v8di)(__m512i) (INDEX), \
-     (__mmask8) (MASK), (int) (SCALE)))
- /* Macro forms of the scattersiv16sf scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i32scatter_ps(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv16sf ((void *) (ADDR), (__mmask16) 0xFFFF, \
-     (__v16si)(__m512i) (INDEX), \
-     (__v16sf)(__m512) (V1), (int) (SCALE))
- #define _mm512_mask_i32scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv16sf ((void *) (ADDR), (__mmask16) (MASK), \
-     (__v16si)(__m512i) (INDEX), \
-     (__v16sf)(__m512) (V1), (int) (SCALE))
- /* Macro forms of the scattersiv8df scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i32scatter_pd(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv8df ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8si)(__m256i) (INDEX), \
-     (__v8df)(__m512d) (V1), (int) (SCALE))
- #define _mm512_mask_i32scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv8df ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8si)(__m256i) (INDEX), \
-     (__v8df)(__m512d) (V1), (int) (SCALE))
- /* Macro forms of the scatterdiv16sf scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole.  The masked form casts MASK
-    to __mmask8, matching the unmasked form's (__mmask8) 0xFF.  */
- #define _mm512_i64scatter_ps(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv16sf ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8sf)(__m256) (V1), (int) (SCALE))
- #define _mm512_mask_i64scatter_ps(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv16sf ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8sf)(__m256) (V1), (int) (SCALE))
- /* Macro forms of the scatterdiv8df scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i64scatter_pd(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv8df ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8df)(__m512d) (V1), (int) (SCALE))
- #define _mm512_mask_i64scatter_pd(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv8df ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8df)(__m512d) (V1), (int) (SCALE))
- /* Macro forms of the scattersiv16si scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i32scatter_epi32(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv16si ((void *) (ADDR), (__mmask16) 0xFFFF, \
-     (__v16si)(__m512i) (INDEX), \
-     (__v16si)(__m512i) (V1), (int) (SCALE))
- #define _mm512_mask_i32scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv16si ((void *) (ADDR), (__mmask16) (MASK), \
-     (__v16si)(__m512i) (INDEX), \
-     (__v16si)(__m512i) (V1), (int) (SCALE))
- /* Macro forms of the scattersiv8di scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i32scatter_epi64(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv8di ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8si)(__m256i) (INDEX), \
-     (__v8di)(__m512i) (V1), (int) (SCALE))
- #define _mm512_mask_i32scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scattersiv8di ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8si)(__m256i) (INDEX), \
-     (__v8di)(__m512i) (V1), (int) (SCALE))
- /* Macro forms of the scatterdiv16si scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i64scatter_epi32(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv16si ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8si)(__m256i) (V1), (int) (SCALE))
- #define _mm512_mask_i64scatter_epi32(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv16si ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8si)(__m256i) (V1), (int) (SCALE))
- /* Macro forms of the scatterdiv8di scatters.  Arguments are parenthesized
-    so a compound expression is cast as a whole, not just its first token.  */
- #define _mm512_i64scatter_epi64(ADDR, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv8di ((void *) (ADDR), (__mmask8) 0xFF, \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8di)(__m512i) (V1), (int) (SCALE))
- #define _mm512_mask_i64scatter_epi64(ADDR, MASK, INDEX, V1, SCALE) \
-   __builtin_ia32_scatterdiv8di ((void *) (ADDR), (__mmask8) (MASK), \
-     (__v8di)(__m512i) (INDEX), \
-     (__v8di)(__m512i) (V1), (int) (SCALE))
- #endif
- /* Calls the compressdf512 builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compress_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __old = (__v8df) __W;
-   return (__m512d) __builtin_ia32_compressdf512_mask (__src, __old,
-                                                       (__mmask8) __U);
- }
- /* Same builtin as the mask form, with an all-zero vector as second operand.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_compress_pd (__mmask8 __U, __m512d __A)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_compressdf512_mask ((__v8df) __A, __zero,
-                                                       (__mmask8) __U);
- }
- /* Calls the compressstoredf512 builtin with __P viewed as a __v8df pointer.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compressstoreu_pd (void *__P, __mmask8 __U, __m512d __A)
- {
-   __v8df *__dst = (__v8df *) __P;
-   __builtin_ia32_compressstoredf512_mask (__dst, (__v8df) __A, (__mmask8) __U);
- }
- /* Calls the compresssf512 builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compress_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
-   const __v16sf __src = (__v16sf) __A;
-   const __v16sf __old = (__v16sf) __W;
-   return (__m512) __builtin_ia32_compresssf512_mask (__src, __old,
-                                                      (__mmask16) __U);
- }
- /* Same builtin as the mask form, with an all-zero vector as second operand.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_compress_ps (__mmask16 __U, __m512 __A)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_compresssf512_mask ((__v16sf) __A, __zero,
-                                                      (__mmask16) __U);
- }
- /* Calls the compressstoresf512 builtin with __P viewed as a __v16sf pointer.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compressstoreu_ps (void *__P, __mmask16 __U, __m512 __A)
- {
-   __v16sf *__dst = (__v16sf *) __P;
-   __builtin_ia32_compressstoresf512_mask (__dst, (__v16sf) __A,
-                                           (__mmask16) __U);
- }
- /* Calls the compressdi512 builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compress_epi64 (__m512i __W, __mmask8 __U, __m512i __A)
- {
-   const __v8di __src = (__v8di) __A;
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_compressdi512_mask (__src, __old,
-                                                       (__mmask8) __U);
- }
- /* Same builtin as the mask form, with an all-zero vector as second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_compress_epi64 (__mmask8 __U, __m512i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_compressdi512_mask ((__v8di) __A, __zero,
-                                                       (__mmask8) __U);
- }
- /* Calls the compressstoredi512 builtin with __P viewed as a __v8di pointer.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compressstoreu_epi64 (void *__P, __mmask8 __U, __m512i __A)
- {
-   __v8di *__dst = (__v8di *) __P;
-   __builtin_ia32_compressstoredi512_mask (__dst, (__v8di) __A, (__mmask8) __U);
- }
- /* Calls the compresssi512 builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compress_epi32 (__m512i __W, __mmask16 __U, __m512i __A)
- {
-   const __v16si __src = (__v16si) __A;
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_compresssi512_mask (__src, __old,
-                                                       (__mmask16) __U);
- }
- /* Same builtin as the mask form, with an all-zero vector as second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_compress_epi32 (__mmask16 __U, __m512i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_compresssi512_mask ((__v16si) __A, __zero,
-                                                       (__mmask16) __U);
- }
- /* Calls the compressstoresi512 builtin with __P viewed as a __v16si pointer.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_compressstoreu_epi32 (void *__P, __mmask16 __U, __m512i __A)
- {
-   __v16si *__dst = (__v16si *) __P;
-   __builtin_ia32_compressstoresi512_mask (__dst, (__v16si) __A,
-                                           (__mmask16) __U);
- }
- /* Calls the expanddf512_mask builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expand_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __old = (__v8df) __W;
-   return (__m512d) __builtin_ia32_expanddf512_mask (__src, __old,
-                                                     (__mmask8) __U);
- }
- /* Calls the expanddf512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expand_pd (__mmask8 __U, __m512d __A)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_expanddf512_maskz ((__v8df) __A, __zero,
-                                                      (__mmask8) __U);
- }
- /* Calls the expandloaddf512_mask builtin with __P viewed as a const __v8df
-    pointer, __W as second operand and __U as the mask.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expandloadu_pd (__m512d __W, __mmask8 __U, void const *__P)
- {
-   const __v8df *__mem = (const __v8df *) __P;
-   return (__m512d) __builtin_ia32_expandloaddf512_mask (__mem, (__v8df) __W,
-                                                         (__mmask8) __U);
- }
- /* Calls the expandloaddf512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expandloadu_pd (__mmask8 __U, void const *__P)
- {
-   const __v8df *__mem = (const __v8df *) __P;
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_expandloaddf512_maskz (__mem, __zero,
-                                                          (__mmask8) __U);
- }
- /* Calls the expandsf512_mask builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expand_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
-   const __v16sf __src = (__v16sf) __A;
-   const __v16sf __old = (__v16sf) __W;
-   return (__m512) __builtin_ia32_expandsf512_mask (__src, __old,
-                                                    (__mmask16) __U);
- }
- /* Calls the expandsf512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expand_ps (__mmask16 __U, __m512 __A)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_expandsf512_maskz ((__v16sf) __A, __zero,
-                                                     (__mmask16) __U);
- }
- /* Calls the expandloadsf512_mask builtin with __P viewed as a const __v16sf
-    pointer, __W as second operand and __U as the mask.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expandloadu_ps (__m512 __W, __mmask16 __U, void const *__P)
- {
-   const __v16sf *__mem = (const __v16sf *) __P;
-   return (__m512) __builtin_ia32_expandloadsf512_mask (__mem, (__v16sf) __W,
-                                                        (__mmask16) __U);
- }
- /* Calls the expandloadsf512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expandloadu_ps (__mmask16 __U, void const *__P)
- {
-   const __v16sf *__mem = (const __v16sf *) __P;
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_expandloadsf512_maskz (__mem, __zero,
-                                                         (__mmask16) __U);
- }
- /* Calls the expanddi512_mask builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expand_epi64 (__m512i __W, __mmask8 __U, __m512i __A)
- {
-   const __v8di __src = (__v8di) __A;
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_expanddi512_mask (__src, __old,
-                                                     (__mmask8) __U);
- }
- /* Calls the expanddi512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expand_epi64 (__mmask8 __U, __m512i __A)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_expanddi512_maskz ((__v8di) __A, __zero,
-                                                      (__mmask8) __U);
- }
- /* Calls the expandloaddi512_mask builtin with __P viewed as a const __v8di
-    pointer, __W as second operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expandloadu_epi64 (__m512i __W, __mmask8 __U, void const *__P)
- {
-   const __v8di *__mem = (const __v8di *) __P;
-   return (__m512i) __builtin_ia32_expandloaddi512_mask (__mem, (__v8di) __W,
-                                                         (__mmask8) __U);
- }
- /* Calls the expandloaddi512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expandloadu_epi64 (__mmask8 __U, void const *__P)
- {
-   const __v8di *__mem = (const __v8di *) __P;
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_expandloaddi512_maskz (__mem, __zero,
-                                                          (__mmask8) __U);
- }
- /* Calls the expandsi512_mask builtin on __A with __W as second operand and
-    __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expand_epi32 (__m512i __W, __mmask16 __U, __m512i __A)
- {
-   const __v16si __src = (__v16si) __A;
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_expandsi512_mask (__src, __old,
-                                                     (__mmask16) __U);
- }
- /* Calls the expandsi512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expand_epi32 (__mmask16 __U, __m512i __A)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_expandsi512_maskz ((__v16si) __A, __zero,
-                                                      (__mmask16) __U);
- }
- /* Calls the expandloadsi512_mask builtin with __P viewed as a const __v16si
-    pointer, __W as second operand and __U as the mask.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_expandloadu_epi32 (__m512i __W, __mmask16 __U, void const *__P)
- {
-   const __v16si *__mem = (const __v16si *) __P;
-   return (__m512i) __builtin_ia32_expandloadsi512_mask (__mem, (__v16si) __W,
-                                                         (__mmask16) __U);
- }
- /* Calls the expandloadsi512_maskz builtin with an all-zero second operand.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_expandloadu_epi32 (__mmask16 __U, void const *__P)
- {
-   const __v16si *__mem = (const __v16si *) __P;
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_expandloadsi512_maskz (__mem, __zero,
-                                                          (__mmask16) __U);
- }
- /* Mask arithmetic operations */
- #define _kand_mask16 _mm512_kand /* Each _k<op>_mask16 name expands to the matching _mm512_k<op> function.  */
- #define _kandn_mask16 _mm512_kandn
- #define _knot_mask16 _mm512_knot /* Single-operand alias.  */
- #define _kor_mask16 _mm512_kor
- #define _kxnor_mask16 _mm512_kxnor
- #define _kxor_mask16 _mm512_kxor
- /* Stores the kortestchi result through __CF, then returns the kortestzhi
-    result; both are narrowed to unsigned char.  */
- extern __inline unsigned char
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kortest_mask16_u8 (__mmask16 __A, __mmask16 __B, unsigned char *__CF)
- {
-   const unsigned char __carry
-     = (unsigned char) __builtin_ia32_kortestchi (__A, __B);
-   *__CF = __carry;
-   return (unsigned char) __builtin_ia32_kortestzhi (__A, __B);
- }
- /* Returns the kortestzhi builtin's result narrowed to unsigned char.  */
- extern __inline unsigned char
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kortestz_mask16_u8 (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (unsigned char) __builtin_ia32_kortestzhi (__lhs, __rhs);
- }
- /* Returns the kortestchi builtin's result narrowed to unsigned char.  */
- extern __inline unsigned char
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kortestc_mask16_u8 (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (unsigned char) __builtin_ia32_kortestchi (__lhs, __rhs);
- }
- /* Passes the mask through the kmovw builtin and widens the result to
-    unsigned int.  */
- extern __inline unsigned int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _cvtmask16_u32 (__mmask16 __A)
- {
-   const __mmask16 __k = __A;
-   return (unsigned int) __builtin_ia32_kmovw (__k);
- }
- /* Narrows __A to __mmask16, then passes it through the kmovw builtin.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _cvtu32_mask16 (unsigned int __A)
- {
-   const __mmask16 __k = (__mmask16) __A;
-   return (__mmask16) __builtin_ia32_kmovw (__k);
- }
- /* Reads the mask that __A points to and passes it through the kmovw
-    builtin.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _load_mask16 (__mmask16 *__A)
- {
-   const __mmask16 __k = *__A;
-   return (__mmask16) __builtin_ia32_kmovw (__k);
- }
- /* Passes __B through the kmovw builtin and writes the result to *__A.  */
- extern __inline void
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _store_mask16 (__mmask16 *__A, __mmask16 __B)
- {
-   __A[0] = __builtin_ia32_kmovw (__B);
- }
- /* Thin wrapper over the kandhi builtin for two 16-bit masks.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kand (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kandhi (__lhs, __rhs);
- }
- /* Thin wrapper over the kandnhi builtin; operands are passed in the order
-    (__A, __B).  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kandn (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kandnhi (__lhs, __rhs);
- }
- /* Thin wrapper over the korhi builtin for two 16-bit masks.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kor (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_korhi (__lhs, __rhs);
- }
- /* Returns the kortestzhi builtin's result, converted to __mmask16 and then
-    to the int return type.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kortestz (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kortestzhi (__lhs, __rhs);
- }
- /* Returns the kortestchi builtin's result, converted to __mmask16 and then
-    to the int return type.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kortestc (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kortestchi (__lhs, __rhs);
- }
- /* Thin wrapper over the kxnorhi builtin for two 16-bit masks.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kxnor (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kxnorhi (__lhs, __rhs);
- }
- /* Thin wrapper over the kxorhi builtin for two 16-bit masks.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kxor (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __lhs = __A;
-   const __mmask16 __rhs = __B;
-   return (__mmask16) __builtin_ia32_kxorhi (__lhs, __rhs);
- }
- /* Thin wrapper over the knothi builtin for one 16-bit mask.  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_knot (__mmask16 __A)
- {
-   const __mmask16 __k = __A;
-   return (__mmask16) __builtin_ia32_knothi (__k);
- }
- /* Thin wrapper over the kunpckhi builtin; operands are passed in the order
-    (__A, __B).  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kunpackb (__mmask16 __A, __mmask16 __B)
- {
-   const __mmask16 __first = __A;
-   const __mmask16 __second = __B;
-   return (__mmask16) __builtin_ia32_kunpckhi (__first, __second);
- }
- /* Widens both 8-bit masks to __mmask16 and passes them to the kunpckhi
-    builtin in the order (__A, __B).  */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _kunpackb_mask16 (__mmask8 __A, __mmask8 __B)
- {
-   const __mmask16 __first = (__mmask16) __A;
-   const __mmask16 __second = (__mmask16) __B;
-   return (__mmask16) __builtin_ia32_kunpckhi (__first, __second);
- }
- #ifdef __OPTIMIZE__
- /* maskz form: calls the inserti32x4 builtin with an all-zero fourth operand
-    and __B as the mask.  __imm is forwarded unchanged.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_inserti32x4 (__mmask16 __B, __m512i __C, __m128i __D,
-                           const int __imm)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_inserti32x4_mask ((__v16si) __C,
-                                                     (__v4si) __D, __imm,
-                                                     __zero, __B);
- }
- /* maskz form: calls the insertf32x4 builtin with an all-zero fourth operand
-    and __B as the mask.  __imm is forwarded unchanged.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_insertf32x4 (__mmask16 __B, __m512 __C, __m128 __D,
-                           const int __imm)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_insertf32x4_mask ((__v16sf) __C,
-                                                    (__v4sf) __D, __imm,
-                                                    __zero, __B);
- }
- /* mask form: calls the inserti32x4 builtin with __A as fourth operand and
-    __B as the mask.  __imm is forwarded unchanged.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_inserti32x4 (__m512i __A, __mmask16 __B, __m512i __C,
-                          __m128i __D, const int __imm)
- {
-   const __v16si __old = (__v16si) __A;
-   return (__m512i) __builtin_ia32_inserti32x4_mask ((__v16si) __C,
-                                                     (__v4si) __D, __imm,
-                                                     __old, __B);
- }
- /* mask form: calls the insertf32x4 builtin with __A as fourth operand and
-    __B as the mask.  __imm is forwarded unchanged.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_insertf32x4 (__m512 __A, __mmask16 __B, __m512 __C,
-                          __m128 __D, const int __imm)
- {
-   const __v16sf __old = (__v16sf) __A;
-   return (__m512) __builtin_ia32_insertf32x4_mask ((__v16sf) __C,
-                                                    (__v4sf) __D, __imm,
-                                                    __old, __B);
- }
- #else
- /* Macro maskz form: A is the mask, X and Y the vectors, C the immediate;
-    the fourth builtin operand is an all-zero vector.  */
- #define _mm512_maskz_insertf32x4(A, X, Y, C) \
-   ((__m512) __builtin_ia32_insertf32x4_mask ( \
-     (__v16sf)(__m512) (X), \
-     (__v4sf)(__m128) (Y), \
-     (int) (C), \
-     (__v16sf)_mm512_setzero_ps(), \
-     (__mmask16)(A)))
- /* Macro maskz form: A is the mask, X and Y the vectors, C the immediate;
-    the fourth builtin operand is an all-zero vector.  */
- #define _mm512_maskz_inserti32x4(A, X, Y, C) \
-   ((__m512i) __builtin_ia32_inserti32x4_mask ( \
-     (__v16si)(__m512i) (X), \
-     (__v4si)(__m128i) (Y), \
-     (int) (C), \
-     (__v16si)_mm512_setzero_si512 (), \
-     (__mmask16)(A)))
- /* Macro mask form: A is the fourth builtin operand, B the mask, X and Y the
-    vectors, C the immediate.  */
- #define _mm512_mask_insertf32x4(A, B, X, Y, C) \
-   ((__m512) __builtin_ia32_insertf32x4_mask ( \
-     (__v16sf)(__m512) (X), \
-     (__v4sf)(__m128) (Y), \
-     (int) (C), \
-     (__v16sf)(__m512) (A), \
-     (__mmask16)(B)))
- /* Macro mask form: A is the fourth builtin operand, B the mask, X and Y the
-    vectors, C the immediate.  */
- #define _mm512_mask_inserti32x4(A, B, X, Y, C) \
-   ((__m512i) __builtin_ia32_inserti32x4_mask ( \
-     (__v16si)(__m512i) (X), \
-     (__v4si)(__m128i) (Y), \
-     (int) (C), \
-     (__v16si)(__m512i) (A), \
-     (__mmask16)(B)))
- #endif
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pmaxsq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* maskz form: pmaxsq512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_epi64 (__mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmaxsq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __zero, __M);
- }
- /* mask form: pmaxsq512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_epi64 (__m512i __W, __mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmaxsq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __old, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_epi64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pminsq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* mask form: pminsq512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_epi64 (__m512i __W, __mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pminsq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __old, __M);
- }
- /* maskz form: pminsq512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_epi64 (__mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pminsq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __zero, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_epu64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pmaxuq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* maskz form: pmaxuq512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_epu64 (__mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmaxuq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __zero, __M);
- }
- /* mask form: pmaxuq512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_epu64 (__m512i __W, __mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pmaxuq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __old, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_epu64 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pminuq512_mask ((__v8di) __A,
- (__v8di) __B,
- (__v8di)
- _mm512_undefined_epi32 (),
- (__mmask8) -1);
- }
- /* mask form: pminuq512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_epu64 (__m512i __W, __mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __old = (__v8di) __W;
-   return (__m512i) __builtin_ia32_pminuq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __old, __M);
- }
- /* maskz form: pminuq512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_epu64 (__mmask8 __M, __m512i __A, __m512i __B)
- {
-   const __v8di __zero = (__v8di) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pminuq512_mask ((__v8di) __A, (__v8di) __B,
-                                                   __zero, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pmaxsd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* maskz form: pmaxsd512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_epi32 (__mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmaxsd512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __zero, __M);
- }
- /* mask form: pmaxsd512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_epi32 (__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmaxsd512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __old, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_epi32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pminsd512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* maskz form: pminsd512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_epi32 (__mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pminsd512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __zero, __M);
- }
- /* mask form: pminsd512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_epi32 (__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pminsd512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __old, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_epu32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pmaxud512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* maskz form: pmaxud512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_epu32 (__mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pmaxud512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __zero, __M);
- }
- /* mask form: pmaxud512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_epu32 (__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pmaxud512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __old, __M);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_epu32 (__m512i __A, __m512i __B)
- {
- return (__m512i) __builtin_ia32_pminud512_mask ((__v16si) __A,
- (__v16si) __B,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1);
- }
- /* maskz form: pminud512 builtin with an all-zero third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_epu32 (__mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __zero = (__v16si) _mm512_setzero_si512 ();
-   return (__m512i) __builtin_ia32_pminud512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __zero, __M);
- }
- /* mask form: pminud512 builtin with __W as third operand and mask __M.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_epu32 (__m512i __W, __mmask16 __M, __m512i __A, __m512i __B)
- {
-   const __v16si __old = (__v16si) __W;
-   return (__m512i) __builtin_ia32_pminud512_mask ((__v16si) __A,
-                                                   (__v16si) __B,
-                                                   __old, __M);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_unpacklo_ps (__m512 __A, __m512 __B)
- {
- return (__m512) __builtin_ia32_unpcklps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1);
- }
- /* mask form: unpcklps512 builtin with __W as third operand and mask __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_unpacklo_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __old = (__v16sf) __W;
-   return (__m512) __builtin_ia32_unpcklps512_mask ((__v16sf) __A,
-                                                    (__v16sf) __B,
-                                                    __old, (__mmask16) __U);
- }
- /* maskz form: unpcklps512 builtin with an all-zero third operand and
-    mask __U.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_unpacklo_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_unpcklps512_mask ((__v16sf) __A,
-                                                    (__v16sf) __B,
-                                                    __zero, (__mmask16) __U);
- }
- #ifdef __OPTIMIZE__
- /* Calls the maxsd_round builtin on __A and __B; __R is forwarded unchanged.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_max_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __lhs = (__v2df) __A;
-   const __v2df __rhs = (__v2df) __B;
-   return (__m128d) __builtin_ia32_maxsd_round (__lhs, __rhs, __R);
- }
- /* mask form: maxsd_mask_round builtin with __W as third operand, mask __U
-    and __R forwarded unchanged.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_max_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
-                        __m128d __B, const int __R)
- {
-   const __v2df __old = (__v2df) __W;
-   return (__m128d) __builtin_ia32_maxsd_mask_round ((__v2df) __A,
-                                                     (__v2df) __B, __old,
-                                                     (__mmask8) __U, __R);
- }
- /* maskz form: maxsd_mask_round builtin with an all-zero third operand,
-    mask __U and __R forwarded unchanged.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_max_round_sd (__mmask8 __U, __m128d __A, __m128d __B,
-                         const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_maxsd_mask_round ((__v2df) __A,
-                                                     (__v2df) __B, __zero,
-                                                     (__mmask8) __U, __R);
- }
- /* Calls the maxss_round builtin on __A and __B; __R is forwarded unchanged.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_max_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __lhs = (__v4sf) __A;
-   const __v4sf __rhs = (__v4sf) __B;
-   return (__m128) __builtin_ia32_maxss_round (__lhs, __rhs, __R);
- }
- /* mask form: maxss_mask_round builtin with __W as third operand, mask __U
-    and __R forwarded unchanged.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_max_round_ss (__m128 __W, __mmask8 __U, __m128 __A,
-                        __m128 __B, const int __R)
- {
-   const __v4sf __old = (__v4sf) __W;
-   return (__m128) __builtin_ia32_maxss_mask_round ((__v4sf) __A,
-                                                    (__v4sf) __B, __old,
-                                                    (__mmask8) __U, __R);
- }
- /* maskz form: maxss_mask_round builtin with an all-zero third operand,
-    mask __U and __R forwarded unchanged.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_max_round_ss (__mmask8 __U, __m128 __A, __m128 __B,
-                         const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_maxss_mask_round ((__v4sf) __A,
-                                                    (__v4sf) __B, __zero,
-                                                    (__mmask8) __U, __R);
- }
- /* Calls the minsd_round builtin on __A and __B; __R is forwarded unchanged.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_min_round_sd (__m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __lhs = (__v2df) __A;
-   const __v2df __rhs = (__v2df) __B;
-   return (__m128d) __builtin_ia32_minsd_round (__lhs, __rhs, __R);
- }
- /* mask form: minsd_mask_round builtin with __W as third operand, mask __U
-    and __R forwarded unchanged.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_min_round_sd (__m128d __W, __mmask8 __U, __m128d __A,
-                        __m128d __B, const int __R)
- {
-   const __v2df __old = (__v2df) __W;
-   return (__m128d) __builtin_ia32_minsd_mask_round ((__v2df) __A,
-                                                     (__v2df) __B, __old,
-                                                     (__mmask8) __U, __R);
- }
- /* maskz form: calls __builtin_ia32_minsd_mask_round on __A and __B with the
-    result of _mm_setzero_pd () as the third vector operand, mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_min_round_sd (__mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_minsd_mask_round
-     ((__v2df) __A, (__v2df) __B, __zero, (__mmask8) __U, __R);
- }
- /* Calls __builtin_ia32_minss_round on __A and __B with rounding argument
-    __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_min_round_ss (__m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __va = (__v4sf) __A;
-   const __v4sf __vb = (__v4sf) __B;
-   return (__m128) __builtin_ia32_minss_round (__va, __vb, __R);
- }
- /* mask form: calls __builtin_ia32_minss_mask_round on __A and __B with __W
-    as the third vector operand, mask __U and rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_min_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __vw = (__v4sf) __W;
-   return (__m128) __builtin_ia32_minss_mask_round
-     ((__v4sf) __A, (__v4sf) __B, __vw, (__mmask8) __U, __R);
- }
- /* maskz form: calls __builtin_ia32_minss_mask_round on __A and __B with the
-    result of _mm_setzero_ps () as the third vector operand, mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_min_round_ss (__mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_minss_mask_round
-     ((__v4sf) __A, (__v4sf) __B, __zero, (__mmask8) __U, __R);
- }
- #else
- /* Macro forms of the scalar max/min rounding intrinsics.  Each replacement
-    list is wrapped in parentheses so that the leading cast applies to the
-    whole builtin call even when the macro use is followed by a postfix
-    operator such as a subscript.  W is the third vector operand of the
-    *_mask_round builtins, U the mask and C the rounding argument.  */
- #define _mm_max_round_sd(A, B, C) \
-   ((__m128d) __builtin_ia32_maxsd_round (A, B, C))
- #define _mm_mask_max_round_sd(W, U, A, B, C) \
-   ((__m128d) __builtin_ia32_maxsd_mask_round (A, B, W, U, C))
- #define _mm_maskz_max_round_sd(U, A, B, C) \
-   ((__m128d) __builtin_ia32_maxsd_mask_round (A, B, (__v2df) _mm_setzero_pd (), U, C))
- #define _mm_max_round_ss(A, B, C) \
-   ((__m128) __builtin_ia32_maxss_round (A, B, C))
- #define _mm_mask_max_round_ss(W, U, A, B, C) \
-   ((__m128) __builtin_ia32_maxss_mask_round (A, B, W, U, C))
- #define _mm_maskz_max_round_ss(U, A, B, C) \
-   ((__m128) __builtin_ia32_maxss_mask_round (A, B, (__v4sf) _mm_setzero_ps (), U, C))
- #define _mm_min_round_sd(A, B, C) \
-   ((__m128d) __builtin_ia32_minsd_round (A, B, C))
- #define _mm_mask_min_round_sd(W, U, A, B, C) \
-   ((__m128d) __builtin_ia32_minsd_mask_round (A, B, W, U, C))
- #define _mm_maskz_min_round_sd(U, A, B, C) \
-   ((__m128d) __builtin_ia32_minsd_mask_round (A, B, (__v2df) _mm_setzero_pd (), U, C))
- #define _mm_min_round_ss(A, B, C) \
-   ((__m128) __builtin_ia32_minss_round (A, B, C))
- #define _mm_mask_min_round_ss(W, U, A, B, C) \
-   ((__m128) __builtin_ia32_minss_mask_round (A, B, W, U, C))
- #define _mm_maskz_min_round_ss(U, A, B, C) \
-   ((__m128) __builtin_ia32_minss_mask_round (A, B, (__v4sf) _mm_setzero_ps (), U, C))
- #endif
- /* Calls __builtin_ia32_blendmpd_512_mask with __A, __W and mask __U, in
-    that order.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_blend_pd (__mmask8 __U, __m512d __A, __m512d __W)
- {
-   const __v8df __va = (__v8df) __A;
-   const __v8df __vw = (__v8df) __W;
-   return (__m512d) __builtin_ia32_blendmpd_512_mask (__va, __vw, (__mmask8) __U);
- }
- /* Calls __builtin_ia32_blendmps_512_mask with __A, __W and mask __U, in
-    that order.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_blend_ps (__mmask16 __U, __m512 __A, __m512 __W)
- {
-   const __v16sf __va = (__v16sf) __A;
-   const __v16sf __vw = (__v16sf) __W;
-   return (__m512) __builtin_ia32_blendmps_512_mask (__va, __vw, (__mmask16) __U);
- }
- /* Calls __builtin_ia32_blendmq_512_mask with __A, __W and mask __U, in
-    that order.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_blend_epi64 (__mmask8 __U, __m512i __A, __m512i __W)
- {
-   const __v8di __va = (__v8di) __A;
-   const __v8di __vw = (__v8di) __W;
-   return (__m512i) __builtin_ia32_blendmq_512_mask (__va, __vw, (__mmask8) __U);
- }
- /* Calls __builtin_ia32_blendmd_512_mask with __A, __W and mask __U, in
-    that order.  */
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_blend_epi32 (__mmask16 __U, __m512i __A, __m512i __W)
- {
-   const __v16si __va = (__v16si) __A;
-   const __v16si __vw = (__v16si) __W;
-   return (__m512i) __builtin_ia32_blendmd_512_mask (__va, __vw, (__mmask16) __U);
- }
- #ifdef __OPTIMIZE__
- /* Calls __builtin_ia32_vfmaddsd3_round on __W, __A, __B with rounding
-    argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fmadd_round_sd (__m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_round
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_round on __W, __A, __B with rounding
-    argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fmadd_round_ss (__m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_round
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, __R);
-   return __res;
- }
- /* Negates __B and calls __builtin_ia32_vfmaddsd3_round on __W, __A and the
-    negated __B with rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fmsub_round_sd (__m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_round
-     ((__v2df) __W, (__v2df) __A, __neg_b, __R);
- }
- /* Negates __B and calls __builtin_ia32_vfmaddss3_round on __W, __A and the
-    negated __B with rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fmsub_round_ss (__m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_round
-     ((__v4sf) __W, (__v4sf) __A, __neg_b, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_round on __W, the negated
-    __A and __B with rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fnmadd_round_sd (__m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_round
-     ((__v2df) __W, __neg_a, (__v2df) __B, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_round on __W, the negated
-    __A and __B with rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fnmadd_round_ss (__m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_round
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddsd3_round on __W
-    and the two negated vectors with rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fnmsub_round_sd (__m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_round
-     ((__v2df) __W, __neg_a, __neg_b, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddss3_round on __W
-    and the two negated vectors with rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fnmsub_round_ss (__m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_round
-     ((__v4sf) __W, __neg_a, __neg_b, __R);
- }
- #else
- /* Macro forms of the scalar fused multiply-add rounding intrinsics, all
-    expressed through the vfmadd{sd,ss}3_round builtins with B and/or C
-    negated as needed.  Each replacement list is wrapped in parentheses so
-    that the leading cast applies to the whole builtin call even when the
-    macro use is followed by a postfix operator.  R is the rounding
-    argument.  */
- #define _mm_fmadd_round_sd(A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_round (A, B, C, R))
- #define _mm_fmadd_round_ss(A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_round (A, B, C, R))
- #define _mm_fmsub_round_sd(A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_round (A, B, -(C), R))
- #define _mm_fmsub_round_ss(A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_round (A, B, -(C), R))
- #define _mm_fnmadd_round_sd(A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_round (A, -(B), C, R))
- #define _mm_fnmadd_round_ss(A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_round (A, -(B), C, R))
- #define _mm_fnmsub_round_sd(A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_round (A, -(B), -(C), R))
- #define _mm_fnmsub_round_ss(A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_round (A, -(B), -(C), R))
- #endif
- /* Calls __builtin_ia32_vfmaddsd3_mask on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmadd_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_mask on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmadd_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddsd3_mask3 on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmadd_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_mask3
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_mask3 on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmadd_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_mask3
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddsd3_maskz on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmadd_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_maskz on __W, __A, __B with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmadd_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Negates __B and calls __builtin_ia32_vfmaddsd3_mask with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmsub_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, (__v2df) __A, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __B and calls __builtin_ia32_vfmaddss3_mask with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmsub_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, (__v4sf) __A, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_vfmsubsd3_mask3 on __W, __A, __B (no operand is
-    negated here) with mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmsub_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmsubsd3_mask3
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmsubss3_mask3 on __W, __A, __B (no operand is
-    negated here) with mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmsub_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmsubss3_mask3
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
-   return __res;
- }
- /* Negates __B and calls __builtin_ia32_vfmaddsd3_maskz with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmsub_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, (__v2df) __A, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __B and calls __builtin_ia32_vfmaddss3_maskz with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmsub_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, (__v4sf) __A, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_mask with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmadd_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_mask with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmadd_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_mask3 with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmadd_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask3
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_mask3 with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmadd_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_mask3
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_maskz with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmadd_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_maskz with mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmadd_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddsd3_mask with
-    mask __U and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmsub_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, __neg_a, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddss3_mask with
-    mask __U and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmsub_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, __neg_a, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A only and calls __builtin_ia32_vfmsubsd3_mask3 with mask __U
-    and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmsub_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmsubsd3_mask3
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates __A only and calls __builtin_ia32_vfmsubss3_mask3 with mask __U
-    and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmsub_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmsubss3_mask3
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddsd3_maskz with
-    mask __U and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmsub_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, __neg_a, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddss3_maskz with
-    mask __U and _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmsub_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, __neg_a, __neg_b, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- #ifdef __OPTIMIZE__
- /* Calls __builtin_ia32_vfmaddsd3_mask on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmadd_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_mask on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmadd_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddsd3_mask3 on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmadd_round_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U, const int __R)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_mask3
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_mask3 on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmadd_round_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U, const int __R)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_mask3
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddsd3_maskz on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmadd_round_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmaddss3_maskz on __W, __A, __B with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmadd_round_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Negates __B and calls __builtin_ia32_vfmaddsd3_mask with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmsub_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, (__v2df) __A, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates __B and calls __builtin_ia32_vfmaddss3_mask with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fmsub_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, (__v4sf) __A, __neg_b, (__mmask8) __U, __R);
- }
- /* Calls __builtin_ia32_vfmsubsd3_mask3 on __W, __A, __B (no operand is
-    negated here) with mask __U and rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmsub_round_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U, const int __R)
- {
-   __m128d __res;
-   __res = (__m128d) __builtin_ia32_vfmsubsd3_mask3
-     ((__v2df) __W, (__v2df) __A, (__v2df) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Calls __builtin_ia32_vfmsubss3_mask3 on __W, __A, __B (no operand is
-    negated here) with mask __U and rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fmsub_round_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U, const int __R)
- {
-   __m128 __res;
-   __res = (__m128) __builtin_ia32_vfmsubss3_mask3
-     ((__v4sf) __W, (__v4sf) __A, (__v4sf) __B, (__mmask8) __U, __R);
-   return __res;
- }
- /* Negates __B and calls __builtin_ia32_vfmaddsd3_maskz with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmsub_round_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, (__v2df) __A, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates __B and calls __builtin_ia32_vfmaddss3_maskz with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fmsub_round_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, (__v4sf) __A, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_mask with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmadd_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_mask with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmadd_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_mask3 with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmadd_round_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask3
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_mask3 with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmadd_round_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_mask3
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddsd3_maskz with mask __U and
-    rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmadd_round_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U, __R);
- }
- /* Negates __A and calls __builtin_ia32_vfmaddss3_maskz with mask __U and
-    rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmadd_round_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddsd3_mask with
-    mask __U and rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmsub_round_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_mask
-     ((__v2df) __W, __neg_a, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddss3_mask with
-    mask __U and rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fnmsub_round_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_mask
-     ((__v4sf) __W, __neg_a, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates __A only and calls __builtin_ia32_vfmsubsd3_mask3 with mask __U
-    and rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmsub_round_sd (__m128d __W, __m128d __A, __m128d __B, __mmask8 __U, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   return (__m128d) __builtin_ia32_vfmsubsd3_mask3
-     ((__v2df) __W, __neg_a, (__v2df) __B, (__mmask8) __U, __R);
- }
- /* Negates __A only and calls __builtin_ia32_vfmsubss3_mask3 with mask __U
-    and rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask3_fnmsub_round_ss (__m128 __W, __m128 __A, __m128 __B, __mmask8 __U, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   return (__m128) __builtin_ia32_vfmsubss3_mask3
-     ((__v4sf) __W, __neg_a, (__v4sf) __B, (__mmask8) __U, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddsd3_maskz with
-    mask __U and rounding argument __R.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmsub_round_sd (__mmask8 __U, __m128d __W, __m128d __A, __m128d __B, const int __R)
- {
-   const __v2df __neg_a = -(__v2df) __A;
-   const __v2df __neg_b = -(__v2df) __B;
-   return (__m128d) __builtin_ia32_vfmaddsd3_maskz
-     ((__v2df) __W, __neg_a, __neg_b, (__mmask8) __U, __R);
- }
- /* Negates both __A and __B and calls __builtin_ia32_vfmaddss3_maskz with
-    mask __U and rounding argument __R.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fnmsub_round_ss (__mmask8 __U, __m128 __W, __m128 __A, __m128 __B, const int __R)
- {
-   const __v4sf __neg_a = -(__v4sf) __A;
-   const __v4sf __neg_b = -(__v4sf) __B;
-   return (__m128) __builtin_ia32_vfmaddss3_maskz
-     ((__v4sf) __W, __neg_a, __neg_b, (__mmask8) __U, __R);
- }
- #else
- /* Macro forms of the masked scalar fused multiply-add rounding intrinsics.
-    U is the mask and R the rounding argument; B and/or C are negated to
-    derive the fmsub/fnmadd/fnmsub variants, except that the mask3 fmsub and
-    fnmsub forms use the vfmsub{sd,ss}3_mask3 builtins with C passed
-    unnegated.  Each replacement list is wrapped in parentheses so that the
-    leading cast applies to the whole builtin call even when the macro use is
-    followed by a postfix operator.  */
- #define _mm_mask_fmadd_round_sd(A, U, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask (A, B, C, U, R))
- #define _mm_mask_fmadd_round_ss(A, U, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask (A, B, C, U, R))
- #define _mm_mask3_fmadd_round_sd(A, B, C, U, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask3 (A, B, C, U, R))
- #define _mm_mask3_fmadd_round_ss(A, B, C, U, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask3 (A, B, C, U, R))
- #define _mm_maskz_fmadd_round_sd(U, A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_maskz (A, B, C, U, R))
- #define _mm_maskz_fmadd_round_ss(U, A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_maskz (A, B, C, U, R))
- #define _mm_mask_fmsub_round_sd(A, U, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask (A, B, -(C), U, R))
- #define _mm_mask_fmsub_round_ss(A, U, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask (A, B, -(C), U, R))
- #define _mm_mask3_fmsub_round_sd(A, B, C, U, R) \
-   ((__m128d) __builtin_ia32_vfmsubsd3_mask3 (A, B, C, U, R))
- #define _mm_mask3_fmsub_round_ss(A, B, C, U, R) \
-   ((__m128) __builtin_ia32_vfmsubss3_mask3 (A, B, C, U, R))
- #define _mm_maskz_fmsub_round_sd(U, A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_maskz (A, B, -(C), U, R))
- #define _mm_maskz_fmsub_round_ss(U, A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_maskz (A, B, -(C), U, R))
- #define _mm_mask_fnmadd_round_sd(A, U, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask (A, -(B), C, U, R))
- #define _mm_mask_fnmadd_round_ss(A, U, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask (A, -(B), C, U, R))
- #define _mm_mask3_fnmadd_round_sd(A, B, C, U, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask3 (A, -(B), C, U, R))
- #define _mm_mask3_fnmadd_round_ss(A, B, C, U, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask3 (A, -(B), C, U, R))
- #define _mm_maskz_fnmadd_round_sd(U, A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_maskz (A, -(B), C, U, R))
- #define _mm_maskz_fnmadd_round_ss(U, A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_maskz (A, -(B), C, U, R))
- #define _mm_mask_fnmsub_round_sd(A, U, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_mask (A, -(B), -(C), U, R))
- #define _mm_mask_fnmsub_round_ss(A, U, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_mask (A, -(B), -(C), U, R))
- #define _mm_mask3_fnmsub_round_sd(A, B, C, U, R) \
-   ((__m128d) __builtin_ia32_vfmsubsd3_mask3 (A, -(B), C, U, R))
- #define _mm_mask3_fnmsub_round_ss(A, B, C, U, R) \
-   ((__m128) __builtin_ia32_vfmsubss3_mask3 (A, -(B), C, U, R))
- #define _mm_maskz_fnmsub_round_sd(U, A, B, C, R) \
-   ((__m128d) __builtin_ia32_vfmaddsd3_maskz (A, -(B), -(C), U, R))
- #define _mm_maskz_fnmsub_round_ss(U, A, B, C, R) \
-   ((__m128) __builtin_ia32_vfmaddss3_maskz (A, -(B), -(C), U, R))
- #endif
- #ifdef __OPTIMIZE__
- /* Returns the int result of __builtin_ia32_vcomiss applied to __A and __B
-    with arguments __P and __R passed through unchanged.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_comi_round_ss (__m128 __A, __m128 __B, const int __P, const int __R)
- {
-   const __v4sf __va = (__v4sf) __A;
-   const __v4sf __vb = (__v4sf) __B;
-   return __builtin_ia32_vcomiss (__va, __vb, __P, __R);
- }
- /* Returns the int result of __builtin_ia32_vcomisd applied to __A and __B
-    with arguments __P and __R passed through unchanged.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_comi_round_sd (__m128d __A, __m128d __B, const int __P, const int __R)
- {
-   const __v2df __va = (__v2df) __A;
-   const __v2df __vb = (__v2df) __B;
-   return __builtin_ia32_vcomisd (__va, __vb, __P, __R);
- }
- #else
- /* Macro forms of the comi rounding intrinsics: the four arguments are
-    forwarded in order to the vcomiss / vcomisd builtins.  */
- #define _mm_comi_round_ss(A, B, P, R) \
-   __builtin_ia32_vcomiss (A, B, P, R)
- #define _mm_comi_round_sd(A, B, P, R) \
-   __builtin_ia32_vcomisd (A, B, P, R)
- #endif
- /* Calls __builtin_ia32_sqrtpd512_mask on __A with _mm512_undefined_pd () as
-    the second vector operand, a mask of (__mmask8) -1 and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sqrt_pd (__m512d __A)
- {
-   const __v8df __undef = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_sqrtpd512_mask
-     ((__v8df) __A, __undef, (__mmask8) -1, _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_sqrtpd512_mask on __A with __W as the second vector
-    operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sqrt_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
-   const __v8df __vw = (__v8df) __W;
-   return (__m512d) __builtin_ia32_sqrtpd512_mask
-     ((__v8df) __A, __vw, (__mmask8) __U, _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_sqrtpd512_mask on __A with _mm512_setzero_pd () as
-    the second vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the
-    rounding argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sqrt_pd (__mmask8 __U, __m512d __A)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_sqrtpd512_mask
-     ((__v8df) __A, __zero, (__mmask8) __U, _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_sqrtps512_mask on __A with _mm512_undefined_ps () as
-    the second vector operand, a mask of (__mmask16) -1 and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sqrt_ps (__m512 __A)
- {
-   const __v16sf __undef = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_sqrtps512_mask
-     ((__v16sf) __A, __undef, (__mmask16) -1, _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_sqrtps512_mask on __A with __W as the second vector
-    operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sqrt_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
-   const __v16sf __vw = (__v16sf) __W;
-   return (__m512) __builtin_ia32_sqrtps512_mask
-     ((__v16sf) __A, __vw, (__mmask16) __U, _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_sqrtps512_mask on __A with _mm512_setzero_ps () as
-    the second vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the
-    rounding argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sqrt_ps (__mmask16 __U, __m512 __A)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_sqrtps512_mask
-     ((__v16sf) __A, __zero, (__mmask16) __U, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the sum of __A and __B, computed with the vector + operator on
-    their __v8df views.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_pd (__m512d __A, __m512d __B)
- {
-   const __v8df __va = (__v8df) __A;
-   const __v8df __vb = (__v8df) __B;
-   return (__m512d) (__va + __vb);
- }
- /* Calls __builtin_ia32_addpd512_mask on __A and __B with __W as the third
-    vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
-   const __v8df __vw = (__v8df) __W;
-   return (__m512d) __builtin_ia32_addpd512_mask
-     ((__v8df) __A, (__v8df) __B, __vw, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addpd512_mask on __A and __B with
-    _mm512_setzero_pd () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_addpd512_mask
-     ((__v8df) __A, (__v8df) __B, __zero, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the sum of __A and __B, computed with the vector + operator on
-    their __v16sf views.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_add_ps (__m512 __A, __m512 __B)
- {
-   const __v16sf __va = (__v16sf) __A;
-   const __v16sf __vb = (__v16sf) __B;
-   return (__m512) (__va + __vb);
- }
- /* Calls __builtin_ia32_addps512_mask on __A and __B with __W as the third
-    vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_add_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __vw = (__v16sf) __W;
-   return (__m512) __builtin_ia32_addps512_mask
-     ((__v16sf) __A, (__v16sf) __B, __vw, (__mmask16) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addps512_mask on __A and __B with
-    _mm512_setzero_ps () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_add_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_addps512_mask
-     ((__v16sf) __A, (__v16sf) __B, __zero, (__mmask16) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addsd_mask_round on __A and __B with __W as the
-    third vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the
-    rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_add_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
-   const __v2df __vw = (__v2df) __W;
-   return (__m128d) __builtin_ia32_addsd_mask_round
-     ((__v2df) __A, (__v2df) __B, __vw, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addsd_mask_round on __A and __B with
-    _mm_setzero_pd () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_add_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
-   const __v2df __zero = (__v2df) _mm_setzero_pd ();
-   return (__m128d) __builtin_ia32_addsd_mask_round
-     ((__v2df) __A, (__v2df) __B, __zero, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addss_mask_round on __A and __B with __W as the
-    third vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the
-    rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_add_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __vw = (__v4sf) __W;
-   return (__m128) __builtin_ia32_addss_mask_round
-     ((__v4sf) __A, (__v4sf) __B, __vw, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_addss_mask_round on __A and __B with
-    _mm_setzero_ps () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_add_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
-   const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
-   return (__m128) __builtin_ia32_addss_mask_round
-     ((__v4sf) __A, (__v4sf) __B, __zero, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __A minus __B, computed with the vector - operator on their
-    __v8df views.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_pd (__m512d __A, __m512d __B)
- {
-   const __v8df __va = (__v8df) __A;
-   const __v8df __vb = (__v8df) __B;
-   return (__m512d) (__va - __vb);
- }
- /* Calls __builtin_ia32_subpd512_mask on __A and __B with __W as the third
-    vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
-   const __v8df __vw = (__v8df) __W;
-   return (__m512d) __builtin_ia32_subpd512_mask
-     ((__v8df) __A, (__v8df) __B, __vw, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_subpd512_mask on __A and __B with
-    _mm512_setzero_pd () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
-   const __v8df __zero = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_subpd512_mask
-     ((__v8df) __A, (__v8df) __B, __zero, (__mmask8) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __A minus __B, computed with the vector - operator on their
-    __v16sf views.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_sub_ps (__m512 __A, __m512 __B)
- {
-   const __v16sf __va = (__v16sf) __A;
-   const __v16sf __vb = (__v16sf) __B;
-   return (__m512) (__va - __vb);
- }
- /* Calls __builtin_ia32_subps512_mask on __A and __B with __W as the third
-    vector operand, mask __U and _MM_FROUND_CUR_DIRECTION as the rounding
-    argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_sub_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __vw = (__v16sf) __W;
-   return (__m512) __builtin_ia32_subps512_mask
-     ((__v16sf) __A, (__v16sf) __B, __vw, (__mmask16) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_subps512_mask on __A and __B with
-    _mm512_setzero_ps () as the third vector operand, mask __U and
-    _MM_FROUND_CUR_DIRECTION as the rounding argument.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_sub_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
-   const __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_subps512_mask
-     ((__v16sf) __A, (__v16sf) __B, __zero, (__mmask16) __U,
-      _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_subsd_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_sub_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __src = (__v2df) __W;
- return (__m128d) __builtin_ia32_subsd_mask_round ((__v2df) __A, (__v2df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_subsd_mask_round: operands __A and __B, third operand
- from _mm_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_sub_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_subsd_mask_round ((__v2df) __A, (__v2df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_subss_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_sub_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __src = (__v4sf) __W;
- return (__m128) __builtin_ia32_subss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_subss_mask_round: operands __A and __B, third operand
- from _mm_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_sub_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_subss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __A * __B, evaluated on both operands cast to __v8df.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_pd (__m512d __A, __m512d __B)
- {
- __v8df __lhs = (__v8df) __A;
- __v8df __rhs = (__v8df) __B;
- return (__m512d) (__lhs * __rhs);
- }
- /* Wraps __builtin_ia32_mulpd512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __src = (__v8df) __W;
- return (__m512d) __builtin_ia32_mulpd512_mask ((__v8df) __A, (__v8df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulpd512_mask: operands __A and __B, third operand
- from _mm512_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __zero = (__v8df) _mm512_setzero_pd ();
- return (__m512d) __builtin_ia32_mulpd512_mask ((__v8df) __A, (__v8df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __A * __B, evaluated on both operands cast to __v16sf.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mul_ps (__m512 __A, __m512 __B)
- {
- __v16sf __lhs = (__v16sf) __A;
- __v16sf __rhs = (__v16sf) __B;
- return (__m512) (__lhs * __rhs);
- }
- /* Wraps __builtin_ia32_mulps512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_mul_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __src = (__v16sf) __W;
- return (__m512) __builtin_ia32_mulps512_mask ((__v16sf) __A, (__v16sf) __B,
- __src, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulps512_mask: operands __A and __B, third operand
- from _mm512_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_mul_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
- return (__m512) __builtin_ia32_mulps512_mask ((__v16sf) __A, (__v16sf) __B,
- __zero, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulsd_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_mul_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __src = (__v2df) __W;
- return (__m128d) __builtin_ia32_mulsd_mask_round ((__v2df) __A, (__v2df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulsd_mask_round: operands __A and __B, third operand
- from _mm_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_mul_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_mulsd_mask_round ((__v2df) __A, (__v2df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulss_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_mul_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __src = (__v4sf) __W;
- return (__m128) __builtin_ia32_mulss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_mulss_mask_round: operands __A and __B, third operand
- from _mm_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_mul_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_mulss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __M / __V, evaluated on both operands cast to __v8df.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_div_pd (__m512d __M, __m512d __V)
- {
- __v8df __num = (__v8df) __M;
- __v8df __den = (__v8df) __V;
- return (__m512d) (__num / __den);
- }
- /* Wraps __builtin_ia32_divpd512_mask: operands __M and __V, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_div_pd (__m512d __W, __mmask8 __U, __m512d __M, __m512d __V)
- {
- __v8df __src = (__v8df) __W;
- return (__m512d) __builtin_ia32_divpd512_mask ((__v8df) __M, (__v8df) __V,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divpd512_mask: operands __M and __V, third operand
- from _mm512_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_div_pd (__mmask8 __U, __m512d __M, __m512d __V)
- {
- __v8df __zero = (__v8df) _mm512_setzero_pd ();
- return (__m512d) __builtin_ia32_divpd512_mask ((__v8df) __M, (__v8df) __V,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns __A / __B, evaluated on both operands cast to __v16sf.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_div_ps (__m512 __A, __m512 __B)
- {
- __v16sf __num = (__v16sf) __A;
- __v16sf __den = (__v16sf) __B;
- return (__m512) (__num / __den);
- }
- /* Wraps __builtin_ia32_divps512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_div_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __src = (__v16sf) __W;
- return (__m512) __builtin_ia32_divps512_mask ((__v16sf) __A, (__v16sf) __B,
- __src, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divps512_mask: operands __A and __B, third operand
- from _mm512_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_div_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
- return (__m512) __builtin_ia32_divps512_mask ((__v16sf) __A, (__v16sf) __B,
- __zero, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divsd_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_div_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __src = (__v2df) __W;
- return (__m128d) __builtin_ia32_divsd_mask_round ((__v2df) __A, (__v2df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divsd_mask_round: operands __A and __B, third operand
- from _mm_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_div_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_divsd_mask_round ((__v2df) __A, (__v2df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divss_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_div_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __src = (__v4sf) __W;
- return (__m128) __builtin_ia32_divss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_divss_mask_round: operands __A and __B, third operand
- from _mm_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_div_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_divss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxpd512_mask: operands __A and __B, third operand
- from _mm512_undefined_pd (), mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_pd (__m512d __A, __m512d __B)
- {
- __v8df __lhs = (__v8df) __A;
- __v8df __rhs = (__v8df) __B;
- return (__m512d) __builtin_ia32_maxpd512_mask (__lhs, __rhs,
- (__v8df) _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxpd512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __src = (__v8df) __W;
- return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A, (__v8df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxpd512_mask: operands __A and __B, third operand
- from _mm512_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __zero = (__v8df) _mm512_setzero_pd ();
- return (__m512d) __builtin_ia32_maxpd512_mask ((__v8df) __A, (__v8df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxps512_mask: operands __A and __B, third operand
- from _mm512_undefined_ps (), mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_max_ps (__m512 __A, __m512 __B)
- {
- __v16sf __lhs = (__v16sf) __A;
- __v16sf __rhs = (__v16sf) __B;
- return (__m512) __builtin_ia32_maxps512_mask (__lhs, __rhs,
- (__v16sf) _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxps512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_max_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __src = (__v16sf) __W;
- return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A, (__v16sf) __B,
- __src, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxps512_mask: operands __A and __B, third operand
- from _mm512_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_max_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
- return (__m512) __builtin_ia32_maxps512_mask ((__v16sf) __A, (__v16sf) __B,
- __zero, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxsd_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_max_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __src = (__v2df) __W;
- return (__m128d) __builtin_ia32_maxsd_mask_round ((__v2df) __A, (__v2df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxsd_mask_round: operands __A and __B, third operand
- from _mm_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_max_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_maxsd_mask_round ((__v2df) __A, (__v2df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxss_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_max_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __src = (__v4sf) __W;
- return (__m128) __builtin_ia32_maxss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_maxss_mask_round: operands __A and __B, third operand
- from _mm_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_max_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_maxss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minpd512_mask: operands __A and __B, third operand
- from _mm512_undefined_pd (), mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_pd (__m512d __A, __m512d __B)
- {
- __v8df __lhs = (__v8df) __A;
- __v8df __rhs = (__v8df) __B;
- return (__m512d) __builtin_ia32_minpd512_mask (__lhs, __rhs,
- (__v8df) _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minpd512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __src = (__v8df) __W;
- return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A, (__v8df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minpd512_mask: operands __A and __B, third operand
- from _mm512_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __zero = (__v8df) _mm512_setzero_pd ();
- return (__m512d) __builtin_ia32_minpd512_mask ((__v8df) __A, (__v8df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minps512_mask: operands __A and __B, third operand
- from _mm512_undefined_ps (), mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_min_ps (__m512 __A, __m512 __B)
- {
- __v16sf __lhs = (__v16sf) __A;
- __v16sf __rhs = (__v16sf) __B;
- return (__m512) __builtin_ia32_minps512_mask (__lhs, __rhs,
- (__v16sf) _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minps512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_min_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __src = (__v16sf) __W;
- return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A, (__v16sf) __B,
- __src, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minps512_mask: operands __A and __B, third operand
- from _mm512_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_min_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
- return (__m512) __builtin_ia32_minps512_mask ((__v16sf) __A, (__v16sf) __B,
- __zero, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minsd_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_min_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __src = (__v2df) __W;
- return (__m128d) __builtin_ia32_minsd_mask_round ((__v2df) __A, (__v2df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minsd_mask_round: operands __A and __B, third operand
- from _mm_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_min_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_minsd_mask_round ((__v2df) __A, (__v2df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minss_mask_round: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_min_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __src = (__v4sf) __W;
- return (__m128) __builtin_ia32_minss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_minss_mask_round: operands __A and __B, third operand
- from _mm_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_min_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_minss_mask_round ((__v4sf) __A, (__v4sf) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefpd512_mask: operands __A and __B, third operand
- from _mm512_undefined_pd (), mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_scalef_pd (__m512d __A, __m512d __B)
- {
- __v8df __lhs = (__v8df) __A;
- __v8df __rhs = (__v8df) __B;
- return (__m512d) __builtin_ia32_scalefpd512_mask (__lhs, __rhs,
- (__v8df) _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefpd512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_scalef_pd (__m512d __W, __mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __src = (__v8df) __W;
- return (__m512d) __builtin_ia32_scalefpd512_mask ((__v8df) __A, (__v8df) __B,
- __src, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefpd512_mask: operands __A and __B, third operand
- from _mm512_setzero_pd (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_scalef_pd (__mmask8 __U, __m512d __A, __m512d __B)
- {
- __v8df __zero = (__v8df) _mm512_setzero_pd ();
- return (__m512d) __builtin_ia32_scalefpd512_mask ((__v8df) __A, (__v8df) __B,
- __zero, (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefps512_mask: operands __A and __B, third operand
- from _mm512_undefined_ps (), mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_scalef_ps (__m512 __A, __m512 __B)
- {
- __v16sf __lhs = (__v16sf) __A;
- __v16sf __rhs = (__v16sf) __B;
- return (__m512) __builtin_ia32_scalefps512_mask (__lhs, __rhs,
- (__v16sf) _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefps512_mask: operands __A and __B, third operand
- __W, mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_scalef_ps (__m512 __W, __mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __src = (__v16sf) __W;
- return (__m512) __builtin_ia32_scalefps512_mask ((__v16sf) __A, (__v16sf) __B,
- __src, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefps512_mask: operands __A and __B, third operand
- from _mm512_setzero_ps (), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_scalef_ps (__mmask16 __U, __m512 __A, __m512 __B)
- {
- __v16sf __zero = (__v16sf) _mm512_setzero_ps ();
- return (__m512) __builtin_ia32_scalefps512_mask ((__v16sf) __A, (__v16sf) __B,
- __zero, (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefsd_mask_round: operands __A and __B, third
- operand from _mm_setzero_pd (), mask (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_scalef_sd (__m128d __A, __m128d __B)
- {
- __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_scalefsd_mask_round ((__v2df) __A,
- (__v2df) __B, __zero,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_scalefss_mask_round: operands __A and __B, third
- operand from _mm_setzero_ps (), mask (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_scalef_ss (__m128 __A, __m128 __B)
- {
- __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_scalefss_mask_round ((__v4sf) __A,
- (__v4sf) __B, __zero,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddpd512_mask: operands __A, __B, __C,
- mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmadd_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddpd512_mask (__a, __b, __c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddpd512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmadd_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddpd512_mask (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddpd512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmadd_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddpd512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmadd_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddpd512_maskz (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddps512_mask: operands __A, __B, __C,
- mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmadd_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddps512_mask (__a, __b, __c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddps512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmadd_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddps512_mask (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddps512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmadd_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddps512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmadd_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddps512_maskz (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubpd512_mask: operands __A, __B, __C,
- mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsub_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmsubpd512_mask (__a, __b, __c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubpd512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsub_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmsubpd512_mask (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubpd512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsub_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmsubpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubpd512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsub_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmsubpd512_maskz (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubps512_mask: operands __A, __B, __C,
- mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsub_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmsubps512_mask (__a, __b, __c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubps512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsub_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmsubps512_mask (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubps512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsub_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmsubps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubps512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsub_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmsubps512_maskz (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubpd512_mask: operands __A, __B, __C,
- mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmaddsub_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__a, __b, __c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubpd512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmaddsub_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubpd512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmaddsub_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubpd512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmaddsub_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubps512_mask: operands __A, __B, __C,
- mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmaddsub_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_mask (__a, __b, __c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubps512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmaddsub_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_mask (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubps512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmaddsub_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmaddsubps512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmaddsub_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_maskz (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubpd512_mask with the third
- operand negated: operands __A, __B, -__C, mask (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsubadd_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __neg_c = -(__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__a, __b, __neg_c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubpd512_mask with the third
- operand negated: operands __A, __B, -__C, mask __U,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsubadd_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __neg_c = -(__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_mask (__a, __b, __neg_c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubaddpd512_mask3: operands __A, __B, __C
- (not negated here), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsubadd_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfmsubaddpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubpd512_maskz with the third
- operand negated: operands __A, __B, -__C, mask __U,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsubadd_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __neg_c = -(__v8df) __C;
- return (__m512d) __builtin_ia32_vfmaddsubpd512_maskz (__a, __b, __neg_c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubps512_mask with the third
- operand negated: operands __A, __B, -__C, mask (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fmsubadd_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __neg_c = -(__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_mask (__a, __b, __neg_c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubps512_mask with the third
- operand negated: operands __A, __B, -__C, mask __U,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fmsubadd_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __neg_c = -(__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_mask (__a, __b, __neg_c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfmsubaddps512_mask3: operands __A, __B, __C
- (not negated here), mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fmsubadd_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfmsubaddps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Implemented through __builtin_ia32_vfmaddsubps512_maskz with the third
- operand negated: operands __A, __B, -__C, mask __U,
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fmsubadd_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __neg_c = -(__v16sf) __C;
- return (__m512) __builtin_ia32_vfmaddsubps512_maskz (__a, __b, __neg_c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddpd512_mask: operands __A, __B, __C,
- mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmadd_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmaddpd512_mask (__a, __b, __c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddpd512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmadd_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmaddpd512_mask (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddpd512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmadd_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmaddpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddpd512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmadd_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmaddpd512_maskz (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddps512_mask: operands __A, __B, __C,
- mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmadd_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmaddps512_mask (__a, __b, __c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddps512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmadd_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmaddps512_mask (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddps512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmadd_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmaddps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmaddps512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmadd_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmaddps512_maskz (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubpd512_mask: operands __A, __B, __C,
- mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmsub_pd (__m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmsubpd512_mask (__a, __b, __c,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubpd512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmsub_pd (__m512d __A, __mmask8 __U, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmsubpd512_mask (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubpd512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmsub_pd (__m512d __A, __m512d __B, __m512d __C, __mmask8 __U)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmsubpd512_mask3 (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubpd512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmsub_pd (__mmask8 __U, __m512d __A, __m512d __B, __m512d __C)
- {
- __v8df __a = (__v8df) __A;
- __v8df __b = (__v8df) __B;
- __v8df __c = (__v8df) __C;
- return (__m512d) __builtin_ia32_vfnmsubpd512_maskz (__a, __b, __c,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubps512_mask: operands __A, __B, __C,
- mask (__mmask16) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fnmsub_ps (__m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmsubps512_mask (__a, __b, __c,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubps512_mask: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fnmsub_ps (__m512 __A, __mmask16 __U, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmsubps512_mask (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubps512_mask3: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask3_fnmsub_ps (__m512 __A, __m512 __B, __m512 __C, __mmask16 __U)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmsubps512_mask3 (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_vfnmsubps512_maskz: operands __A, __B, __C,
- mask __U, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fnmsub_ps (__mmask16 __U, __m512 __A, __m512 __B, __m512 __C)
- {
- __v16sf __a = (__v16sf) __A;
- __v16sf __b = (__v16sf) __B;
- __v16sf __c = (__v16sf) __C;
- return (__m512) __builtin_ia32_vfnmsubps512_maskz (__a, __b, __c,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Wraps __builtin_ia32_cvttpd2dq512_mask: input __A, second operand from
- _mm256_undefined_si256 (), mask (__mmask8) -1, _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvttpd_epi32 (__m512d __A)
- {
- __v8df __in = (__v8df) __A;
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask (__in,
- (__v8si) _mm256_undefined_si256 (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_cvttpd2dq512_mask with __W as the second operand and
- __U as the mask.  */
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvttpd_epi32 (__m256i __W, __mmask8 __U, __m512d __A)
- {
- const __v8si __w = (__v8si) __W;
- const __mmask8 __k = (__mmask8) __U;
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask ((__v8df) __A, __w, __k,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Calls __builtin_ia32_cvttpd2dq512_mask with an all-zero second operand and
- __U as the mask.  */
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvttpd_epi32 (__mmask8 __U, __m512d __A)
- {
- const __v8si __zero = (__v8si) _mm256_setzero_si256 ();
- const __mmask8 __k = (__mmask8) __U;
- return (__m256i) __builtin_ia32_cvttpd2dq512_mask ((__v8df) __A, __zero, __k,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvttpd_epu32 (__m512d __A)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvttpd_epu32 (__m256i __W, __mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvttpd_epu32 (__mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvttpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtpd_epi32 (__m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtpd_epi32 (__m256i __W, __mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtpd_epi32 (__mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2dq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtpd_epu32 (__m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_undefined_si256 (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtpd_epu32 (__m256i __W, __mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtpd_epu32 (__mmask8 __U, __m512d __A)
- {
- return (__m256i) __builtin_ia32_cvtpd2udq512_mask ((__v8df) __A,
- (__v8si)
- _mm256_setzero_si256 (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvttps_epi32 (__m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvttps_epi32 (__m512i __W, __mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvttps_epi32 (__mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvttps_epu32 (__m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvttps_epu32 (__m512i __W, __mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvttps_epu32 (__mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvttps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtps_epi32 (__m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtps_epi32 (__m512i __W, __mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtps_epi32 (__mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2dq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtps_epu32 (__m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_undefined_epi32 (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtps_epu32 (__m512i __W, __mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtps_epu32 (__mmask16 __U, __m512 __A)
- {
- return (__m512i) __builtin_ia32_cvtps2udq512_mask ((__v16sf) __A,
- (__v16si)
- _mm512_setzero_si512 (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns element 0 of __A.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtsd_f64 (__m512d __A)
- {
- const double __lowest = __A[0];
- return __lowest;
- }
- /* Returns element 0 of __A.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtss_f32 (__m512 __A)
- {
- const float __lowest = __A[0];
- return __lowest;
- }
- #ifdef __x86_64__
- /* Passes __A and the unsigned 64-bit value __B to
- __builtin_ia32_cvtusi2ss64 with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtu64_ss (__m128 __A, unsigned long long __B)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (__m128) __builtin_ia32_cvtusi2ss64 (__vec, __B,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Passes __A and the unsigned 64-bit value __B to
- __builtin_ia32_cvtusi2sd64 with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtu64_sd (__m128d __A, unsigned long long __B)
- {
- const __v2df __vec = (__v2df) __A;
- return (__m128d) __builtin_ia32_cvtusi2sd64 (__vec, __B,
- _MM_FROUND_CUR_DIRECTION);
- }
- #endif
- /* Passes __A and the unsigned value __B to __builtin_ia32_cvtusi2ss32 with
- _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtu32_ss (__m128 __A, unsigned __B)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (__m128) __builtin_ia32_cvtusi2ss32 (__vec, __B,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepi32_ps (__m512i __A)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepi32_ps (__m512 __W, __mmask16 __U, __m512i __A)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepi32_ps (__mmask16 __U, __m512i __A)
- {
- return (__m512) __builtin_ia32_cvtdq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtepu32_ps (__m512i __A)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtepu32_ps (__m512 __W, __mmask16 __U, __m512i __A)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtepu32_ps (__mmask16 __U, __m512i __A)
- {
- return (__m512) __builtin_ia32_cvtudq2ps512_mask ((__v16si) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- #ifdef __OPTIMIZE__
- /* Inline-function form of _mm512_fixupimm_pd, compiled only when
- __OPTIMIZE__ is defined (a macro with the same name is provided in the
- #else branch).  Forwards __A, __B, __C and __imm to
- __builtin_ia32_fixupimmpd512_mask with an all-ones mask and
- _MM_FROUND_CUR_DIRECTION.
- NOTE(review): __imm is presumably required to be a compile-time constant
- by the builtin, which would explain the macro fallback -- confirm.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fixupimm_pd (__m512d __A, __m512d __B, __m512i __C, const int __imm)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Masked variant: same builtin as the unmasked form
- (__builtin_ia32_fixupimmpd512_mask), but the caller-supplied mask __U is
- passed instead of all ones.  __imm is forwarded unchanged.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fixupimm_pd (__m512d __A, __mmask8 __U, __m512d __B,
- __m512i __C, const int __imm)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_mask ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* maskz variant: forwards __A, __B, __C, __imm and the mask __U to
- __builtin_ia32_fixupimmpd512_maskz with _MM_FROUND_CUR_DIRECTION.  Note
- that the mask is the first parameter of this intrinsic.  */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fixupimm_pd (__mmask8 __U, __m512d __A, __m512d __B,
- __m512i __C, const int __imm)
- {
- return (__m512d) __builtin_ia32_fixupimmpd512_maskz ((__v8df) __A,
- (__v8df) __B,
- (__v8di) __C,
- __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_fixupimm_ps (__m512 __A, __m512 __B, __m512i __C, const int __imm)
- {
- return (__m512) __builtin_ia32_fixupimmps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_fixupimm_ps (__m512 __A, __mmask16 __U, __m512 __B,
- __m512i __C, const int __imm)
- {
- return (__m512) __builtin_ia32_fixupimmps512_mask ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_fixupimm_ps (__mmask16 __U, __m512 __A, __m512 __B,
- __m512i __C, const int __imm)
- {
- return (__m512) __builtin_ia32_fixupimmps512_maskz ((__v16sf) __A,
- (__v16sf) __B,
- (__v16si) __C,
- __imm,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fixupimm_sd (__m128d __A, __m128d __B, __m128i __C, const int __imm)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_mask ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C, __imm,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fixupimm_sd (__m128d __A, __mmask8 __U, __m128d __B,
- __m128i __C, const int __imm)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_mask ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C, __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fixupimm_sd (__mmask8 __U, __m128d __A, __m128d __B,
- __m128i __C, const int __imm)
- {
- return (__m128d) __builtin_ia32_fixupimmsd_maskz ((__v2df) __A,
- (__v2df) __B,
- (__v2di) __C,
- __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_fixupimm_ss (__m128 __A, __m128 __B, __m128i __C, const int __imm)
- {
- return (__m128) __builtin_ia32_fixupimmss_mask ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_fixupimm_ss (__m128 __A, __mmask8 __U, __m128 __B,
- __m128i __C, const int __imm)
- {
- return (__m128) __builtin_ia32_fixupimmss_mask ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_fixupimm_ss (__mmask8 __U, __m128 __A, __m128 __B,
- __m128i __C, const int __imm)
- {
- return (__m128) __builtin_ia32_fixupimmss_maskz ((__v4sf) __A,
- (__v4sf) __B,
- (__v4si) __C, __imm,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- #else
- #define _mm512_fixupimm_pd(X, Y, Z, C) \
- ((__m512d)__builtin_ia32_fixupimmpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(-1), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_fixupimm_pd(X, U, Y, Z, C) \
- ((__m512d)__builtin_ia32_fixupimmpd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_fixupimm_pd(U, X, Y, Z, C) \
- ((__m512d)__builtin_ia32_fixupimmpd512_maskz ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (__v8di)(__m512i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_fixupimm_ps(X, Y, Z, C) \
- ((__m512)__builtin_ia32_fixupimmps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(-1), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_fixupimm_ps(X, U, Y, Z, C) \
- ((__m512)__builtin_ia32_fixupimmps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_fixupimm_ps(U, X, Y, Z, C) \
- ((__m512)__builtin_ia32_fixupimmps512_maskz ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (__v16si)(__m512i)(Z), (int)(C), \
- (__mmask16)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm_fixupimm_sd(X, Y, Z, C) \
- ((__m128d)__builtin_ia32_fixupimmsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(-1), _MM_FROUND_CUR_DIRECTION))
- #define _mm_mask_fixupimm_sd(X, U, Y, Z, C) \
- ((__m128d)__builtin_ia32_fixupimmsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm_maskz_fixupimm_sd(U, X, Y, Z, C) \
- ((__m128d)__builtin_ia32_fixupimmsd_maskz ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (__v2di)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm_fixupimm_ss(X, Y, Z, C) \
- ((__m128)__builtin_ia32_fixupimmss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(-1), _MM_FROUND_CUR_DIRECTION))
- #define _mm_mask_fixupimm_ss(X, U, Y, Z, C) \
- ((__m128)__builtin_ia32_fixupimmss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #define _mm_maskz_fixupimm_ss(U, X, Y, Z, C) \
- ((__m128)__builtin_ia32_fixupimmss_maskz ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (__v4si)(__m128i)(Z), (int)(C), \
- (__mmask8)(U), _MM_FROUND_CUR_DIRECTION))
- #endif
- #ifdef __x86_64__
- /* Returns the result of __builtin_ia32_vcvtss2usi64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned long long.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtss_u64 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (unsigned long long)
- __builtin_ia32_vcvtss2usi64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttss2usi64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned long long.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttss_u64 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (unsigned long long)
- __builtin_ia32_vcvttss2usi64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttss2si64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttss_i64 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (long long)
- __builtin_ia32_vcvttss2si64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- #endif /* __x86_64__ */
- /* Returns the result of __builtin_ia32_vcvtss2usi32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtss_u32 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (unsigned)
- __builtin_ia32_vcvtss2usi32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttss2usi32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttss_u32 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (unsigned)
- __builtin_ia32_vcvttss2usi32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttss2si32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as int.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttss_i32 (__m128 __A)
- {
- const __v4sf __vec = (__v4sf) __A;
- return (int)
- __builtin_ia32_vcvttss2si32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- #ifdef __x86_64__
- /* Returns the result of __builtin_ia32_vcvtsd2usi64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned long long.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtsd_u64 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (unsigned long long)
- __builtin_ia32_vcvtsd2usi64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttsd2usi64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned long long.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttsd_u64 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (unsigned long long)
- __builtin_ia32_vcvttsd2usi64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttsd2si64 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as long long.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttsd_i64 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (long long)
- __builtin_ia32_vcvttsd2si64 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- #endif /* __x86_64__ */
- /* Returns the result of __builtin_ia32_vcvtsd2usi32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvtsd_u32 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (unsigned)
- __builtin_ia32_vcvtsd2usi32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttsd2usi32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as unsigned.  */
- extern __inline unsigned
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttsd_u32 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (unsigned)
- __builtin_ia32_vcvttsd2usi32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- /* Returns the result of __builtin_ia32_vcvttsd2si32 on __A, called with
- _MM_FROUND_CUR_DIRECTION, as int.  */
- extern __inline int
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cvttsd_i32 (__m128d __A)
- {
- const __v2df __vec = (__v2df) __A;
- return (int)
- __builtin_ia32_vcvttsd2si32 (__vec, _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtps_pd (__m256 __A)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtps_pd (__m512d __W, __mmask8 __U, __m256 __A)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtps_pd (__mmask8 __U, __m256 __A)
- {
- return (__m512d) __builtin_ia32_cvtps2pd512_mask ((__v8sf) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtph_ps (__m256i __A)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtph_ps (__m512 __W, __mmask16 __U, __m256i __A)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtph_ps (__mmask16 __U, __m256i __A)
- {
- return (__m512) __builtin_ia32_vcvtph2ps512_mask ((__v16hi) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cvtpd_ps (__m512d __A)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf)
- _mm256_undefined_ps (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cvtpd_ps (__m256 __W, __mmask8 __U, __m512d __A)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_cvtpd_ps (__mmask8 __U, __m512d __A)
- {
- return (__m256) __builtin_ia32_cvtpd2ps512_mask ((__v8df) __A,
- (__v8sf)
- _mm256_setzero_ps (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- #ifdef __OPTIMIZE__
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getexp_ps (__m512 __A)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getexp_ps (__m512 __W, __mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf) __W,
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getexp_ps (__mmask16 __U, __m512 __A)
- {
- return (__m512) __builtin_ia32_getexpps512_mask ((__v16sf) __A,
- (__v16sf)
- _mm512_setzero_ps (),
- (__mmask16) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getexp_pd (__m512d __A)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getexp_pd (__m512d __W, __mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df) __W,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getexp_pd (__mmask8 __U, __m512d __A)
- {
- return (__m512d) __builtin_ia32_getexppd512_mask ((__v8df) __A,
- (__v8df)
- _mm512_setzero_pd (),
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Inline-function form (under __OPTIMIZE__): forwards __A and __B to
- __builtin_ia32_getexpss128_round with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getexp_ss (__m128 __A, __m128 __B)
- {
- const __v4sf __a = (__v4sf) __A;
- const __v4sf __b = (__v4sf) __B;
- return (__m128) __builtin_ia32_getexpss128_round (__a, __b,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Forwards __A, __B, then __W and the mask __U, to
- __builtin_ia32_getexpss_mask_round with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getexp_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B)
- {
- const __v4sf __a = (__v4sf) __A;
- const __v4sf __b = (__v4sf) __B;
- const __v4sf __w = (__v4sf) __W;
- return (__m128) __builtin_ia32_getexpss_mask_round (__a, __b, __w,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Same builtin as _mm_mask_getexp_ss, but an all-zero vector is passed as
- the third operand.  */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getexp_ss (__mmask8 __U, __m128 __A, __m128 __B)
- {
- const __v4sf __a = (__v4sf) __A;
- const __v4sf __b = (__v4sf) __B;
- const __v4sf __zero = (__v4sf) _mm_setzero_ps ();
- return (__m128) __builtin_ia32_getexpss_mask_round (__a, __b, __zero,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Inline-function form (under __OPTIMIZE__): forwards __A and __B to
- __builtin_ia32_getexpsd128_round with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getexp_sd (__m128d __A, __m128d __B)
- {
- const __v2df __a = (__v2df) __A;
- const __v2df __b = (__v2df) __B;
- return (__m128d) __builtin_ia32_getexpsd128_round (__a, __b,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Forwards __A, __B, then __W and the mask __U, to
- __builtin_ia32_getexpsd_mask_round with _MM_FROUND_CUR_DIRECTION.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getexp_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B)
- {
- const __v2df __a = (__v2df) __A;
- const __v2df __b = (__v2df) __B;
- const __v2df __w = (__v2df) __W;
- return (__m128d) __builtin_ia32_getexpsd_mask_round (__a, __b, __w,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- /* Same builtin as _mm_mask_getexp_sd, but an all-zero vector is passed as
- the third operand.  */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getexp_sd (__mmask8 __U, __m128d __A, __m128d __B)
- {
- const __v2df __a = (__v2df) __A;
- const __v2df __b = (__v2df) __B;
- const __v2df __zero = (__v2df) _mm_setzero_pd ();
- return (__m128d) __builtin_ia32_getexpsd_mask_round (__a, __b, __zero,
- (__mmask8) __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getmant_pd (__m512d __A, _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- _mm512_undefined_pd (),
- (__mmask8) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getmant_pd (__m512d __W, __mmask8 __U, __m512d __A,
- _MM_MANTISSA_NORM_ENUM __B, _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- (__v8df) __W, __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getmant_pd (__mmask8 __U, __m512d __A,
- _MM_MANTISSA_NORM_ENUM __B, _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512d) __builtin_ia32_getmantpd512_mask ((__v8df) __A,
- (__C << 2) | __B,
- (__v8df)
- _mm512_setzero_pd (),
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_getmant_ps (__m512 __A, _MM_MANTISSA_NORM_ENUM __B,
- _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- _mm512_undefined_ps (),
- (__mmask16) -1,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_getmant_ps (__m512 __W, __mmask16 __U, __m512 __A,
- _MM_MANTISSA_NORM_ENUM __B, _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- (__v16sf) __W, __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_getmant_ps (__mmask16 __U, __m512 __A,
- _MM_MANTISSA_NORM_ENUM __B, _MM_MANTISSA_SIGN_ENUM __C)
- {
- return (__m512) __builtin_ia32_getmantps512_mask ((__v16sf) __A,
- (__C << 2) | __B,
- (__v16sf)
- _mm512_setzero_ps (),
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getmant_sd (__m128d __A, __m128d __B, _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128d) __builtin_ia32_getmantsd_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getmant_sd (__m128d __W, __mmask8 __U, __m128d __A, __m128d __B,
- _MM_MANTISSA_NORM_ENUM __C, _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128d) __builtin_ia32_getmantsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- (__v2df) __W,
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getmant_sd (__mmask8 __U, __m128d __A, __m128d __B,
- _MM_MANTISSA_NORM_ENUM __C, _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128d) __builtin_ia32_getmantsd_mask_round ((__v2df) __A,
- (__v2df) __B,
- (__D << 2) | __C,
- (__v2df)
- _mm_setzero_pd(),
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_getmant_ss (__m128 __A, __m128 __B, _MM_MANTISSA_NORM_ENUM __C,
- _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128) __builtin_ia32_getmantss_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_getmant_ss (__m128 __W, __mmask8 __U, __m128 __A, __m128 __B,
- _MM_MANTISSA_NORM_ENUM __C, _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128) __builtin_ia32_getmantss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- (__v4sf) __W,
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_maskz_getmant_ss (__mmask8 __U, __m128 __A, __m128 __B,
- _MM_MANTISSA_NORM_ENUM __C, _MM_MANTISSA_SIGN_ENUM __D)
- {
- return (__m128) __builtin_ia32_getmantss_mask_round ((__v4sf) __A,
- (__v4sf) __B,
- (__D << 2) | __C,
- (__v4sf)
- _mm_setzero_ps(),
- __U,
- _MM_FROUND_CUR_DIRECTION);
- }
- #else
- #define _mm512_getmant_pd(X, B, C) \
- ((__m512d)__builtin_ia32_getmantpd512_mask ((__v8df)(__m512d)(X), \
- (int)(((C)<<2) | (B)), \
- (__v8df)_mm512_undefined_pd(), \
- (__mmask8)-1,\
- _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_getmant_pd(W, U, X, B, C) \
- ((__m512d)__builtin_ia32_getmantpd512_mask ((__v8df)(__m512d)(X), \
- (int)(((C)<<2) | (B)), \
- (__v8df)(__m512d)(W), \
- (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_getmant_pd(U, X, B, C) \
- ((__m512d)__builtin_ia32_getmantpd512_mask ((__v8df)(__m512d)(X), \
- (int)(((C)<<2) | (B)), \
- (__v8df)_mm512_setzero_pd(), \
- (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- #define _mm512_getmant_ps(X, B, C) \
- ((__m512)__builtin_ia32_getmantps512_mask ((__v16sf)(__m512)(X), \
- (int)(((C)<<2) | (B)), \
- (__v16sf)_mm512_undefined_ps(), \
- (__mmask16)-1,\
- _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_getmant_ps(W, U, X, B, C) \
- ((__m512)__builtin_ia32_getmantps512_mask ((__v16sf)(__m512)(X), \
- (int)(((C)<<2) | (B)), \
- (__v16sf)(__m512)(W), \
- (__mmask16)(U),\
- _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_getmant_ps(U, X, B, C) \
- ((__m512)__builtin_ia32_getmantps512_mask ((__v16sf)(__m512)(X), \
- (int)(((C)<<2) | (B)), \
- (__v16sf)_mm512_setzero_ps(), \
- (__mmask16)(U),\
- _MM_FROUND_CUR_DIRECTION))
- /* Scalar-double getmant, macro forms.  P and Q are the two vector operands;
-    the immediate is ((HI) << 2) | (LO). */
- #define _mm_getmant_sd(P, Q, LO, HI) \
-   ((__m128d) __builtin_ia32_getmantsd_round ( \
-     (__v2df)(__m128d)(P), (__v2df)(__m128d)(Q), \
-     (int)(((HI) << 2) | (LO)), _MM_FROUND_CUR_DIRECTION))
- /* Masked builtin with caller-supplied operand OLD and mask K. */
- #define _mm_mask_getmant_sd(OLD, K, P, Q, LO, HI) \
-   ((__m128d) __builtin_ia32_getmantsd_mask_round ( \
-     (__v2df)(__m128d)(P), (__v2df)(__m128d)(Q), \
-     (int)(((HI) << 2) | (LO)), \
-     (__v2df)(__m128d)(OLD), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Masked builtin with _mm_setzero_pd () in place of OLD. */
- #define _mm_maskz_getmant_sd(K, P, Q, LO, HI) \
-   ((__m128d) __builtin_ia32_getmantsd_mask_round ( \
-     (__v2df)(__m128d)(P), (__v2df)(__m128d)(Q), \
-     (int)(((HI) << 2) | (LO)), \
-     (__v2df)_mm_setzero_pd (), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Scalar-float getmant, macro forms.  P and Q are the two vector operands;
-    the immediate is ((HI) << 2) | (LO). */
- #define _mm_getmant_ss(P, Q, LO, HI) \
-   ((__m128) __builtin_ia32_getmantss_round ( \
-     (__v4sf)(__m128)(P), (__v4sf)(__m128)(Q), \
-     (int)(((HI) << 2) | (LO)), _MM_FROUND_CUR_DIRECTION))
- /* Masked builtin with caller-supplied operand OLD and mask K. */
- #define _mm_mask_getmant_ss(OLD, K, P, Q, LO, HI) \
-   ((__m128) __builtin_ia32_getmantss_mask_round ( \
-     (__v4sf)(__m128)(P), (__v4sf)(__m128)(Q), \
-     (int)(((HI) << 2) | (LO)), \
-     (__v4sf)(__m128)(OLD), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Masked builtin with _mm_setzero_ps () in place of OLD. */
- #define _mm_maskz_getmant_ss(K, P, Q, LO, HI) \
-   ((__m128) __builtin_ia32_getmantss_mask_round ( \
-     (__v4sf)(__m128)(P), (__v4sf)(__m128)(Q), \
-     (int)(((HI) << 2) | (LO)), \
-     (__v4sf)_mm_setzero_ps (), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Scalar-float getexp, macro forms; all pass _MM_FROUND_CUR_DIRECTION.
-    Each expansion is fully parenthesised and each argument is parenthesised
-    and cast, so the macros compose safely inside larger expressions
-    (e.g. subscripting the result) and accept arbitrary argument expressions. */
- #define _mm_getexp_ss(A, B) \
- ((__m128)__builtin_ia32_getexpss128_round((__v4sf)(__m128)(A), (__v4sf)(__m128)(B), \
- _MM_FROUND_CUR_DIRECTION))
- /* Masked form: W is the extra vector operand, U the mask. */
- #define _mm_mask_getexp_ss(W, U, A, B) \
- ((__m128)__builtin_ia32_getexpss_mask_round((__v4sf)(__m128)(A), \
- (__v4sf)(__m128)(B), (__v4sf)(__m128)(W), (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- /* Masked form with _mm_setzero_ps () in place of W. */
- #define _mm_maskz_getexp_ss(U, A, B) \
- ((__m128)__builtin_ia32_getexpss_mask_round((__v4sf)(__m128)(A), \
- (__v4sf)(__m128)(B), (__v4sf)_mm_setzero_ps(), (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- /* Scalar-double getexp, macro forms; all pass _MM_FROUND_CUR_DIRECTION.
-    Each expansion is fully parenthesised and each argument is parenthesised
-    and cast, so the macros compose safely inside larger expressions
-    (e.g. subscripting the result) and accept arbitrary argument expressions. */
- #define _mm_getexp_sd(A, B) \
- ((__m128d)__builtin_ia32_getexpsd128_round((__v2df)(__m128d)(A), (__v2df)(__m128d)(B),\
- _MM_FROUND_CUR_DIRECTION))
- /* Masked form: W is the extra vector operand, U the mask. */
- #define _mm_mask_getexp_sd(W, U, A, B) \
- ((__m128d)__builtin_ia32_getexpsd_mask_round((__v2df)(__m128d)(A), \
- (__v2df)(__m128d)(B), (__v2df)(__m128d)(W), (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- /* Masked form with _mm_setzero_pd () in place of W. */
- #define _mm_maskz_getexp_sd(U, A, B) \
- ((__m128d)__builtin_ia32_getexpsd_mask_round((__v2df)(__m128d)(A), \
- (__v2df)(__m128d)(B), (__v2df)_mm_setzero_pd(), (__mmask8)(U),\
- _MM_FROUND_CUR_DIRECTION))
- /* Packed-float getexp, macro forms: (value, third operand, mask,
-    _MM_FROUND_CUR_DIRECTION) are forwarded to the one builtin. */
- #define _mm512_getexp_ps(V) \
-   ((__m512) __builtin_ia32_getexpps512_mask ( \
-     (__v16sf)(__m512)(V), (__v16sf)_mm512_undefined_ps (), \
-     (__mmask16)-1, _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_getexp_ps(OLD, K, V) \
-   ((__m512) __builtin_ia32_getexpps512_mask ( \
-     (__v16sf)(__m512)(V), (__v16sf)(__m512)(OLD), \
-     (__mmask16)(K), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_getexp_ps(K, V) \
-   ((__m512) __builtin_ia32_getexpps512_mask ( \
-     (__v16sf)(__m512)(V), (__v16sf)_mm512_setzero_ps (), \
-     (__mmask16)(K), _MM_FROUND_CUR_DIRECTION))
- /* Packed-double getexp, macro forms: (value, third operand, mask,
-    _MM_FROUND_CUR_DIRECTION) are forwarded to the one builtin. */
- #define _mm512_getexp_pd(V) \
-   ((__m512d) __builtin_ia32_getexppd512_mask ( \
-     (__v8df)(__m512d)(V), (__v8df)_mm512_undefined_pd (), \
-     (__mmask8)-1, _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_getexp_pd(OLD, K, V) \
-   ((__m512d) __builtin_ia32_getexppd512_mask ( \
-     (__v8df)(__m512d)(V), (__v8df)(__m512d)(OLD), \
-     (__mmask8)(K), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_getexp_pd(K, V) \
-   ((__m512d) __builtin_ia32_getexppd512_mask ( \
-     (__v8df)(__m512d)(V), (__v8df)_mm512_setzero_pd (), \
-     (__mmask8)(K), _MM_FROUND_CUR_DIRECTION))
- #endif
- #ifdef __OPTIMIZE__
- /* Unmasked packed-float roundscale: third builtin operand is
-    _mm512_undefined_ps (), mask is -1. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_roundscale_ps (__m512 __A, const int __imm)
- {
-   const __v16sf __src = (__v16sf) __A;
-   const __v16sf __other = (__v16sf) _mm512_undefined_ps ();
-   return (__m512) __builtin_ia32_rndscaleps_mask (__src, __imm, __other, -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Masked form: operates on __C, with __A as third builtin operand and __B
-    as the mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_roundscale_ps (__m512 __A, __mmask16 __B, __m512 __C,
-                            const int __imm)
- {
-   const __v16sf __src = (__v16sf) __C;
-   const __v16sf __other = (__v16sf) __A;
-   return (__m512) __builtin_ia32_rndscaleps_mask (__src, __imm, __other,
-                                                   (__mmask16) __B,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Zero-masked form: operates on __B, with _mm512_setzero_ps () as third
-    builtin operand and __A as the mask. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_roundscale_ps (__mmask16 __A, __m512 __B, const int __imm)
- {
-   const __v16sf __src = (__v16sf) __B;
-   const __v16sf __other = (__v16sf) _mm512_setzero_ps ();
-   return (__m512) __builtin_ia32_rndscaleps_mask (__src, __imm, __other,
-                                                   (__mmask16) __A,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Unmasked packed-double roundscale: third builtin operand is
-    _mm512_undefined_pd (), mask is -1. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_roundscale_pd (__m512d __A, const int __imm)
- {
-   const __v8df __src = (__v8df) __A;
-   const __v8df __other = (__v8df) _mm512_undefined_pd ();
-   return (__m512d) __builtin_ia32_rndscalepd_mask (__src, __imm, __other, -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Masked form: operates on __C, with __A as third builtin operand and __B
-    as the mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_roundscale_pd (__m512d __A, __mmask8 __B, __m512d __C,
-                            const int __imm)
- {
-   const __v8df __src = (__v8df) __C;
-   const __v8df __other = (__v8df) __A;
-   return (__m512d) __builtin_ia32_rndscalepd_mask (__src, __imm, __other,
-                                                    (__mmask8) __B,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Zero-masked form: operates on __B, with _mm512_setzero_pd () as third
-    builtin operand and __A as the mask. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_maskz_roundscale_pd (__mmask8 __A, __m512d __B, const int __imm)
- {
-   const __v8df __src = (__v8df) __B;
-   const __v8df __other = (__v8df) _mm512_setzero_pd ();
-   return (__m512d) __builtin_ia32_rndscalepd_mask (__src, __imm, __other,
-                                                    (__mmask8) __A,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-float roundscale: forwards __A, __B and the immediate __imm to the
-    builtin with _MM_FROUND_CUR_DIRECTION. */
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_roundscale_ss (__m128 __A, __m128 __B, const int __imm)
- {
-   const __v4sf __first = (__v4sf) __A;
-   const __v4sf __second = (__v4sf) __B;
-   return (__m128) __builtin_ia32_rndscaless_round (__first, __second, __imm,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-double roundscale: forwards __A, __B and the immediate __imm to the
-    builtin with _MM_FROUND_CUR_DIRECTION. */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_roundscale_sd (__m128d __A, __m128d __B, const int __imm)
- {
-   const __v2df __first = (__v2df) __A;
-   const __v2df __second = (__v2df) __B;
-   return (__m128d) __builtin_ia32_rndscalesd_round (__first, __second, __imm,
-                                                     _MM_FROUND_CUR_DIRECTION);
- }
- #else
- /* Packed-float roundscale, macro forms.  Builtin operands are
-    (value, immediate, third operand, mask, _MM_FROUND_CUR_DIRECTION). */
- #define _mm512_roundscale_ps(V, IMM) \
-   ((__m512) __builtin_ia32_rndscaleps_mask ( \
-     (__v16sf)(__m512)(V), (int)(IMM), \
-     (__v16sf)_mm512_undefined_ps (), (__mmask16)(-1), \
-     _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_roundscale_ps(OLD, K, V, IMM) \
-   ((__m512) __builtin_ia32_rndscaleps_mask ( \
-     (__v16sf)(__m512)(V), (int)(IMM), \
-     (__v16sf)(__m512)(OLD), (__mmask16)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_roundscale_ps(K, V, IMM) \
-   ((__m512) __builtin_ia32_rndscaleps_mask ( \
-     (__v16sf)(__m512)(V), (int)(IMM), \
-     (__v16sf)_mm512_setzero_ps (), (__mmask16)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Packed-double roundscale, macro forms.  Builtin operands are
-    (value, immediate, third operand, mask, _MM_FROUND_CUR_DIRECTION). */
- #define _mm512_roundscale_pd(V, IMM) \
-   ((__m512d) __builtin_ia32_rndscalepd_mask ( \
-     (__v8df)(__m512d)(V), (int)(IMM), \
-     (__v8df)_mm512_undefined_pd (), (__mmask8)(-1), \
-     _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_roundscale_pd(OLD, K, V, IMM) \
-   ((__m512d) __builtin_ia32_rndscalepd_mask ( \
-     (__v8df)(__m512d)(V), (int)(IMM), \
-     (__v8df)(__m512d)(OLD), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- #define _mm512_maskz_roundscale_pd(K, V, IMM) \
-   ((__m512d) __builtin_ia32_rndscalepd_mask ( \
-     (__v8df)(__m512d)(V), (int)(IMM), \
-     (__v8df)_mm512_setzero_pd (), (__mmask8)(K), \
-     _MM_FROUND_CUR_DIRECTION))
- /* Scalar roundscale, macro forms: two vector operands P and Q, the
-    immediate IMM, then _MM_FROUND_CUR_DIRECTION. */
- #define _mm_roundscale_ss(P, Q, IMM) \
-   ((__m128) __builtin_ia32_rndscaless_round ( \
-     (__v4sf)(__m128)(P), (__v4sf)(__m128)(Q), \
-     (int)(IMM), _MM_FROUND_CUR_DIRECTION))
- #define _mm_roundscale_sd(P, Q, IMM) \
-   ((__m128d) __builtin_ia32_rndscalesd_round ( \
-     (__v2df)(__m128d)(P), (__v2df)(__m128d)(Q), \
-     (int)(IMM), _MM_FROUND_CUR_DIRECTION))
- #endif
- #ifdef __OPTIMIZE__
- /* Compare packed doubles __X and __Y under predicate __P; mask is all ones. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_pd_mask (__m512d __X, __m512d __Y, const int __P)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, __P,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Compare packed floats __X and __Y under predicate __P; mask is all ones. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmp_ps_mask (__m512 __X, __m512 __Y, const int __P)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, __P,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare under predicate __P with caller mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y, const int __P)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, __P,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare under predicate __P with caller mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmp_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y, const int __P)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, __P,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_EQ_OQ, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_EQ_OQ,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_EQ_OQ, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_EQ_OQ,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_LT_OS, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_LT_OS,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_LT_OS, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_LT_OS,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_LE_OS, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_LE_OS,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_LE_OS, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_LE_OS,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_UNORD_Q, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpunord_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_UNORD_Q,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_UNORD_Q, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpunord_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_UNORD_Q,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NEQ_UQ, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NEQ_UQ,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NEQ_UQ, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NEQ_UQ,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NLT_US, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpnlt_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NLT_US,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NLT_US, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpnlt_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NLT_US,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NLE_US, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpnle_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NLE_US,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_NLE_US, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpnle_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_NLE_US,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_ORD_Q, all-ones mask. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpord_pd_mask (__m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_ORD_Q,
-                                                   (__mmask8) -1,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-double compare with fixed predicate _CMP_ORD_Q, mask __U. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpord_pd_mask (__mmask8 __U, __m512d __X, __m512d __Y)
- {
-   const __v8df __lhs = (__v8df) __X;
-   const __v8df __rhs = (__v8df) __Y;
-   return (__mmask8) __builtin_ia32_cmppd512_mask (__lhs, __rhs, _CMP_ORD_Q,
-                                                   (__mmask8) __U,
-                                                   _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_EQ_OQ, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_EQ_OQ,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_EQ_OQ, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_EQ_OQ,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_LT_OS, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmplt_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_LT_OS,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_LT_OS, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmplt_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_LT_OS,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_LE_OS, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmple_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_LE_OS,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_LE_OS, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmple_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_LE_OS,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_UNORD_Q, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpunord_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_UNORD_Q,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_UNORD_Q, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpunord_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_UNORD_Q,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NEQ_UQ, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpneq_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NEQ_UQ,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NEQ_UQ, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpneq_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NEQ_UQ,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NLT_US, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpnlt_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NLT_US,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NLT_US, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpnlt_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NLT_US,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NLE_US, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpnle_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NLE_US,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_NLE_US, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpnle_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_NLE_US,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_ORD_Q, all-ones mask. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpord_ps_mask (__m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_ORD_Q,
-                                                    (__mmask16) -1,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Packed-float compare with fixed predicate _CMP_ORD_Q, mask __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpord_ps_mask (__mmask16 __U, __m512 __X, __m512 __Y)
- {
-   const __v16sf __lhs = (__v16sf) __X;
-   const __v16sf __rhs = (__v16sf) __Y;
-   return (__mmask16) __builtin_ia32_cmpps512_mask (__lhs, __rhs, _CMP_ORD_Q,
-                                                    (__mmask16) __U,
-                                                    _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-double compare under predicate __P; mask is all ones. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cmp_sd_mask (__m128d __X, __m128d __Y, const int __P)
- {
-   const __v2df __lhs = (__v2df) __X;
-   const __v2df __rhs = (__v2df) __Y;
-   return (__mmask8) __builtin_ia32_cmpsd_mask (__lhs, __rhs, __P,
-                                                (__mmask8) -1,
-                                                _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-double compare under predicate __P with caller mask __M. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_cmp_sd_mask (__mmask8 __M, __m128d __X, __m128d __Y, const int __P)
- {
-   const __v2df __lhs = (__v2df) __X;
-   const __v2df __rhs = (__v2df) __Y;
-   return (__mmask8) __builtin_ia32_cmpsd_mask (__lhs, __rhs, __P,
-                                                (__mmask8) __M,
-                                                _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-float compare under predicate __P; mask is all ones. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_cmp_ss_mask (__m128 __X, __m128 __Y, const int __P)
- {
-   const __v4sf __lhs = (__v4sf) __X;
-   const __v4sf __rhs = (__v4sf) __Y;
-   return (__mmask8) __builtin_ia32_cmpss_mask (__lhs, __rhs, __P,
-                                                (__mmask8) -1,
-                                                _MM_FROUND_CUR_DIRECTION);
- }
- /* Scalar-float compare under predicate __P with caller mask __M. */
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm_mask_cmp_ss_mask (__mmask8 __M, __m128 __X, __m128 __Y, const int __P)
- {
-   const __v4sf __lhs = (__v4sf) __X;
-   const __v4sf __rhs = (__v4sf) __Y;
-   return (__mmask8) __builtin_ia32_cmpss_mask (__lhs, __rhs, __P,
-                                                (__mmask8) __M,
-                                                _MM_FROUND_CUR_DIRECTION);
- }
- #else
- /* Macro forms of the generic compare-to-mask intrinsics, used when
-    __OPTIMIZE__ is not defined.  X and Y are the operands, P the predicate
-    immediate, M the caller's mask.  M is always parenthesised before the cast
-    so that arguments such as `m >> 8` or `c ? a : b` are converted as a
-    whole, matching the inline-function forms.
-    NOTE(review): the fixed-predicate wrappers (_mm512_cmpeq_pd_mask etc.)
-    appear only in the __OPTIMIZE__ branch above -- confirm they are also
-    available when __OPTIMIZE__ is not defined. */
- #define _mm512_cmp_pd_mask(X, Y, P) \
- ((__mmask8) __builtin_ia32_cmppd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (int)(P),\
- (__mmask8)-1,_MM_FROUND_CUR_DIRECTION))
- #define _mm512_cmp_ps_mask(X, Y, P) \
- ((__mmask16) __builtin_ia32_cmpps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (int)(P),\
- (__mmask16)-1,_MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_cmp_pd_mask(M, X, Y, P) \
- ((__mmask8) __builtin_ia32_cmppd512_mask ((__v8df)(__m512d)(X), \
- (__v8df)(__m512d)(Y), (int)(P),\
- (__mmask8)(M), _MM_FROUND_CUR_DIRECTION))
- #define _mm512_mask_cmp_ps_mask(M, X, Y, P) \
- ((__mmask16) __builtin_ia32_cmpps512_mask ((__v16sf)(__m512)(X), \
- (__v16sf)(__m512)(Y), (int)(P),\
- (__mmask16)(M),_MM_FROUND_CUR_DIRECTION))
- #define _mm_cmp_sd_mask(X, Y, P) \
- ((__mmask8) __builtin_ia32_cmpsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (int)(P),\
- (__mmask8)-1,_MM_FROUND_CUR_DIRECTION))
- #define _mm_mask_cmp_sd_mask(M, X, Y, P) \
- ((__mmask8) __builtin_ia32_cmpsd_mask ((__v2df)(__m128d)(X), \
- (__v2df)(__m128d)(Y), (int)(P),\
- (__mmask8)(M),_MM_FROUND_CUR_DIRECTION))
- #define _mm_cmp_ss_mask(X, Y, P) \
- ((__mmask8) __builtin_ia32_cmpss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (int)(P), \
- (__mmask8)-1,_MM_FROUND_CUR_DIRECTION))
- #define _mm_mask_cmp_ss_mask(M, X, Y, P) \
- ((__mmask8) __builtin_ia32_cmpss_mask ((__v4sf)(__m128)(X), \
- (__v4sf)(__m128)(Y), (int)(P), \
- (__mmask8)(M),_MM_FROUND_CUR_DIRECTION))
- #endif
- /* Returns the result of __builtin_ia32_kmovw applied to the 16-bit mask __A. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_kmov (__mmask16 __A)
- {
-   const __mmask16 __moved = __builtin_ia32_kmovw (__A);
-   return __moved;
- }
- /* Same-width 512-bit casts: each function is a single vector cast of its
-    argument to the return type. */
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd_ps (__m512d __A)
- {
-   const __m512 __bits = (__m512) (__A);
-   return __bits;
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd_si512 (__m512d __A)
- {
-   const __m512i __bits = (__m512i) (__A);
-   return __bits;
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps_pd (__m512 __A)
- {
-   const __m512d __bits = (__m512d) (__A);
-   return __bits;
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps_si512 (__m512 __A)
- {
-   const __m512i __bits = (__m512i) (__A);
-   return __bits;
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi512_ps (__m512i __A)
- {
-   const __m512 __bits = (__m512) (__A);
-   return __bits;
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi512_pd (__m512i __A)
- {
-   const __m512d __bits = (__m512d) (__A);
-   return __bits;
- }
- /* 512 -> 128/256-bit casts, each implemented as an extract at index 0
-    followed (where needed) by a vector cast to the return type. */
- extern __inline __m128d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd512_pd128 (__m512d __A)
- {
-   const __m512 __as_ps = (__m512) __A;
-   return (__m128d) _mm512_extractf32x4_ps (__as_ps, 0);
- }
- extern __inline __m128
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps512_ps128 (__m512 __A)
- {
-   const __m128 __part = _mm512_extractf32x4_ps (__A, 0);
-   return __part;
- }
- extern __inline __m128i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi512_si128 (__m512i __A)
- {
-   const __m512i __as_si = (__m512i) __A;
-   return (__m128i) _mm512_extracti32x4_epi32 (__as_si, 0);
- }
- extern __inline __m256d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd512_pd256 (__m512d __A)
- {
-   const __m256d __part = _mm512_extractf64x4_pd (__A, 0);
-   return __part;
- }
- extern __inline __m256
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps512_ps256 (__m512 __A)
- {
-   const __m512d __as_pd = (__m512d) __A;
-   return (__m256) _mm512_extractf64x4_pd (__as_pd, 0);
- }
- extern __inline __m256i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi512_si256 (__m512i __A)
- {
-   const __m512d __as_pd = (__m512d) __A;
-   return (__m256i) _mm512_extractf64x4_pd (__as_pd, 0);
- }
- /* 128/256 -> 512-bit casts, each a thin wrapper over the matching
-    __builtin_ia32_*512_* builtin. */
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd128_pd512 (__m128d __A)
- {
-   const __m128d __narrow = (__m128d) __A;
-   return (__m512d) __builtin_ia32_pd512_pd (__narrow);
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps128_ps512 (__m128 __A)
- {
-   const __m128 __narrow = (__m128) __A;
-   return (__m512) __builtin_ia32_ps512_ps (__narrow);
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi128_si512 (__m128i __A)
- {
-   const __v4si __narrow = (__v4si) __A;
-   return (__m512i) __builtin_ia32_si512_si (__narrow);
- }
- extern __inline __m512d
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castpd256_pd512 (__m256d __A)
- {
-   const __m512d __wide = __builtin_ia32_pd512_256pd (__A);
-   return __wide;
- }
- extern __inline __m512
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castps256_ps512 (__m256 __A)
- {
-   const __m512 __wide = __builtin_ia32_ps512_256ps (__A);
-   return __wide;
- }
- extern __inline __m512i
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_castsi256_si512 (__m256i __A)
- {
-   const __v8si __narrow = (__v8si) __A;
-   return (__m512i) __builtin_ia32_si512_256si (__narrow);
- }
- /* Unsigned-integer compares using predicate immediate 0 of the ucmp
-    builtins; the unmasked forms pass an all-ones mask, the masked forms
-    pass __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_epu32_mask (__m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 0,
-                                                    (__mmask16) -1);
- }
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_epu32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 0, __U);
- }
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpeq_epu64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 0, __U);
- }
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpeq_epu64_mask (__m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 0,
-                                                   (__mmask8) -1);
- }
- /* Unsigned-integer compares using predicate immediate 6 of the ucmp
-    builtins; the unmasked forms pass an all-ones mask, the masked forms
-    pass __U. */
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpgt_epu32_mask (__m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 6,
-                                                    (__mmask16) -1);
- }
- extern __inline __mmask16
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpgt_epu32_mask (__mmask16 __U, __m512i __A, __m512i __B)
- {
-   const __v16si __lhs = (__v16si) __A;
-   const __v16si __rhs = (__v16si) __B;
-   return (__mmask16) __builtin_ia32_ucmpd512_mask (__lhs, __rhs, 6, __U);
- }
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_cmpgt_epu64_mask (__mmask8 __U, __m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 6, __U);
- }
- extern __inline __mmask8
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_cmpgt_epu64_mask (__m512i __A, __m512i __B)
- {
-   const __v8di __lhs = (__v8di) __A;
-   const __v8di __rhs = (__v8di) __B;
-   return (__mmask8) __builtin_ia32_ucmpq512_mask (__lhs, __rhs, 6,
-                                                   (__mmask8) -1);
- }
- #undef __MM512_REDUCE_OP /* drop any earlier definition; redefined next for 32-bit integer lanes with an infix operator */
- #define __MM512_REDUCE_OP(op) /* function-body template: reads the enclosing function's __A, folds it with infix `op`, and ends in `return`, so it must be the last statement of the body */ \
- __v8si __T1 = (__v8si) _mm512_extracti64x4_epi64 (__A, 1); /* 256-bit part at index 1 */ \
- __v8si __T2 = (__v8si) _mm512_extracti64x4_epi64 (__A, 0); /* 256-bit part at index 0 */ \
- __m256i __T3 = (__m256i) (__T1 op __T2); /* element-wise combine: 16 -> 8 partial results */ \
- __v4si __T4 = (__v4si) _mm256_extracti128_si256 (__T3, 1); \
- __v4si __T5 = (__v4si) _mm256_extracti128_si256 (__T3, 0); \
- __v4si __T6 = __T4 op __T5; /* 8 -> 4 partial results */ \
- __v4si __T7 = __builtin_shuffle (__T6, (__v4si) { 2, 3, 0, 1 }); /* elements 2,3 brought to positions 0,1 */ \
- __v4si __T8 = __T6 op __T7; /* elements 0 and 1 now hold the last two partial results */ \
- return __T8[0] op __T8[1]
- extern __inline int /* `+` reduction of the 32-bit integer elements of __A; body is the __MM512_REDUCE_OP expansion */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_add_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (+);
- }
- extern __inline int /* `*` reduction of the 32-bit integer elements of __A */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_mul_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (*);
- }
- extern __inline int /* `&` reduction of the 32-bit integer elements of __A */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_and_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (&);
- }
- extern __inline int /* `|` reduction of the 32-bit integer elements of __A */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_or_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (|);
- }
- extern __inline int /* masked `+` reduction: __A is first filtered through _mm512_maskz_mov_epi32 with __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_add_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi32 (__U, __A); /* presumably zeroes unselected elements; 0 is neutral for + */
- __MM512_REDUCE_OP (+);
- }
- extern __inline int /* masked `*` reduction: __A is first merged over a vector of 1s under __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_mul_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi32 (_mm512_set1_epi32 (1), __U, __A); /* presumably unselected elements become 1, neutral for * */
- __MM512_REDUCE_OP (*);
- }
- extern __inline int /* masked `&` reduction: __A is first merged over a vector of ~0 under __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_and_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi32 (_mm512_set1_epi32 (~0), __U, __A); /* presumably unselected elements become all-ones, neutral for & */
- __MM512_REDUCE_OP (&);
- }
- extern __inline int /* masked `|` reduction: __A is first filtered through _mm512_maskz_mov_epi32 with __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_or_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi32 (__U, __A); /* presumably zeroes unselected elements; 0 is neutral for | */
- __MM512_REDUCE_OP (|);
- }
- #undef __MM512_REDUCE_OP /* drop the infix-operator version; redefined next for integer min/max, where `op` is an intrinsic-name suffix */
- #define __MM512_REDUCE_OP(op) /* function-body template: `op` is pasted onto _mm256_ and _mm_ to pick the intrinsic; reads the enclosing function's __A and ends in `return` */ \
- __m256i __T1 = (__m256i) _mm512_extracti64x4_epi64 (__A, 1); /* 256-bit part at index 1 */ \
- __m256i __T2 = (__m256i) _mm512_extracti64x4_epi64 (__A, 0); /* 256-bit part at index 0 */ \
- __m256i __T3 = _mm256_##op (__T1, __T2); /* 16 -> 8 candidates */ \
- __m128i __T4 = (__m128i) _mm256_extracti128_si256 (__T3, 1); \
- __m128i __T5 = (__m128i) _mm256_extracti128_si256 (__T3, 0); \
- __m128i __T6 = _mm_##op (__T4, __T5); /* 8 -> 4 candidates */ \
- __m128i __T7 = (__m128i) __builtin_shuffle ((__v4si) __T6, \
- (__v4si) { 2, 3, 0, 1 }); /* elements 2,3 brought to positions 0,1 */ \
- __m128i __T8 = _mm_##op (__T6, __T7); /* elements 0 and 1 hold the last two candidates */ \
- __m128i __T9 = (__m128i) __builtin_shuffle ((__v4si) __T8, \
- (__v4si) { 1, 0, 1, 0 }); /* elements 0 and 1 exchanged */ \
- __v4si __T10 = (__v4si) _mm_##op (__T8, __T9); /* element 0 now combines both candidates */ \
- return __T10[0]
- extern __inline int /* reduces __A with the min_epi32 intrinsics via __MM512_REDUCE_OP */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (min_epi32);
- }
- extern __inline int /* reduces __A with the max_epi32 intrinsics */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_epi32 (__m512i __A)
- {
- __MM512_REDUCE_OP (max_epi32);
- }
- extern __inline unsigned int /* reduces __A with the min_epu32 intrinsics; the macro's int element is converted to unsigned int on return */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_epu32 (__m512i __A)
- {
- __MM512_REDUCE_OP (min_epu32);
- }
- extern __inline unsigned int /* reduces __A with the max_epu32 intrinsics; the macro's int element is converted to unsigned int on return */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_epu32 (__m512i __A)
- {
- __MM512_REDUCE_OP (max_epu32);
- }
- extern __inline int /* masked signed-min reduction: __A is first merged over a vector of __INT_MAX__ under __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi32 (_mm512_set1_epi32 (__INT_MAX__), __U, __A); /* presumably unselected elements become INT_MAX so they cannot win a signed min */
- __MM512_REDUCE_OP (min_epi32);
- }
- extern __inline int /* masked signed-max reduction: __A is first merged over a vector of -__INT_MAX__ - 1 under __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_epi32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi32 (_mm512_set1_epi32 (-__INT_MAX__ - 1), __U, __A); /* -__INT_MAX__ - 1 is the smallest int; presumably fills unselected elements */
- __MM512_REDUCE_OP (max_epi32);
- }
- extern __inline unsigned int /* masked unsigned-min reduction: __A is first merged over a vector of ~0 under __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_epu32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi32 (_mm512_set1_epi32 (~0), __U, __A); /* ~0 is the largest unsigned 32-bit pattern; presumably fills unselected elements */
- __MM512_REDUCE_OP (min_epu32);
- }
- extern __inline unsigned int /* masked unsigned-max reduction: __A is first filtered through _mm512_maskz_mov_epi32 with __U */
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_epu32 (__mmask16 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi32 (__U, __A); /* presumably zeroes unselected elements; 0 cannot win an unsigned max */
- __MM512_REDUCE_OP (max_epu32);
- }
- #undef __MM512_REDUCE_OP /* drop the integer min/max version; redefined next for float lanes with an infix operator */
- #define __MM512_REDUCE_OP(op) /* function-body template: reads the enclosing function's __A (a __m512), folds it with infix `op`, and ends in `return` */ \
- __m256 __T1 = (__m256) _mm512_extractf64x4_pd ((__m512d) __A, 1); /* 256-bit part at index 1, viewed as floats */ \
- __m256 __T2 = (__m256) _mm512_extractf64x4_pd ((__m512d) __A, 0); /* 256-bit part at index 0, viewed as floats */ \
- __m256 __T3 = __T1 op __T2; /* 16 -> 8 partial results */ \
- __m128 __T4 = _mm256_extractf128_ps (__T3, 1); \
- __m128 __T5 = _mm256_extractf128_ps (__T3, 0); \
- __m128 __T6 = __T4 op __T5; /* 8 -> 4 partial results */ \
- __m128 __T7 = __builtin_shuffle (__T6, (__v4si) { 2, 3, 0, 1 }); /* elements 2,3 brought to positions 0,1 */ \
- __m128 __T8 = __T6 op __T7; /* elements 0 and 1 hold the last two partial results */ \
- return __T8[0] op __T8[1]
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_add_ps (__m512 __A)
- {
- __MM512_REDUCE_OP (+);
- }
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_mul_ps (__m512 __A)
- {
- __MM512_REDUCE_OP (*);
- }
- /* Return the sum of the elements of __A selected by mask __U.  __A is
-    first passed through _mm512_maskz_mov_ps, which per the Intel
-    documentation zeroes lanes whose mask bit is clear, so unselected
-    lanes contribute nothing to the sum.  __MM512_REDUCE_OP supplies the
-    return statement.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_add_ps (__mmask16 __U, __m512 __A)
- {
- __A = _mm512_maskz_mov_ps (__U, __A);
- __MM512_REDUCE_OP (+);
- }
- /* Return the product of the elements of __A selected by mask __U.  __A
-    is first merged with a vector of 1.0f via _mm512_mask_mov_ps; per the
-    Intel documentation, lanes whose mask bit is clear take the 1.0f
-    filler, the multiplicative identity, so they do not change the
-    product.  __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_mul_ps (__mmask16 __U, __m512 __A)
- {
- __A = _mm512_mask_mov_ps (_mm512_set1_ps (1.0f), __U, __A);
- __MM512_REDUCE_OP (*);
- }
- #undef __MM512_REDUCE_OP
- /* Single-precision reduction body for an intrinsic name suffix OP (used
-    below with min_ps and max_ps).  OP is token-pasted onto _mm256_ and
-    _mm_ to name the 256-bit and 128-bit intrinsics that do the combining.
-    The expansion reads a variable named __A from the enclosing function:
-      __T1/__T2  the two 256-bit halves of __A (extract index 1 and 0),
-      __T3       _mm256_OP of those halves,
-      __T4/__T5  the two 128-bit halves of __T3,
-      __T6       _mm_OP of those halves,
-      __T7/__T8  __T6 shuffled by { 2, 3, 0, 1 }, then combined with __T6,
-      __T9/__T10 __T8 shuffled by { 1, 0, 1, 0 }, then combined with __T8,
-    and returns element 0 of __T10.  The expansion ends in a `return'
-    with no trailing semicolon, so the caller writes the semicolon and
-    must use the macro as its final statement.  */
- #define __MM512_REDUCE_OP(op) \
- __m256 __T1 = (__m256) _mm512_extractf64x4_pd ((__m512d) __A, 1); \
- __m256 __T2 = (__m256) _mm512_extractf64x4_pd ((__m512d) __A, 0); \
- __m256 __T3 = _mm256_##op (__T1, __T2); \
- __m128 __T4 = _mm256_extractf128_ps (__T3, 1); \
- __m128 __T5 = _mm256_extractf128_ps (__T3, 0); \
- __m128 __T6 = _mm_##op (__T4, __T5); \
- __m128 __T7 = __builtin_shuffle (__T6, (__v4si) { 2, 3, 0, 1 }); \
- __m128 __T8 = _mm_##op (__T6, __T7); \
- __m128 __T9 = __builtin_shuffle (__T8, (__v4si) { 1, 0, 1, 0 }); \
- __m128 __T10 = _mm_##op (__T8, __T9); \
- return __T10[0]
- /* Reduce all elements of __A to a single float with the min_ps
-    intrinsics.  The whole body, including the return statement, is the
-    intrinsic-suffix form of __MM512_REDUCE_OP, which expands to
-    _mm256_min_ps and _mm_min_ps calls.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_ps (__m512 __A)
- {
- __MM512_REDUCE_OP (min_ps);
- }
- /* Reduce all elements of __A to a single float with the max_ps
-    intrinsics.  The whole body, including the return statement, is the
-    intrinsic-suffix form of __MM512_REDUCE_OP, which expands to
-    _mm256_max_ps and _mm_max_ps calls.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_ps (__m512 __A)
- {
- __MM512_REDUCE_OP (max_ps);
- }
- /* Masked min_ps reduction of __A.  __A is first merged with a vector of
-    +infinity (__builtin_inff ()) via _mm512_mask_mov_ps; per the Intel
-    documentation, lanes whose bit in __U is clear take that filler, so
-    they cannot be smaller than any selected lane.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_ps (__mmask16 __U, __m512 __A)
- {
- __A = _mm512_mask_mov_ps (_mm512_set1_ps (__builtin_inff ()), __U, __A);
- __MM512_REDUCE_OP (min_ps);
- }
- /* Masked max_ps reduction of __A.  __A is first merged with a vector of
-    -infinity (-__builtin_inff ()) via _mm512_mask_mov_ps; per the Intel
-    documentation, lanes whose bit in __U is clear take that filler, so
-    they cannot be larger than any selected lane.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline float
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_ps (__mmask16 __U, __m512 __A)
- {
- __A = _mm512_mask_mov_ps (_mm512_set1_ps (-__builtin_inff ()), __U, __A);
- __MM512_REDUCE_OP (max_ps);
- }
- #undef __MM512_REDUCE_OP
- /* 64-bit integer reduction body for an infix operator OP (used below
-    with +, *, & and |).  The expansion reads a variable named __A from
-    the enclosing function:
-      __T1/__T2  the two 256-bit halves of __A (extract index 1 and 0),
-                 viewed as __v4di,
-      __T3       those halves combined element-wise with OP,
-      __T4/__T5  the two 128-bit halves of __T3, viewed as __v2di,
-      __T6       those halves combined with OP,
-    and returns __T6[0] OP __T6[1].  The expansion ends in a `return'
-    with no trailing semicolon, so the caller writes the semicolon and
-    must use the macro as its final statement.  */
- #define __MM512_REDUCE_OP(op) \
- __v4di __T1 = (__v4di) _mm512_extracti64x4_epi64 (__A, 1); \
- __v4di __T2 = (__v4di) _mm512_extracti64x4_epi64 (__A, 0); \
- __m256i __T3 = (__m256i) (__T1 op __T2); \
- __v2di __T4 = (__v2di) _mm256_extracti128_si256 (__T3, 1); \
- __v2di __T5 = (__v2di) _mm256_extracti128_si256 (__T3, 0); \
- __v2di __T6 = __T4 op __T5; \
- return __T6[0] op __T6[1]
- /* Return the sum of all 64-bit elements of __A as a long long.  The
-    whole body, including the return statement, is the operator form of
-    __MM512_REDUCE_OP instantiated with +.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_add_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (+);
- }
- /* Return the product of all 64-bit elements of __A as a long long.  The
-    whole body, including the return statement, is the operator form of
-    __MM512_REDUCE_OP instantiated with *.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_mul_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (*);
- }
- /* Return the bitwise AND of all 64-bit elements of __A as a long long.
-    The whole body, including the return statement, is the operator form
-    of __MM512_REDUCE_OP instantiated with &.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_and_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (&);
- }
- /* Return the bitwise OR of all 64-bit elements of __A as a long long.
-    The whole body, including the return statement, is the operator form
-    of __MM512_REDUCE_OP instantiated with |.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_or_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (|);
- }
- /* Return the sum of the 64-bit elements of __A selected by mask __U.
-    __A is first passed through _mm512_maskz_mov_epi64, which per the
-    Intel documentation zeroes lanes whose mask bit is clear, so they add
-    nothing.  __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_add_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi64 (__U, __A);
- __MM512_REDUCE_OP (+);
- }
- /* Return the product of the 64-bit elements of __A selected by mask __U.
-    __A is first merged with a vector of 1LL via _mm512_mask_mov_epi64;
-    per the Intel documentation, lanes whose mask bit is clear take the
-    filler, and 1 is the multiplicative identity.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_mul_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi64 (_mm512_set1_epi64 (1LL), __U, __A);
- __MM512_REDUCE_OP (*);
- }
- /* Return the bitwise AND of the 64-bit elements of __A selected by mask
-    __U.  __A is first merged with a vector of ~0LL (all bits set) via
-    _mm512_mask_mov_epi64; per the Intel documentation, lanes whose mask
-    bit is clear take the filler, which leaves an AND unchanged.
-    __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_and_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi64 (_mm512_set1_epi64 (~0LL), __U, __A);
- __MM512_REDUCE_OP (&);
- }
- /* Return the bitwise OR of the 64-bit elements of __A selected by mask
-    __U.  __A is first passed through _mm512_maskz_mov_epi64, which per
-    the Intel documentation zeroes lanes whose mask bit is clear; zero
-    leaves an OR unchanged.  __MM512_REDUCE_OP supplies the return
-    statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_or_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi64 (__U, __A);
- __MM512_REDUCE_OP (|);
- }
- #undef __MM512_REDUCE_OP
- /* 64-bit integer reduction body for an intrinsic name suffix OP (used
-    below with min/max_epi64 and min/max_epu64).  OP is token-pasted onto
-    _mm512_, so unlike the other forms every step stays 512 bits wide.
-    The expansion reads a variable named __A from the enclosing function:
-      __T1  __A permuted by _mm512_shuffle_i64x2 with selector 0x4e
-            (presumably swapping the two 256-bit halves -- confirm against
-            the Intel documentation),
-      __T2  _mm512_OP of __A and __T1,
-      __T3  __T2 shuffled as __v8di by { 2, 3, 0, 1, 6, 7, 4, 5 },
-      __T4  _mm512_OP of __T2 and __T3,
-      __T5  __T4 shuffled as __v8di by { 1, 0, 3, 2, 5, 4, 7, 6 },
-      __T6  _mm512_OP of __T4 and __T5, viewed as __v8di,
-    and returns element 0 of __T6.  The expansion ends in a `return'
-    with no trailing semicolon, so the caller writes the semicolon and
-    must use the macro as its final statement.  */
- #define __MM512_REDUCE_OP(op) \
- __m512i __T1 = _mm512_shuffle_i64x2 (__A, __A, 0x4e); \
- __m512i __T2 = _mm512_##op (__A, __T1); \
- __m512i __T3 \
- = (__m512i) __builtin_shuffle ((__v8di) __T2, \
- (__v8di) { 2, 3, 0, 1, 6, 7, 4, 5 });\
- __m512i __T4 = _mm512_##op (__T2, __T3); \
- __m512i __T5 \
- = (__m512i) __builtin_shuffle ((__v8di) __T4, \
- (__v8di) { 1, 0, 3, 2, 5, 4, 7, 6 });\
- __v8di __T6 = (__v8di) _mm512_##op (__T4, __T5); \
- return __T6[0]
- /* Reduce all 64-bit elements of __A to a single long long with
-    _mm512_min_epi64.  The whole body, including the return statement, is
-    the 512-bit intrinsic-suffix form of __MM512_REDUCE_OP.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (min_epi64);
- }
- /* Reduce all 64-bit elements of __A to a single long long with
-    _mm512_max_epi64.  The whole body, including the return statement, is
-    the 512-bit intrinsic-suffix form of __MM512_REDUCE_OP.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_epi64 (__m512i __A)
- {
- __MM512_REDUCE_OP (max_epi64);
- }
- /* Masked _mm512_min_epi64 reduction of __A.  __A is first merged with a
-    vector of __LONG_LONG_MAX__ via _mm512_mask_mov_epi64; per the Intel
-    documentation, lanes whose bit in __U is clear take that filler, so
-    they cannot win a signed minimum.  __MM512_REDUCE_OP supplies the
-    return statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi64 (_mm512_set1_epi64 (__LONG_LONG_MAX__),
- __U, __A);
- __MM512_REDUCE_OP (min_epi64);
- }
- /* Masked _mm512_max_epi64 reduction of __A.  __A is first merged with a
-    vector of -__LONG_LONG_MAX__ - 1 (the smallest long long) via
-    _mm512_mask_mov_epi64; per the Intel documentation, lanes whose bit
-    in __U is clear take that filler, so they cannot win a signed
-    maximum.  __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_epi64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi64 (_mm512_set1_epi64 (-__LONG_LONG_MAX__ - 1),
- __U, __A);
- __MM512_REDUCE_OP (max_epi64);
- }
- /* Reduce all 64-bit elements of __A to a single unsigned long long with
-    _mm512_min_epu64.  The whole body, including the return statement, is
-    the 512-bit intrinsic-suffix form of __MM512_REDUCE_OP.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_epu64 (__m512i __A)
- {
- __MM512_REDUCE_OP (min_epu64);
- }
- /* Reduce all 64-bit elements of __A to a single unsigned long long with
-    _mm512_max_epu64.  The whole body, including the return statement, is
-    the 512-bit intrinsic-suffix form of __MM512_REDUCE_OP.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_epu64 (__m512i __A)
- {
- __MM512_REDUCE_OP (max_epu64);
- }
- /* Masked _mm512_min_epu64 reduction of __A.  __A is first merged with a
-    vector of ~0LL (all bits set, i.e. the largest unsigned 64-bit value)
-    via _mm512_mask_mov_epi64; per the Intel documentation, lanes whose
-    bit in __U is clear take that filler, so they cannot win an unsigned
-    minimum.  __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_epu64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_mask_mov_epi64 (_mm512_set1_epi64 (~0LL), __U, __A);
- __MM512_REDUCE_OP (min_epu64);
- }
- /* Masked _mm512_max_epu64 reduction of __A.  __A is first passed through
-    _mm512_maskz_mov_epi64, which per the Intel documentation zeroes
-    lanes whose bit in __U is clear; zero is the smallest unsigned value,
-    so those lanes cannot win an unsigned maximum.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline unsigned long long
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_epu64 (__mmask8 __U, __m512i __A)
- {
- __A = _mm512_maskz_mov_epi64 (__U, __A);
- __MM512_REDUCE_OP (max_epu64);
- }
- #undef __MM512_REDUCE_OP
- /* Double-precision reduction body for an infix operator OP (used below
-    with + and *).  The expansion reads a variable named __A from the
-    enclosing function and passes it to _mm512_extractf64x4_pd uncast:
-      __T1/__T2  the two 256-bit halves of __A (extract index 1 and 0),
-      __T3       those halves combined element-wise with OP,
-      __T4/__T5  the two 128-bit halves of __T3,
-      __T6       those halves combined with OP,
-    and returns __T6[0] OP __T6[1].  The expansion ends in a `return'
-    with no trailing semicolon, so the caller writes the semicolon and
-    must use the macro as its final statement.  */
- #define __MM512_REDUCE_OP(op) \
- __m256d __T1 = (__m256d) _mm512_extractf64x4_pd (__A, 1); \
- __m256d __T2 = (__m256d) _mm512_extractf64x4_pd (__A, 0); \
- __m256d __T3 = __T1 op __T2; \
- __m128d __T4 = _mm256_extractf128_pd (__T3, 1); \
- __m128d __T5 = _mm256_extractf128_pd (__T3, 0); \
- __m128d __T6 = __T4 op __T5; \
- return __T6[0] op __T6[1]
- /* Return the sum of all elements of __A as a double.  The whole body,
-    including the return statement, is the operator form of
-    __MM512_REDUCE_OP instantiated with +, so the additions are performed
-    pairwise across vector halves rather than strictly left to right.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_add_pd (__m512d __A)
- {
- __MM512_REDUCE_OP (+);
- }
- /* Return the product of all elements of __A as a double.  The whole
-    body, including the return statement, is the operator form of
-    __MM512_REDUCE_OP instantiated with *, so the multiplications are
-    performed pairwise across vector halves.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_mul_pd (__m512d __A)
- {
- __MM512_REDUCE_OP (*);
- }
- /* Return the sum of the elements of __A selected by mask __U.  __A is
-    first passed through _mm512_maskz_mov_pd, which per the Intel
-    documentation zeroes lanes whose mask bit is clear, so unselected
-    lanes contribute nothing to the sum.  __MM512_REDUCE_OP supplies the
-    return statement.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_add_pd (__mmask8 __U, __m512d __A)
- {
- __A = _mm512_maskz_mov_pd (__U, __A);
- __MM512_REDUCE_OP (+);
- }
- /* Return the product of the elements of __A selected by mask __U.  __A
-    is first merged with a vector of 1.0 via _mm512_mask_mov_pd; per the
-    Intel documentation, lanes whose mask bit is clear take the 1.0
-    filler, the multiplicative identity, so they do not change the
-    product.  __MM512_REDUCE_OP supplies the return statement.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_mul_pd (__mmask8 __U, __m512d __A)
- {
- __A = _mm512_mask_mov_pd (_mm512_set1_pd (1.0), __U, __A);
- __MM512_REDUCE_OP (*);
- }
- #undef __MM512_REDUCE_OP
- /* Double-precision reduction body for an intrinsic name suffix OP (used
-    below with min_pd and max_pd).  OP is token-pasted onto _mm256_ and
-    _mm_ to name the 256-bit and 128-bit intrinsics that do the combining.
-    The expansion reads a variable named __A from the enclosing function:
-      __T1/__T2  the two 256-bit halves of __A (extract index 1 and 0),
-      __T3       _mm256_OP of those halves,
-      __T4/__T5  the two 128-bit halves of __T3,
-      __T6       _mm_OP of those halves,
-      __T7       __T6 with its two elements swapped (shuffle { 1, 0 }),
-      __T8       _mm_OP of __T6 and __T7,
-    and returns element 0 of __T8.  The expansion ends in a `return'
-    with no trailing semicolon, so the caller writes the semicolon and
-    must use the macro as its final statement.  */
- #define __MM512_REDUCE_OP(op) \
- __m256d __T1 = (__m256d) _mm512_extractf64x4_pd (__A, 1); \
- __m256d __T2 = (__m256d) _mm512_extractf64x4_pd (__A, 0); \
- __m256d __T3 = _mm256_##op (__T1, __T2); \
- __m128d __T4 = _mm256_extractf128_pd (__T3, 1); \
- __m128d __T5 = _mm256_extractf128_pd (__T3, 0); \
- __m128d __T6 = _mm_##op (__T4, __T5); \
- __m128d __T7 = (__m128d) __builtin_shuffle (__T6, (__v2di) { 1, 0 }); \
- __m128d __T8 = _mm_##op (__T6, __T7); \
- return __T8[0]
- /* Reduce all elements of __A to a single double with the min_pd
-    intrinsics.  The whole body, including the return statement, is the
-    intrinsic-suffix form of __MM512_REDUCE_OP, which expands to
-    _mm256_min_pd and _mm_min_pd calls.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_min_pd (__m512d __A)
- {
- __MM512_REDUCE_OP (min_pd);
- }
- /* Reduce all elements of __A to a single double with the max_pd
-    intrinsics.  The whole body, including the return statement, is the
-    intrinsic-suffix form of __MM512_REDUCE_OP, which expands to
-    _mm256_max_pd and _mm_max_pd calls.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_reduce_max_pd (__m512d __A)
- {
- __MM512_REDUCE_OP (max_pd);
- }
- /* Masked min_pd reduction of __A.  __A is first merged with a vector of
-    +infinity (__builtin_inf ()) via _mm512_mask_mov_pd; per the Intel
-    documentation, lanes whose bit in __U is clear take that filler, so
-    they cannot be smaller than any selected lane.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_min_pd (__mmask8 __U, __m512d __A)
- {
- __A = _mm512_mask_mov_pd (_mm512_set1_pd (__builtin_inf ()), __U, __A);
- __MM512_REDUCE_OP (min_pd);
- }
- /* Masked max_pd reduction of __A.  __A is first merged with a vector of
-    -infinity (-__builtin_inf ()) via _mm512_mask_mov_pd; per the Intel
-    documentation, lanes whose bit in __U is clear take that filler, so
-    they cannot be larger than any selected lane.  __MM512_REDUCE_OP
-    supplies the return statement.  */
- extern __inline double
- __attribute__ ((__gnu_inline__, __always_inline__, __artificial__))
- _mm512_mask_reduce_max_pd (__mmask8 __U, __m512d __A)
- {
- __A = _mm512_mask_mov_pd (_mm512_set1_pd (-__builtin_inf ()), __U, __A);
- __MM512_REDUCE_OP (max_pd);
- }
- /* Remove the reduction helper macro so it does not remain defined for
-    code that includes this header.  */
- #undef __MM512_REDUCE_OP
- /* If __DISABLE_AVX512F__ is defined at this point, undefine it and pop
-    the GCC option stack.  NOTE(review): the matching push_options is not
-    visible in this excerpt; presumably it sits near the top of the
-    header -- confirm.  */
- #ifdef __DISABLE_AVX512F__
- #undef __DISABLE_AVX512F__
- #pragma GCC pop_options
- #endif /* __DISABLE_AVX512F__ */
- #endif /* _AVX512FINTRIN_H_INCLUDED */
|