ngrams.csv 229 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227122812291230123112321233123412351236123712381239124012411242124312441245124612471248124912501251125212531254125512561257125812591260126112621263126412651266126712681269127012711272127312741275127612771278127912801281128212831284128512861287128812891290129112921293129412951296129712981299130013011302130313041305130613071308130913101311131213131314131513161317131813191320132113221323132413251326132713281329133013311332133313341335133613371338133913401341134213431344134513461347134813491350135113521353135413551356135713581359136013611362136313641365136613671368136913701371137213731374137513761377137813791380138113821383138413851386138713881389139013911392139313941395139613971398139914001401140214031404140514061407140814091410141114121413141414151416141714181419142014211422142314241425142614271428142914301431143214331434143514361437143814391440144114421443144414451446144714481449145014511452145314541455145614571458145914601461146214631464146514661467146814691470147114721473147414751476147714781479148014811482148314841485148614871488148914901491149214931494149514961497149814991500150115021503150415051506150715081509151015111512151315141515151615171518151915201521152215231524152515261527152815291530153115321533153415351536153715381539154015411542154315441545154615471548154915501551155215531554155515561557155815591560156115621563156415651566156715681569157015711572157315741575157615771578157915801581158215831584158515861587158815891590159115921593159415951596159715981599160016011602160316041605160616071608160916101611161216131614161516161617161816191620162116221623162416251626162716281629163016311632163316341635163616371638163916401641164216431644164516461647164816491650165116521653165416551656165716581659166016611662166316641665166616671668166916701671167216731674167516761677167816791680168116821683168416851686168716881689169016911692169316941695169616971698169917001701170217031704170517061707170817091710171117121713171417151716171717181719172017211722172317241725172617271728172917301731173217331734173517361737173817391740174117421743174417451746174717481749175017511752175317541755175617571758175917601761176217631764176517661767176817691770177117721773177417751776177717781779178017811782178317841785178617871788178917901791179217931794179517961797179817991800180118021803180418051806180718081809181018111812181318141815181618171818181918201821182218231824182518261827182818291830183118321833183418351836183718381839184018411842184318441845184618471848184918501851185218531854185518561857185818591860186118621863186418651866186718681869187018711872187318741875187618771878187918801881188218831884188518861887188818891890189118921893189418951896189718981899190019011902190319041905190619071908190919101911191219131914191519161917191819191920192119221923192419251926192719281929193019311932193319341935193619371938193919401941194219431944194519461947194819491950195119521953195419551956195719581959196019611962196319641965196619671968196919701971197219731974197519761977197819791980198119821983198419851986198719881989199019911992199319941995199619971998199920002001200220032004200520062007200820092010201120122013201420152016201720182019202020212022202320242025202620272028202920302031203220332034203520362037203820392040204120422043204420452046204720482049205020512052205320542055205620572058205920602061206220632064206520662067206820692070207120722073207420752076207720782079208020812082208320842085208620872088208920902091209220932094209520962097209820992100210121022103210421052106210721082109211021112112211321142115211621172118211921202121212221232124212521262127212821292130213121322133213421352136213721382139214021412142214321442145214621472148214921502151215221532154215521562157215821592160216121622163216421652166216721682169217021712172217321742175217621772178217921802181218221832184218521862187218821892190219121922193219421952196219721982199220022012202220322042205220622072208220922102211221222132214221522162217221822192220222122222223222422252226222722282229223022312232223322342235223622372238223922402241224222432244224522462247224822492250225122522253225422552256225722582259226022612262226322642265226622672268226922702271227222732274227522762277227822792280228122822283228422852286228722882289229022912292229322942295229622972298229923002301230223032304230523062307230823092310231123122313231423152316231723182319232023212322232323242325232623272328232923302331233223332334233523362337233823392340234123422343234423452346234723482349235023512352235323542355235623572358235923602361236223632364236523662367236823692370237123722373237423752376237723782379238023812382238323842385238623872388238923902391239223932394239523962397239823992400240124022403240424052406240724082409241024112412241324142415241624172418241924202421242224232424242524262427242824292430243124322433243424352436243724382439244024412442244324442445244624472448244924502451245224532454245524562457245824592460246124622463246424652466246724682469247024712472247324742475247624772478247924802481248224832484248524862487248824892490249124922493249424952496249724982499250025012502250325042505250625072508250925102511251225132514251525162517251825192520252125222523252425252526252725282529253025312532253325342535253625372538253925402541254225432544254525462547254825492550255125522553255425552556255725582559256025612562256325642565256625672568256925702571257225732574257525762577257825792580258125822583258425852586258725882589259025912592259325942595259625972598259926002601260226032604260526062607260826092610261126122613261426152616261726182619262026212622262326242625262626272628262926302631263226332634263526362637263826392640264126422643264426452646264726482649265026512652265326542655265626572658265926602661266226632664266526662667266826692670267126722673267426752676267726782679268026812682268326842685268626872688268926902691269226932694269526962697269826992700270127022703270427052706270727082709271027112712271327142715271627172718271927202721272227232724272527262727272827292730273127322733273427352736273727382739274027412742274327442745274627472748274927502751275227532754275527562757275827592760276127622763276427652766276727682769277027712772277327742775277627772778277927802781278227832784278527862787278827892790279127922793279427952796279727982799280028012802280328042805280628072808280928102811281228132814281528162817281828192820282128222823282428252826282728282829283028312832283328342835283628372838283928402841284228432844284528462847284828492850285128522853285428552856285728582859286028612862286328642865286628672868286928702871287228732874287528762877287828792880288128822883288428852886288728882889289028912892289328942895289628972898289929002901290229032904290529062907290829092910291129122913291429152916291729182919292029212922292329242925292629272928292929302931293229332934293529362937293829392940294129422943294429452946294729482949295029512952295329542955295629572958295929602961296229632964296529662967296829692970297129722973297429752976297729782979298029812982298329842985298629872988298929902991299229932994299529962997299829993000300130023003300430053006300730083009301030113012301330143015301630173018301930203021302230233024302530263027302830293030303130323033303430353036303730383039304030413042304330443045304630473048304930503051305230533054305530563057305830593060306130623063306430653066306730683069307030713072307330743075307630773078307930803081308230833084308530863087308830893090309130923093309430953096309730983099310031013102310331043105310631073108310931103111311231133114311531163117311831193120312131223123312431253126312731283129313031313132313331343135313631373138313931403141314231433144314531463147314831493150315131523153315431553156315731583159316031613162316331643165316631673168316931703171317231733174317531763177317831793180318131823183318431853186318731883189319031913192319331943195319631973198319932003201320232033204320532063207320832093210321132123213321432153216321732183219322032213222322332243225322632273228322932303231323232333234323532363237323832393240324132423243324432453246324732483249325032513252325332543255325632573258325932603261326232633264326532663267326832693270327132723273327432753276327732783279328032813282328332843285328632873288328932903291329232933294329532963297329832993300330133023303330433053306330733083309331033113312331333143315331633173318331933203321332233233324332533263327332833293330333133323333333433353336333733383339334033413342334333443345334633473348334933503351335233533354335533563357335833593360336133623363336433653366336733683369337033713372337333743375337633773378337933803381338233833384338533863387338833893390339133923393339433953396339733983399340034013402340334043405340634073408340934103411341234133414341534163417341834193420342134223423342434253426342734283429343034313432343334343435343634373438343934403441344234433444344534463447344834493450345134523453345434553456345734583459346034613462346334643465346634673468346934703471347234733474347534763477347834793480348134823483348434853486348734883489349034913492349334943495349634973498349935003501350235033504350535063507350835093510351135123513351435153516351735183519352035213522352335243525352635273528352935303531353235333534353535363537353835393540354135423543354435453546354735483549355035513552355335543555355635573558355935603561356235633564356535663567356835693570357135723573357435753576357735783579358035813582358335843585358635873588358935903591359235933594359535963597359835993600360136023603360436053606360736083609361036113612361336143615361636173618361936203621362236233624362536263627362836293630363136323633363436353636363736383639364036413642364336443645364636473648364936503651365236533654365536563657365836593660366136623663366436653666366736683669367036713672367336743675367636773678367936803681368236833684368536863687368836893690369136923693369436953696369736983699370037013702370337043705370637073708370937103711371237133714371537163717371837193720372137223723372437253726372737283729373037313732373337343735373637373738373937403741374237433744374537463747374837493750375137523753375437553756375737583759376037613762376337643765376637673768376937703771377237733774377537763777377837793780378137823783378437853786378737883789379037913792379337943795379637973798379938003801380238033804380538063807380838093810381138123813381438153816381738183819382038213822382338243825382638273828382938303831383238333834383538363837383838393840384138423843384438453846384738483849385038513852385338543855385638573858385938603861386238633864386538663867386838693870387138723873387438753876387738783879388038813882388338843885388638873888388938903891389238933894389538963897389838993900390139023903390439053906390739083909391039113912391339143915391639173918391939203921392239233924392539263927392839293930393139323933393439353936393739383939394039413942394339443945394639473948394939503951395239533954395539563957395839593960396139623963396439653966396739683969397039713972397339743975397639773978397939803981398239833984398539863987398839893990399139923993399439953996399739983999400040014002400340044005400640074008400940104011401240134014401540164017401840194020402140224023402440254026402740284029403040314032403340344035403640374038403940404041404240434044404540464047404840494050405140524053405440554056405740584059406040614062406340644065406640674068406940704071407240734074407540764077407840794080408140824083408440854086408740884089409040914092409340944095409640974098409941004101410241034104410541064107410841094110411141124113411441154116411741184119412041214122412341244125412641274128412941304131413241334134413541364137413841394140414141424143414441454146414741484149415041514152415341544155415641574158415941604161416241634164416541664167416841694170417141724173417441754176417741784179418041814182418341844185418641874188418941904191419241934194419541964197419841994200420142024203420442054206420742084209421042114212421342144215421642174218421942204221422242234224422542264227422842294230423142324233423442354236423742384239424042414242424342444245424642474248424942504251425242534254425542564257425842594260426142624263426442654266426742684269427042714272427342744275427642774278427942804281428242834284428542864287428842894290429142924293429442954296429742984299430043014302430343044305430643074308430943104311431243134314431543164317431843194320432143224323432443254326432743284329433043314332433343344335433643374338433943404341434243434344434543464347434843494350435143524353435443554356435743584359436043614362436343644365436643674368436943704371437243734374437543764377437843794380438143824383438443854386438743884389439043914392439343944395439643974398439944004401440244034404440544064407440844094410441144124413441444154416441744184419442044214422442344244425442644274428442944304431443244334434443544364437443844394440444144424443444444454446444744484449445044514452445344544455445644574458445944604461446244634464446544664467446844694470447144724473447444754476447744784479448044814482448344844485448644874488448944904491449244934494449544964497449844994500450145024503450445054506450745084509451045114512451345144515451645174518451945204521452245234524452545264527452845294530453145324533453445354536453745384539454045414542454345444545454645474548454945504551455245534554455545564557455845594560456145624563456445654566456745684569457045714572457345744575457645774578457945804581458245834584458545864587458845894590459145924593459445954596459745984599460046014602460346044605460646074608460946104611461246134614461546164617461846194620462146224623462446254626462746284629463046314632463346344635463646374638463946404641464246434644464546464647464846494650465146524653465446554656465746584659466046614662466346644665466646674668466946704671467246734674467546764677467846794680468146824683468446854686468746884689469046914692469346944695469646974698469947004701470247034704470547064707470847094710471147124713471447154716471747184719472047214722472347244725472647274728472947304731473247334734473547364737473847394740474147424743474447454746474747484749475047514752475347544755475647574758475947604761476247634764476547664767476847694770477147724773477447754776477747784779478047814782478347844785478647874788478947904791479247934794479547964797479847994800480148024803480448054806480748084809481048114812481348144815481648174818481948204821482248234824482548264827482848294830483148324833483448354836483748384839484048414842484348444845484648474848484948504851485248534854485548564857485848594860486148624863486448654866486748684869487048714872487348744875487648774878487948804881488248834884488548864887488848894890489148924893489448954896489748984899490049014902490349044905490649074908490949104911491249134914491549164917491849194920492149224923492449254926492749284929493049314932493349344935493649374938493949404941494249434944494549464947494849494950495149524953495449554956495749584959496049614962496349644965496649674968496949704971497249734974497549764977497849794980498149824983498449854986498749884989499049914992499349944995499649974998499950005001500250035004500550065007500850095010501150125013501450155016501750185019502050215022502350245025502650275028502950305031503250335034503550365037503850395040504150425043504450455046504750485049505050515052505350545055505650575058505950605061506250635064506550665067506850695070507150725073507450755076507750785079508050815082508350845085508650875088508950905091509250935094509550965097509850995100510151025103510451055106510751085109511051115112511351145115511651175118511951205121512251235124512551265127512851295130513151325133513451355136513751385139514051415142514351445145514651475148514951505151515251535154515551565157515851595160516151625163516451655166516751685169517051715172517351745175517651775178517951805181518251835184518551865187518851895190519151925193519451955196519751985199520052015202520352045205520652075208520952105211521252135214521552165217521852195220522152225223522452255226522752285229523052315232523352345235523652375238523952405241524252435244524552465247524852495250525152525253525452555256525752585259526052615262526352645265526652675268526952705271527252735274527552765277527852795280528152825283528452855286528752885289529052915292529352945295529652975298529953005301530253035304530553065307530853095310531153125313531453155316531753185319532053215322532353245325532653275328532953305331533253335334533553365337533853395340534153425343534453455346534753485349535053515352535353545355535653575358535953605361536253635364536553665367536853695370537153725373537453755376537753785379538053815382538353845385538653875388538953905391539253935394539553965397539853995400540154025403540454055406540754085409541054115412541354145415541654175418541954205421542254235424542554265427542854295430543154325433543454355436543754385439544054415442544354445445544654475448544954505451545254535454545554565457545854595460546154625463546454655466546754685469547054715472547354745475547654775478547954805481548254835484548554865487548854895490549154925493549454955496549754985499550055015502550355045505550655075508550955105511551255135514551555165517551855195520552155225523552455255526552755285529553055315532553355345535553655375538553955405541554255435544554555465547554855495550555155525553555455555556555755585559556055615562556355645565556655675568556955705571557255735574557555765577557855795580558155825583558455855586558755885589559055915592559355945595559655975598559956005601560256035604560556065607560856095610561156125613561456155616561756185619562056215622562356245625562656275628562956305631563256335634563556365637563856395640564156425643564456455646564756485649565056515652565356545655565656575658565956605661566256635664566556665667566856695670567156725673567456755676567756785679568056815682568356845685568656875688568956905691569256935694569556965697569856995700570157025703570457055706570757085709571057115712571357145715571657175718571957205721572257235724572557265727572857295730573157325733573457355736573757385739574057415742574357445745574657475748574957505751575257535754575557565757575857595760576157625763576457655766576757685769577057715772577357745775577657775778577957805781578257835784578557865787578857895790579157925793579457955796579757985799580058015802580358045805580658075808580958105811581258135814581558165817581858195820582158225823582458255826582758285829583058315832583358345835583658375838583958405841584258435844584558465847584858495850585158525853585458555856585758585859586058615862586358645865586658675868586958705871587258735874587558765877587858795880588158825883588458855886588758885889589058915892589358945895589658975898589959005901590259035904590559065907590859095910591159125913591459155916591759185919592059215922592359245925592659275928592959305931593259335934593559365937593859395940594159425943594459455946594759485949595059515952595359545955595659575958595959605961596259635964596559665967
  1. ngram,count,df,len
  2. semantic,8385,0.14385218480330766,8
  3. problem,8348,0.14321741666523702,7
  4. neural,8024,0.13765890648321297,6
  5. set,7899,0.13551441953027157,3
  6. training,7844,0.13457084527097737,8
  7. learning,7580,0.1300416888263652,8
  8. natural,7436,0.1275712398565767,7
  9. representation,7396,0.12688500403163547,14
  10. study,7346,0.12602720925045893,5
  11. novel,6844,0.11741494964744635,5
  12. english,6795,0.11657431076189333,7
  13. natural_language,6704,0.115013124260152,16
  14. baseline,6675,0.1145156032870696,8
  15. large,6555,0.11245689581224588,5
  16. knowledge,6474,0.11106726826673986,9
  17. automatic,6388,0.10959186124311619,9
  18. research,6362,0.10914580795690439,8
  19. classification,6217,0.10665820309149239,14
  20. human,6184,0.10609205853591587,5
  21. state_of_the_art,6157,0.10562884935408053,16
  22. dataset,6090,0.10447940434730395,7
  23. accuracy,5992,0.10279812657619791,8
  24. network,5892,0.10108253701384481,7
  25. domain,5880,0.10087666626636244,6
  26. datasets,5833,0.10007033917205647,8
  27. context,5812,0.09971006536396232,7
  28. improvement,5797,0.09945272692960937,11
  29. available,5789,0.09931547976462111,9
  30. structure,5781,0.09917823259963286,9
  31. technique,5724,0.0982003465490916,9
  32. type,5617,0.09636466571737377,4
  33. framework,5608,0.096210262656762,9
  34. several,5539,0.09502650585873836,7
  35. use,5497,0.09430595824255006,3
  36. application,5483,0.09406577570382062,11
  37. algorithm,5379,0.09228156255897339,9
  38. annotation,5360,0.0919556005421263,10
  39. linguistic,5313,0.09114927344782034,10
  40. first,5312,0.09113211755219681,5
  41. source,5261,0.09025716687539673,6
  42. resource,5234,0.0897939576935614,8
  43. relation,5097,0.08744359999313764,8
  44. many,5092,0.08735782051501999,4
  45. processing,5081,0.08716910566316115,10
  46. previous,5044,0.0865343375250905,8
  47. quality,5027,0.08624268729949047,7
  48. experimental,4812,0.0825541697404313,12
  49. document,4773,0.08188508981111359,8
  50. lexical,4722,0.08101013913431351,7
  51. score,4660,0.07994647360565459,5
  52. extraction,4655,0.07986069412753692,10
  53. user,4595,0.07883134039012507,4
  54. best,4585,0.07865978143388976,4
  55. time,4563,0.07828235173017208,4
  56. order,4519,0.0775274923227367,5
  57. nlp,4515,0.07745886874024259,3
  58. pair,4511,0.07739024515774846,4
  59. various,4456,0.07644667089845425,7
  60. question,4451,0.0763608914203366,8
  61. important,4412,0.07569181149101889,9
  62. generation,4373,0.07502273156170118,10
  63. statistical,4361,0.0748168608142188,11
  64. process,4344,0.07452521058861877,7
  65. syntactic,4322,0.0741477808849011,9
  66. term,4310,0.07394191013741873,4
  67. multiple,4305,0.07385613065930106,8
  68. entity,4291,0.07361594812057164,6
  69. number,4287,0.07354732453807751,6
  70. better,4260,0.07308411535624217,6
  71. simple,4250,0.07291255640000686,6
  72. standard,4206,0.07215769699257149,8
  73. input,4090,0.0701676131002419,5
  74. detection,4024,0.06903532398908885,9
  75. recent,3982,0.06831477637290055,6
  76. challenge,3963,0.06798881435605346,9
  77. experimental_result,3960,0.06793734666918287,19
  78. case,3956,0.06786872308668875,4
  79. way,3953,0.06781725539981814,3
  80. test,3952,0.06780009950419462,4
  81. target,3915,0.06716533136612397,6
  82. dependency,3884,0.0666334986017945,10
  83. level,3870,0.06639331606306507,5
  84. error,3783,0.06490075314381788,5
  85. speech,3722,0.06385424351078248,6
  86. prediction,3648,0.06258470723464118,10
  87. recognition,3647,0.06256755133901766,11
  88. significant,3620,0.062104342157182316,11
  89. tool,3616,0.06203571857468819,4
  90. effective,3569,0.061229391480382235,9
  91. neural_network,3520,0.06038875259482921,14
  92. article,3431,0.05886187788433495,7
  93. similarity,3407,0.05845013638937021,10
  94. architecture,3302,0.05664876734889945,12
  95. output,3288,0.05640858481017001,6
  96. example,3281,0.0562884935408053,7
  97. classifier,3270,0.05609977868894646,10
  98. embeddings,3260,0.05592821973271114,10
  99. content,3245,0.055670881298358184,7
  100. current,3227,0.05536207517713462,7
  101. natural_language_processing,3190,0.05472730703906398,27
  102. high,3160,0.054212630170358045,4
  103. part,3118,0.05349208255416974,4
  104. issue,3107,0.0533033677023109,5
  105. second,3096,0.05311465285045206,6
  106. specific,3094,0.053080341059205,8
  107. development,3081,0.052857314416099095,11
  108. chinese,3041,0.052171078591157855,7
  109. particular,3006,0.051570622244334265,10
  110. parsing,2946,0.05054126850692241,7
  111. et,2929,0.05024961828132238,2
  112. attention,2920,0.050095215220710594,9
  113. form,2913,0.04997512395134588,4
  114. present,2903,0.04980356499511057,7
  115. metric,2888,0.049546226560757606,6
  116. unsupervised,2883,0.04946044708263995,12
  117. multilingual,2882,0.04944329118701642,12
  118. benchmark,2870,0.049237420439534045,9
  119. deep,2850,0.04889430252706343,4
  120. le,2837,0.048671275883957525,2
  121. phrase,2819,0.048362469762733964,6
  122. vector,2787,0.04781348110278097,6
  123. strategy,2778,0.04765907804216919,8
  124. sequence,2764,0.04741889550343976,8
  125. due,2753,0.04723018065158092,3
  126. similar,2746,0.0471100893822162,7
  127. possible,2741,0.047024309904098546,8
  128. parser,2710,0.04649247713976908,6
  129. addition,2695,0.046235138705416116,8
  130. parallel,2691,0.04616651512292199,8
  131. social,2684,0.046046423853557276,6
  132. general,2639,0.04527440855049838,7
  133. grammar,2627,0.04506853780301601,7
  134. space,2627,0.04506853780301601,5
  135. combination,2623,0.04499991422052188,11
  136. complex,2612,0.04481119936866304,7
  137. identification,2611,0.04479404347303951,14
  138. topic,2608,0.044742575786168914,5
  139. state,2605,0.04469110809929833,5
  140. role,2604,0.044673952203674795,4
  141. dialogue,2587,0.044382301978074766,8
  142. tree,2587,0.044382301978074766,4
  143. sentiment,2573,0.04414211943934533,9
  144. component,2568,0.044056339961227674,9
  145. effectiveness,2547,0.043696066153133525,13
  146. small,2537,0.04352450719689822,5
  147. step,2534,0.04347303951002762,4
  148. setting,2500,0.042889739058827564,7
  149. computational,2492,0.04275249189383932,13
  150. common,2491,0.04273533599821579,6
  151. single,2480,0.04254662114635695,6
  152. able,2477,0.04249515345948635,4
  153. graph,2467,0.042323594503251044,5
  154. useful,2440,0.041860385321415707,6
  155. rule,2416,0.04144864382645096,4
  156. amount,2403,0.041225617183345054,6
  157. point,2353,0.040367822402168504,5
  158. inference,2310,0.03963011889035667,9
  159. textual,2302,0.039492871725368424,7
  160. pattern,2302,0.039492871725368424,7
  161. web,2286,0.039218377395391926,3
  162. label,2274,0.039012506647909555,5
  163. strong,2257,0.038720856422309526,6
  164. expression,2246,0.038532141570450686,10
  165. effect,2237,0.03837773850983891,6
  166. search,2222,0.03812040007548594,6
  167. main,2218,0.038051776492991816,4
  168. additional,2215,0.03800030880612122,10
  169. understanding,2213,0.03796599701487416,13
  170. alignment,2212,0.03794884111925063,9
  171. online,2210,0.03791452932800357,6
  172. aspect,2200,0.037742970371768256,6
  173. meaning,2196,0.03767434678927414,7
  174. measure,2195,0.037657190893650605,7
  175. bleu,2174,0.03729691708555645,4
  176. news,2162,0.03709104633807408,4
  177. mt,2159,0.037039578651203484,2
  178. medium,2154,0.03695379917308583,6
  179. class,2150,0.03688517559059171,5
  180. event,2149,0.036868019694968175,5
  181. function,2143,0.03676508432122699,8
  182. field,2135,0.03662783715623874,5
  183. efficient,2117,0.03631903103501518,9
  184. goal,2116,0.036301875139391655,4
  185. show,2108,0.0361646279744034,4
  186. large_scale,2099,0.036010224913791626,11
  187. description,2081,0.035701418792568065,11
  188. relevant,2074,0.03558132752320335,8
  189. comparison,2058,0.035306833193226854,10
  190. lexicon,2050,0.0351695860282386,7
  191. semantics,2039,0.03498087117637976,9
  192. base,2032,0.03486077990701505,4
  193. mechanism,2031,0.034843624011391516,9
  194. selection,2012,0.034517661994544424,9
  195. effort,2001,0.034328947142685584,6
  196. pre_trained,1993,0.03419169997769734,11
  197. difference,1991,0.034157388186450276,10
  198. year,1986,0.03407160870833262,4
  199. future,1975,0.03388289385647378,6
  200. collection,1968,0.03376280258710906,10
  201. concept,1967,0.033745646691485526,7
  202. interaction,1967,0.033745646691485526,11
  203. good,1961,0.033642711317744343,4
  204. difficult,1960,0.03362555542212081,9
  205. potential,1948,0.03341968467463844,9
  206. variety,1944,0.033351061092144314,7
  207. statistical_machine,1936,0.03321381392715607,19
  208. construction,1930,0.03311087855341488,12
  209. code,1928,0.03307656676216782,4
  210. bert,1921,0.0329564754928031,4
  211. distribution,1915,0.032853540119061914,12
  212. statistical_machine_translation,1899,0.032579045789085416,31
  213. traditional,1894,0.032493266310967765,11
  214. property,1886,0.03235601914597951,8
  215. need,1882,0.032287395563485394,4
  216. retrieval,1880,0.03225308377223833,9
  217. discourse,1879,0.0322359278766148,9
  218. solution,1878,0.03221877198099127,8
  219. key,1872,0.03211583660725008,3
  220. individual,1869,0.03206436892037949,10
  221. overall,1868,0.03204721302475596,7
  222. empirical,1866,0.032012901233508896,9
  223. transformer,1865,0.031995745337885365,11
  224. category,1853,0.03178987459040299,8
  225. al.,1851,0.03175556279915593,3
  226. sense,1825,0.031309509512944124,5
  227. de,1813,0.031103638765461752,2
  228. supervised,1808,0.031017859287344095,10
  229. comparable,1784,0.030606117792379352,10
  230. ability,1781,0.030554650105508757,7
  231. modeling,1773,0.03041740294052051,8
  232. original,1765,0.030280155775532263,8
  233. relationship,1759,0.030177220401791077,12
  234. range,1746,0.02995419375868517,5
  235. parameter,1744,0.02991988196743811,9
  236. rich,1738,0.029816946593696925,4
  237. community,1733,0.029731167115579268,9
  238. candidate,1733,0.029731167115579268,9
  239. competitive,1732,0.029714011219955736,11
  240. french,1731,0.029696855324332208,6
  241. morphological,1727,0.029628231741838082,13
  242. social_medium,1723,0.02955960815934396,13
  243. project,1722,0.029542452263720428,7
  244. summarization,1720,0.029508140472473365,13
  245. bilingual,1716,0.029439516889979242,9
  246. technology,1707,0.02928511382936746,10
  247. contribution,1696,0.02909639897750862,12
  248. precision,1695,0.02907924308188509,9
  249. extensive,1692,0.029027775395014496,9
  250. dictionary,1690,0.028993463603767436,10
  251. higher,1688,0.028959151812520373,6
  252. manual,1681,0.028839060543155656,6
  253. la,1669,0.028633189795673284,2
  254. size,1667,0.02859887800442622,4
  255. constraint,1660,0.028478786735061504,10
  256. verb,1660,0.028478786735061504,4
  257. open,1651,0.028324383674449723,4
  258. answer,1649,0.028290071883202664,6
  259. robust,1645,0.028221448300708538,6
  260. impact,1644,0.028204292405085006,6
  261. e.g.,1639,0.028118512926967352,4
  262. segmentation,1635,0.02804988934447323,12
  263. towards,1629,0.027946953970732043,7
  264. query,1620,0.027792550910120263,5
  265. instance,1616,0.02772392732762614,8
  266. support,1602,0.027483744788896706,7
  267. average,1594,0.027346497623908457,7
  268. advantage,1587,0.02722640635454374,9
  269. scheme,1585,0.027192094563296677,6
  270. disambiguation,1582,0.027140626876426086,14
  271. german,1582,0.027140626876426086,6
  272. contextual,1579,0.02708915918955549,10
  273. transfer,1577,0.027054847398308428,8
  274. neural_machine,1569,0.02691760023332018,14
  275. neural_machine_translation,1559,0.02674604127708487,26
  276. fact,1556,0.026694573590214276,4
  277. previous_work,1554,0.026660261798967216,13
  278. utterance,1544,0.026488702842731904,9
  279. scenario,1541,0.026437235155861313,8
  280. adaptation,1535,0.026334299782120124,10
  281. une,1532,0.026282832095249533,3
  282. un,1524,0.026145584930261284,2
  283. nous,1515,0.025991181869649504,4
  284. submission,1510,0.02590540239153185,10
  285. one,1506,0.025836778809037727,3
  286. phenomenon,1500,0.02573384343529654,10
  287. character,1499,0.02571668753967301,9
  288. reference,1497,0.025682375748425947,9
  289. monolingual,1495,0.025648063957178883,11
  290. evidence,1494,0.025630908061555352,8
  291. dans,1494,0.025630908061555352,4
  292. joint,1490,0.02556228447906123,5
  293. argument,1484,0.025459349105320044,8
  294. version,1481,0.02540788141844945,7
  295. speaker,1477,0.025339257835955326,7
  296. token,1475,0.025304946044708263,5
  297. value,1472,0.025253478357837672,5
  298. annotated,1468,0.025184854775343546,9
  299. rate,1464,0.025116231192849423,4
  300. team,1460,0.025047607610355297,4
  301. objective,1459,0.02503045171473177,9
  302. limited,1455,0.024961828132237643,7
  303. people,1449,0.024858892758496457,6
  304. unit,1445,0.024790269176002334,4
  305. spoken,1442,0.02473880148913174,6
  306. prior,1438,0.024670177906637617,5
  307. group,1437,0.024653022011014086,5
  308. purpose,1434,0.02460155432414349,7
  309. par,1432,0.02456724253289643,3
  310. finding,1423,0.02441283947228465,7
  311. tweet,1423,0.02441283947228465,5
  312. conversation,1420,0.024361371785414056,12
  313. correlation,1418,0.024327059994166997,11
  314. cross_lingual,1415,0.024275592307296402,13
  315. accurate,1407,0.024138345142308153,8
  316. hierarchical,1404,0.024086877455437562,12
  317. related,1397,0.023966786186072845,7
  318. random,1396,0.023949630290449313,6
  319. complexity,1382,0.02370944775171988,10
  320. alternative,1373,0.0235550446911081,11
  321. decision,1372,0.023537888795484567,8
  322. lack,1368,0.023469265212990444,4
  323. kind,1367,0.023452109317366913,4
  324. popular,1365,0.02341779752611985,7
  325. short,1358,0.023297706256755132,5
  326. design,1355,0.02324623856988454,6
  327. summary,1354,0.02322908267426101,7
  328. gain,1351,0.023177614987390415,4
  329. characteristic,1349,0.023143303196143356,14
  330. response,1343,0.02304036782240217,8
  331. literature,1342,0.023023211926778638,10
  332. diverse,1340,0.022988900135531575,7
  333. twitter,1329,0.022800185283672735,7
  334. major,1327,0.022765873492425672,5
  335. treebank,1324,0.022714405805555078,8
  336. grammatical,1323,0.02269724990993155,11
  337. sample,1317,0.02259431453619036,6
  338. module,1317,0.02259431453619036,6
  339. significant_improvement,1314,0.02254284684931977,23
  340. local,1314,0.02254284684931977,5
  341. relative,1314,0.02254284684931977,8
  342. low,1313,0.022525690953696238,3
  343. f1,1313,0.022525690953696238,2
  344. tag,1311,0.022491379162449174,3
  345. direction,1309,0.022457067371202115,9
  346. art,1306,0.02240559968433152,3
  347. factor,1299,0.022285508414966803,6
  348. researcher,1299,0.022285508414966803,10
  349. area,1295,0.02221688483247268,4
  350. interest,1292,0.022165417145602086,8
  351. implementation,1291,0.022148261249978554,14
  352. latent,1286,0.0220624817718609,6
  353. final,1286,0.0220624817718609,5
  354. probability,1282,0.021993858189366777,11
  355. noun,1282,0.021993858189366777,4
  356. layer,1278,0.02192523460687265,5
  357. aim,1275,0.02187376692000206,3
  358. world,1269,0.021770831546260874,5
  359. importance,1266,0.02171936385939028,10
  360. low_resource,1261,0.021633584381272625,12
  361. theory,1257,0.0215649607987785,6
  362. long,1257,0.0215649607987785,4
  363. much,1253,0.021496337216284377,4
  364. tagging,1250,0.021444869529413782,7
  365. procedure,1250,0.021444869529413782,9
  366. japanese,1245,0.021359090051296128,8
  367. database,1237,0.02122184288630788,8
  368. real,1234,0.021170375199437288,4
  369. idea,1233,0.021153219303813756,4
  370. variation,1230,0.02110175161694316,9
  371. memory,1228,0.021067439825696102,6
  372. correct,1223,0.020981660347578444,7
  373. resolution,1222,0.020964504451954913,10
  374. hypothesis,1215,0.020844413182590196,10
  375. methodology,1210,0.02075863370447254,11
  376. mean,1206,0.02069001012197842,4
  377. arabic,1205,0.020672854226354887,6
  378. focus,1201,0.020604230643860764,5
  379. list,1201,0.020604230643860764,4
  380. real_world,1195,0.020501295270119575,10
  381. change,1194,0.020484139374496047,6
  382. global,1192,0.020449827583248984,6
  383. account,1191,0.020432671687625453,7
  384. certain,1188,0.020381204000754858,7
  385. sur,1187,0.02036404810513133,3
  386. participant,1187,0.02036404810513133,11
  387. full,1185,0.020329736313884267,4
  388. linear,1185,0.020329736313884267,6
  389. pour,1184,0.020312580418260735,4
  390. coverage,1183,0.020295424522637204,8
  391. image,1183,0.020295424522637204,5
  392. challenging,1181,0.02026111273139014,11
  393. wordnet,1179,0.02022680094014308,7
  394. wide,1175,0.020158177357648955,4
  395. basic,1152,0.019763591758307743,5
  396. crucial,1144,0.019626344593319495,7
  397. smt,1138,0.01952340921957831,3
  398. interface,1133,0.01943762974146065,9
  399. end,1131,0.01940331795021359,3
  400. ensemble,1130,0.01938616205459006,8
  401. cost,1129,0.01936900615896653,4
  402. bias,1127,0.019334694367719465,4
  403. distributional,1125,0.019300382576472406,14
  404. probabilistic,1124,0.019283226680848874,13
  405. dynamic,1123,0.019266070785225343,7
  406. success,1122,0.01924891488960181,7
  407. benefit,1122,0.01924891488960181,7
  408. platform,1121,0.01923175899397828,8
  409. difficulty,1120,0.019214603098354748,10
  410. wikipedia,1118,0.01918029130710769,9
  411. insight,1117,0.019163135411484157,7
  412. nature,1116,0.019145979515860626,6
  413. vocabulary,1114,0.019111667724613562,10
  414. recurrent,1114,0.019111667724613562,9
  415. respect,1113,0.01909451182899003,7
  416. perspective,1106,0.018974420559625314,11
  417. frequency,1103,0.018922952872754722,9
  418. recall,1101,0.01888864108150766,6
  419. end_to_end,1101,0.01888864108150766,10
  420. high_quality,1100,0.018871485185884128,12
  421. positive,1100,0.018871485185884128,8
  422. promising,1099,0.018854329290260596,9
  423. downstream,1093,0.01875139391651941,10
  424. opinion,1092,0.018734238020895883,7
  425. practical,1090,0.01869992622964882,9
  426. fine_grained,1089,0.018682770334025288,12
  427. visual,1088,0.018665614438401756,6
  428. appropriate,1086,0.018631302647154693,11
  429. preliminary,1085,0.018614146751531165,11
  430. du,1084,0.018596990855907634,2
  431. choice,1078,0.018494055482166448,6
  432. scale,1078,0.018494055482166448,5
  433. name,1078,0.018494055482166448,4
  434. public,1074,0.018425431899672322,6
  435. pipeline,1074,0.018425431899672322,8
  436. negative,1069,0.018339652421554668,8
  437. behavior,1067,0.018305340630307605,8
  438. gap,1066,0.018288184734684073,3
  439. syntax,1064,0.018253872943437013,6
  440. external,1061,0.01820240525656642,8
  441. consistent,1058,0.018150937569695828,10
  442. answering,1056,0.018116625778448765,9
  443. initial,1050,0.01801369040470758,7
  444. learner,1047,0.017962222717836984,7
  445. phrase_based,1046,0.017945066822213453,12
  446. review,1044,0.017910755030966393,6
  447. deep_learning,1038,0.017807819657225204,13
  448. po,1037,0.017790663761601676,2
  449. loss,1033,0.01772204017910755,4
  450. conditional,1031,0.017687728387860487,11
  451. generative,1031,0.017687728387860487,10
  452. e.g,1027,0.017619104805366364,3
  453. conversational,1026,0.017601948909742832,14
  454. author,1025,0.0175847930141193,6
  455. usage,1022,0.01753332532724871,5
  456. little,1021,0.017516169431625178,6
  457. environment,1021,0.017516169431625178,11
  458. mining,1020,0.017499013536001647,6
  459. ce,1020,0.017499013536001647,2
  460. linguistics,1013,0.01737892226663693,11
  461. communication,1009,0.017310298684142807,13
  462. supervision,1009,0.017310298684142807,11
  463. variant,1009,0.017310298684142807,7
  464. explicit,1008,0.017293142788519275,8
  465. expert,1007,0.017275986892895744,6
  466. limitation,1007,0.017275986892895744,10
  467. length,1006,0.017258830997272212,6
  468. basis,1005,0.01724167510164868,5
  469. part_of_speech,1004,0.01722451920602515,14
  470. parallel_corpus,997,0.01710442793666043,15
  471. noisy,994,0.01705296024978984,5
  472. generalization,994,0.01705296024978984,14
  473. ranking,988,0.016950024876048655,7
  474. necessary,988,0.016950024876048655,9
  475. labeling,987,0.016932868980425123,8
  476. distance,986,0.01691571308480159,8
  477. top,986,0.01691571308480159,3
  478. access,986,0.01691571308480159,6
  479. hybrid,986,0.01691571308480159,6
  480. contrast,986,0.01691571308480159,8
  481. mention,984,0.01688140129355453,7
  482. extension,981,0.016829933606683938,9
  483. ii,976,0.016744154128566283,2
  484. interpretation,976,0.016744154128566283,14
  485. acquisition,974,0.01670984233731922,11
  486. nmt,972,0.016675530546072157,3
  487. agreement,970,0.016641218754825094,9
  488. temporal,966,0.01657259517233097,8
  489. rule_based,966,0.01657259517233097,10
  490. estimation,965,0.01655543927670744,10
  491. structural,965,0.01655543927670744,10
  492. report,963,0.016521127485460377,6
  493. annotator,961,0.016486815694213317,9
  494. gold,960,0.016469659798589786,4
  495. est,959,0.016452503902966254,3
  496. essential,958,0.016435348007342723,9
  497. degree,954,0.0163667244248486,6
  498. reduction,953,0.01634956852922507,9
  499. service,949,0.016280944946730946,7
  500. larger,948,0.016263789051107414,6
  501. different_language,948,0.016263789051107414,18
  502. position,947,0.016246633155483883,8
  503. spanish,945,0.01621232136423682,7
  504. i.e,941,0.016143697781742697,3
  505. condition,931,0.015972138825507385,9
  506. abstract,929,0.015937827034260322,8
  507. neural_model,922,0.015817735764895608,12
  508. universal,920,0.015783423973648545,9
  509. capability,917,0.01573195628677795,10
  510. emotion,917,0.01573195628677795,7
  511. weight,915,0.01569764449553089,6
  512. style,911,0.015629020913036765,5
  513. human_evaluation,910,0.015611865017413235,16
  514. decoder,907,0.01556039733054264,7
  515. structured,905,0.015526085539295579,10
  516. efficiency,903,0.015491773748048518,10
  517. scientific,903,0.015491773748048518,10
  518. subject,902,0.015474617852424986,7
  519. independent,901,0.015457461956801455,11
  520. engine,897,0.01538883837430733,6
  521. view,892,0.015303058896189676,4
  522. progress,891,0.015285903000566144,8
  523. detail,889,0.015251591209319083,6
  524. manner,887,0.01521727941807202,6
  525. medical,886,0.01520012352244849,7
  526. stage,886,0.01520012352244849,5
  527. coreference,882,0.015131499939954366,11
  528. detailed,881,0.015114344044330834,8
  529. corresponding,879,0.015080032253083773,13
  530. building,876,0.01502856456621318,8
  531. practice,876,0.01502856456621318,8
  532. suitable,876,0.01502856456621318,8
  533. object,875,0.015011408670589648,6
  534. encoder,873,0.014977096879342585,7
  535. open_source,873,0.014977096879342585,11
  536. creation,870,0.014925629192471992,8
  537. fine_tuning,868,0.014891317401224931,11
  538. semeval,867,0.0148741615056014,7
  539. student,867,0.0148741615056014,7
  540. que,866,0.014857005609977868,3
  541. embedding,865,0.014839849714354338,9
  542. definition,864,0.014822693818730807,10
  543. automated,863,0.014805537923107275,9
  544. paradigm,862,0.014788382027483745,8
  545. correction,862,0.014788382027483745,10
  546. multimodal,861,0.014771226131860214,10
  547. segment,861,0.014771226131860214,7
  548. increase,860,0.014754070236236682,8
  549. discussion,860,0.014754070236236682,10
  550. attempt,854,0.014651134862495497,7
  551. dialog,853,0.014633978966871965,6
  552. substantial,853,0.014633978966871965,11
  553. reason,851,0.014599667175624904,6
  554. modern,851,0.014599667175624904,6
  555. assessment,845,0.014496731801883718,10
  556. great,844,0.014479575906260186,5
  557. nlp_task,841,0.014428108219389594,8
  558. biomedical,840,0.014410952323766062,10
  559. comprehension,840,0.014410952323766062,13
  560. regression,839,0.01439379642814253,10
  561. unlabeled,836,0.014342328741271938,9
  562. binary,836,0.014342328741271938,6
  563. variable,836,0.014342328741271938,8
  564. convolutional,835,0.014325172845648408,13
  565. interactive,834,0.014308016950024876,11
  566. cluster,828,0.01420508157628369,7
  567. discriminative,828,0.01420508157628369,14
  568. hand,827,0.014187925680660159,4
  569. maximum,822,0.014102146202542503,7
  570. mapping,820,0.014067834411295442,7
  571. critical,820,0.014067834411295442,8
  572. al,815,0.013982054933177786,2
  573. reading,814,0.013964899037554256,7
  574. comprehensive,814,0.013964899037554256,13
  575. generated,813,0.013947743141930724,9
  576. university,812,0.013930587246307193,10
  577. agent,811,0.013913431350683663,5
  578. conventional,810,0.013896275455060132,12
  579. subset,809,0.0138791195594366,6
  580. computer,809,0.0138791195594366,8
  581. cet,806,0.013827651872566007,3
  582. parse,805,0.013810495976942476,5
  583. n_gram,805,0.013810495976942476,6
  584. judgment,802,0.013759028290071883,8
  585. signal,800,0.013724716498824821,6
  586. heuristic,799,0.01370756060320129,9
  587. formal,799,0.01370756060320129,6
  588. assumption,796,0.013656092916330697,10
  589. reasoning,793,0.013604625229460104,9
  590. augmentation,790,0.013553157542589511,12
  591. action,789,0.01353600164696598,6
  592. series,787,0.013501689855718918,6
  593. clustering,787,0.013501689855718918,10
  594. others,787,0.013501689855718918,6
  595. ambiguity,786,0.013484533960095387,9
  596. place,785,0.013467378064471855,5
  597. extensive_experiment,783,0.013433066273224794,20
  598. product,783,0.013433066273224794,7
  599. polarity,782,0.013415910377601262,8
  600. unified,781,0.01339875448197773,7
  601. subtask,781,0.01339875448197773,7
  602. unseen,778,0.013347286795107138,6
  603. qa,777,0.013330130899483608,2
  604. message,777,0.013330130899483608,7
  605. integration,776,0.013312975003860077,11
  606. ontology,776,0.013312975003860077,8
  607. core,774,0.013278663212613015,4
  608. robustness,774,0.013278663212613015,10
  609. yield,773,0.013261507316989484,5
  610. software,769,0.01319288373449536,8
  611. element,769,0.01319288373449536,7
  612. induction,768,0.013175727838871828,9
  613. generic,768,0.013175727838871828,7
  614. state_of_the_art_performance,763,0.013089948360754174,28
  615. semantic_role,761,0.01305563656950711,13
  616. lstm,758,0.013004168882636518,4
  617. attribute,757,0.012987012987012988,9
  618. item,757,0.012987012987012988,4
  619. performs,756,0.012969857091389456,8
  620. pretrained,755,0.012952701195765925,10
  621. f1_score,755,0.012952701195765925,8
  622. experience,754,0.012935545300142393,10
  623. strong_baseline,754,0.012935545300142393,15
  624. post,749,0.012849765822024739,4
  625. capable,742,0.012729674552660022,7
  626. clinical,742,0.012729674552660022,8
  627. morphology,742,0.012729674552660022,10
  628. format,742,0.012729674552660022,6
  629. improved,740,0.01269536276141296,8
  630. participation,739,0.012678206865789429,13
  631. novel_approach,738,0.012661050970165897,14
  632. last,736,0.012626739178918836,4
  633. implicit,736,0.012626739178918836,8
  634. situation,735,0.012609583283295304,9
  635. domain_specific,734,0.012592427387671773,15
  636. surface,733,0.012575271492048243,7
  637. span,732,0.012558115596424712,4
  638. statistic,732,0.012558115596424712,9
  639. past,729,0.012506647909554119,4
  640. investigation,727,0.012472336118307056,13
  641. likely,726,0.012455180222683526,6
  642. recent_year,725,0.012438024327059994,11
  643. ner,725,0.012438024327059994,3
  644. paraphrase,723,0.012403712535812931,10
  645. easy,723,0.012403712535812931,4
  646. science,722,0.012386556640189401,7
  647. large_amount,722,0.012386556640189401,12
  648. hard,720,0.012352244848942338,4
  649. workshop,719,0.012335088953318809,8
  650. sens,718,0.012317933057695277,4
  651. unique,718,0.012317933057695277,6
  652. multi_task,717,0.012300777162071745,10
  653. tagger,710,0.012180685892707028,6
  654. relevance,709,0.012163529997083498,9
  655. link,707,0.012129218205836435,4
  656. recent_work,707,0.012129218205836435,11
  657. direct,707,0.012129218205836435,6
  658. expensive,707,0.012129218205836435,9
  659. comment,703,0.012060594623342311,7
  660. flexible,702,0.012043438727718781,8
  661. successful,701,0.01202628283209525,10
  662. influence,700,0.012009126936471718,9
  663. reliable,698,0.011974815145224657,8
  664. boundary,694,0.011906191562730532,8
  665. quantitative,694,0.011906191562730532,12
  666. optimization,694,0.011906191562730532,12
  667. next,692,0.011871879771483471,4
  668. sentence_level,692,0.011871879771483471,14
  669. association,691,0.01185472387585994,11
  670. track,690,0.011837567980236408,5
  671. decoding,690,0.011837567980236408,8
  672. semi_supervised,690,0.011837567980236408,15
  673. production,689,0.011820412084612876,10
  674. entry,688,0.011803256188989347,5
  675. special,687,0.011786100293365815,7
  676. dimension,686,0.011768944397742283,9
  677. optimal,684,0.011734632606495222,7
  678. hidden,683,0.01171747671087169,6
  679. operation,681,0.01168316491962463,9
  680. constituent,681,0.01168316491962463,11
  681. adversarial,675,0.011580229545883444,11
  682. noise,673,0.01154591775463638,5
  683. d'un,673,0.01154591775463638,4
  684. pre_trained_language,672,0.011528761859012849,20
  685. health,672,0.011528761859012849,6
  686. automatique,672,0.011528761859012849,11
  687. lower,667,0.011442982380895195,5
  688. cognitive,666,0.011425826485271663,9
  689. diversity,666,0.011425826485271663,9
  690. advance,665,0.011408670589648133,7
  691. free,665,0.011408670589648133,4
  692. continuous,664,0.011391514694024602,10
  693. bidirectional,663,0.01137435879840107,13
  694. observation,662,0.011357202902777539,11
  695. different_type,661,0.011340047007154009,14
  696. third,661,0.011340047007154009,5
  697. overview,661,0.011340047007154009,8
  698. frame,661,0.011340047007154009,5
  699. f_score,659,0.011305735215906946,7
  700. fundamental,657,0.011271423424659885,11
  701. systematic,657,0.011271423424659885,10
  702. criterion,656,0.011254267529036353,9
  703. genre,653,0.01120279984216576,5
  704. state_of_the_art_result,652,0.011185643946542229,23
  705. requirement,650,0.011151332155295167,11
  706. pre_trained_language_model,650,0.011151332155295167,26
  707. semantic_similarity,650,0.011151332155295167,19
  708. feedback,649,0.011134176259671636,8
  709. subtasks,649,0.011134176259671636,8
  710. notion,649,0.011134176259671636,6
  711. raw,648,0.011117020364048106,3
  712. complete,647,0.011099864468424574,8
  713. other_language,644,0.011048396781553982,14
  714. cette,644,0.011048396781553982,5
  715. matching,643,0.01103124088593045,8
  716. svm,643,0.01103124088593045,3
  717. large_corpus,641,0.010996929094683389,12
  718. share,641,0.010996929094683389,5
  719. informative,640,0.010979773199059857,11
  720. power,640,0.010979773199059857,5
  721. shallow,639,0.010962617303436326,7
  722. stateof_the_art,636,0.010911149616565733,15
  723. minimal,636,0.010911149616565733,7
  724. text_classification,636,0.010911149616565733,19
  725. whole,634,0.010876837825318671,5
  726. comparative,631,0.010825370138448078,11
  727. native,630,0.010808214242824547,6
  728. entailment,630,0.010808214242824547,10
  729. distinct,629,0.010791058347201015,8
  730. theoretical,628,0.010773902451577484,11
  731. predicate,627,0.010756746555953954,9
  732. interesting,626,0.010739590660330423,11
  733. transformation,623,0.01068812297345983,14
  734. total,620,0.010636655286589237,5
  735. extent,620,0.010636655286589237,6
  736. transformer_based,618,0.010602343495342174,17
  737. sequential,616,0.010568031704095112,10
  738. utility,615,0.01055087580847158,7
  739. qualitative,612,0.010499408121600988,11
  740. node,611,0.010482252225977456,4
  741. pre_training,611,0.010482252225977456,12
  742. ambiguous,609,0.010447940434730395,9
  743. synthetic,607,0.010413628643483334,9
  744. history,606,0.010396472747859802,7
  745. wmt,606,0.010396472747859802,3
  746. smaller,605,0.01037931685223627,7
  747. latter,605,0.01037931685223627,6
  748. cue,603,0.01034500506098921,3
  749. preference,602,0.010327849165365678,10
  750. zero_shot,602,0.010327849165365678,9
  751. material,601,0.010310693269742146,8
  752. transcription,600,0.010293537374118616,13
  753. phase,600,0.010293537374118616,5
  754. principle,599,0.010276381478495085,9
  755. entropy,599,0.010276381478495085,7
  756. qui,599,0.010276381478495085,3
  757. string,599,0.010276381478495085,6
  758. reader,598,0.010259225582871553,6
  759. wide_range,596,0.010224913791624492,10
  760. valuable,595,0.01020775789600096,8
  761. official,595,0.01020775789600096,8
  762. claim,595,0.01020775789600096,5
  763. in_domain,595,0.01020775789600096,9
  764. state_ofthe_art,594,0.010190602000377429,15
  765. translator,594,0.010190602000377429,10
  766. graph_based,592,0.010156290209130368,11
  767. conditional_random,591,0.010139134313506836,18
  768. underlying,589,0.010104822522259775,10
  769. margin,588,0.010087666626636243,6
  770. guideline,587,0.010070510731012712,9
  771. absolute,587,0.010070510731012712,8
  772. story,585,0.01003619893976565,5
  773. writing,585,0.01003619893976565,7
  774. semantic_relation,585,0.01003619893976565,17
  775. formalism,584,0.010019043044142119,9
  776. gold_standard,584,0.010019043044142119,13
  777. conditional_random_field,583,0.010001887148518589,24
  778. weighted,583,0.010001887148518589,8
  779. technical,581,0.009967575357271526,9
  780. superior,581,0.009967575357271526,8
  781. explanation,579,0.009933263566024465,11
  782. powerful,578,0.009916107670400933,8
  783. table,578,0.009916107670400933,5
  784. family,576,0.009881795879153872,6
  785. state_of_theart,576,0.009881795879153872,15
  786. spoken_language,575,0.00986463998353034,15
  787. person,575,0.00986463998353034,6
  788. speed,574,0.009847484087906809,5
  789. large_number,572,0.009813172296659747,12
  790. compositional,572,0.009813172296659747,13
  791. outperforms,572,0.009813172296659747,11
  792. en,572,0.009813172296659747,2
  793. coherence,571,0.009796016401036216,9
  794. gender,571,0.009796016401036216,6
  795. consistency,569,0.009761704609789154,11
  796. help,568,0.009744548714165623,4
  797. data_driven,566,0.009710236922918562,11
  798. computation,566,0.009710236922918562,11
  799. entire,564,0.009675925131671499,6
  800. setup,564,0.009675925131671499,5
  801. control,564,0.009675925131671499,7
  802. open_domain,562,0.009641613340424437,11
  803. least,562,0.009641613340424437,5
  804. program,561,0.009624457444800906,7
  805. strength,561,0.009624457444800906,8
  806. linguistic_feature,558,0.009572989757930313,18
  807. separate,558,0.009572989757930313,8
  808. modality,557,0.009555833862306781,8
  809. typical,555,0.00952152207105972,7
  810. logical,554,0.009504366175436188,7
  811. modification,554,0.009504366175436188,12
  812. unknown,554,0.009504366175436188,7
  813. natural_language_generation,552,0.009470054384189127,27
  814. clear,552,0.009470054384189127,5
  815. proper,549,0.009418586697318534,6
  816. possibility,549,0.009418586697318534,11
  817. low_resource_language,549,0.009418586697318534,21
  818. background,548,0.009401430801695003,10
  819. labeled,546,0.009367119010447941,7
  820. highest,545,0.00934996311482441,7
  821. automatic_speech,545,0.00934996311482441,16
  822. semantic_representation,544,0.009332807219200878,23
  823. prsentons,544,0.009332807219200878,9
  824. best_result,544,0.009332807219200878,11
  825. incremental,542,0.009298495427953817,11
  826. fast,541,0.009281339532330285,4
  827. semantic_information,539,0.009247027741083224,20
  828. nous_prsentons,538,0.009229871845459692,14
  829. light,538,0.009229871845459692,5
  830. engineering,538,0.009229871845459692,11
  831. internet,537,0.009212715949836161,8
  832. head,537,0.009212715949836161,4
  833. location,535,0.0091784041585891,8
  834. majority,535,0.0091784041585891,8
  835. asr,534,0.009161248262965568,3
  836. sufficient,534,0.009161248262965568,10
  837. predictive,533,0.009144092367342036,10
  838. word_level,531,0.009109780576094975,10
  839. automatic_evaluation,531,0.009109780576094975,20
  840. au,529,0.009075468784847914,2
  841. composition,528,0.009058312889224382,11
  842. management,527,0.00904115699360085,10
  843. d'une,527,0.00904115699360085,5
  844. sequence_to_sequence,527,0.00904115699360085,20
  845. lexical_resource,526,0.00902400109797732,16
  846. forum,525,0.00900684520235379,5
  847. narrative,524,0.008989689306730258,9
  848. activity,523,0.008972533411106726,8
  849. active,522,0.008955377515483197,6
  850. turn,522,0.008955377515483197,4
  851. equivalent,519,0.008903909828612602,10
  852. sont,519,0.008903909828612602,4
  853. date,517,0.00886959803736554,4
  854. trained,515,0.00883528624611848,7
  855. usefulness,513,0.008800974454871416,10
  856. meaningful,512,0.008783818559247886,10
  857. page,512,0.008783818559247886,4
  858. historical,511,0.008766662663624355,10
  859. patient,510,0.008749506768000823,7
  860. scope,510,0.008749506768000823,5
  861. better_performance,509,0.008732350872377292,18
  862. learned,506,0.008680883185506699,7
  863. penn,506,0.008680883185506699,4
  864. availability,505,0.008663727289883169,12
  865. coherent,504,0.008646571394259638,8
  866. computational_linguistics,504,0.008646571394259638,25
  867. act,503,0.008629415498636106,3
  868. reinforcement,502,0.008612259603012574,13
  869. prior_work,502,0.008612259603012574,10
  870. automatic_speech_recognition,501,0.008595103707389045,28
  871. partial,500,0.008577947811765513,7
  872. primary,495,0.008492168333647859,7
  873. matrix,494,0.008475012438024327,6
  874. bayesian,494,0.008475012438024327,8
  875. treebanks,492,0.008440700646777264,9
  876. presence,492,0.008440700646777264,8
  877. markov,492,0.008440700646777264,6
  878. terminology,491,0.008423544751153735,11
  879. line,491,0.008423544751153735,4
  880. demonstrate,491,0.008423544751153735,11
  881. syntactic_structure,491,0.008423544751153735,19
  882. sparse,491,0.008423544751153735,6
  883. achieves,491,0.008423544751153735,8
  884. path,489,0.008389232959906671,4
  885. artificial,489,0.008389232959906671,10
  886. complementary,488,0.008372077064283142,13
  887. dialect,488,0.008372077064283142,7
  888. survey,488,0.008372077064283142,6
  889. first_step,487,0.00835492116865961,10
  890. exploration,487,0.00835492116865961,11
  891. connection,487,0.00835492116865961,10
  892. side,487,0.00835492116865961,4
  893. policy,486,0.008337765273036079,6
  894. frequent,486,0.008337765273036079,8
  895. verbal,485,0.008320609377412547,6
  896. crf,485,0.008320609377412547,3
  897. rating,485,0.008320609377412547,6
  898. auxiliary,484,0.008303453481789017,9
  899. novel_method,483,0.008286297586165486,12
  900. considerable,483,0.008286297586165486,12
  901. video,482,0.008269141690541954,5
  902. normalization,479,0.008217674003671361,13
  903. applicable,479,0.008217674003671361,10
  904. semantic_parsing,478,0.008200518108047831,16
  905. corpus_based,476,0.008166206316800768,12
  906. n_grams,475,0.008149050421177237,7
  907. discovery,475,0.008149050421177237,9
  908. early,474,0.008131894525553707,5
  909. compound,474,0.008131894525553707,8
  910. interpretable,473,0.008114738629930176,13
  911. proposal,472,0.008097582734306644,8
  912. relational,471,0.008080426838683114,10
  913. state_of_the_art_method,468,0.00802895915181252,23
  914. new_method,468,0.00802895915181252,10
  915. programming,468,0.00802895915181252,11
  916. distant,467,0.00801180325618899,7
  917. sensitive,465,0.007977491464941927,9
  918. hierarchy,465,0.007977491464941927,9
  919. extractive,464,0.007960335569318397,10
  920. beneficial,463,0.007943179673694865,10
  921. poor,462,0.007926023778071334,4
  922. prototype,462,0.007926023778071334,9
  923. central,461,0.007908867882447804,7
  924. acoustic,460,0.007891711986824273,8
  925. conceptual,460,0.007891711986824273,10
  926. generator,459,0.007874556091200741,9
  927. russian,459,0.007874556091200741,7
  928. confidence,458,0.00785740019557721,10
  929. helpful,456,0.007823088404330148,7
  930. recommendation,456,0.007823088404330148,14
  931. portuguese,456,0.007823088404330148,10
  932. personal,455,0.007805932508706617,8
  933. other_hand,455,0.007805932508706617,10
  934. broad,454,0.007788776613083086,5
  935. record,453,0.007771620717459555,6
  936. schema,453,0.007771620717459555,6
  937. hindi,451,0.007737308926212493,5
  938. validation,450,0.0077201530305889615,10
  939. co_occurrence,450,0.0077201530305889615,13
  940. extracted,450,0.0077201530305889615,9
  941. exact,448,0.0076858412393419,5
  942. international,448,0.0076858412393419,13
  943. conversion,448,0.0076858412393419,10
  944. script,448,0.0076858412393419,6
  945. lot,447,0.007668685343718369,3
  946. neural_network_model,447,0.007668685343718369,20
  947. same_time,446,0.007651529448094838,9
  948. professional,445,0.007634373552471306,12
  949. european,445,0.007634373552471306,8
  950. occurrence,444,0.007617217656847776,10
  951. state_of_the_art_model,444,0.007617217656847776,22
  952. true,443,0.007600061761224245,4
  953. contextual_information,443,0.007600061761224245,22
  954. annotated_corpus,440,0.007548594074353651,16
  955. seed,440,0.007548594074353651,4
  956. finite_state,439,0.007531438178730121,12
  957. clause,439,0.007531438178730121,6
  958. rsultats,439,0.007531438178730121,8
  959. document_level,438,0.00751428228310659,14
  960. template,438,0.00751428228310659,8
  961. different_domain,437,0.0074971263874830585,16
  962. digital,437,0.0074971263874830585,7
  963. systme,437,0.0074971263874830585,6
  964. competition,436,0.007479970491859528,11
  965. f_measure,435,0.007462814596235996,9
  966. rank,433,0.007428502804988934,4
  967. human_judgment,432,0.007411346909365403,14
  968. encoder_decoder,432,0.007411346909365403,15
  969. cnn,432,0.007411346909365403,3
  970. pronoun,432,0.007411346909365403,7
  971. equal,431,0.007394191013741873,5
  972. new_approach,431,0.007394191013741873,12
  973. representative,431,0.007394191013741873,14
  974. match,430,0.007377035118118341,5
  975. passage,430,0.007377035118118341,7
  976. iterative,430,0.007377035118118341,9
  977. statement,429,0.0073598792224948105,9
  978. organization,429,0.0073598792224948105,12
  979. treatment,428,0.007342723326871279,9
  980. right,427,0.007325567431247748,5
  981. italian,426,0.007308411535624218,7
  982. consideration,426,0.007308411535624218,13
  983. toolkit,425,0.007291255640000686,7
  984. child,425,0.007291255640000686,5
  985. configuration,425,0.007291255640000686,13
  986. promising_result,425,0.007291255640000686,16
  987. universal_dependency,424,0.007274099744377155,20
  988. empirical_result,424,0.007274099744377155,16
  989. intent,424,0.007274099744377155,6
  990. section,424,0.007274099744377155,7
  991. new_dataset,423,0.007256943848753624,11
  992. proposons,423,0.007256943848753624,9
  993. implication,422,0.007239787953130093,11
  994. likelihood,421,0.0072226320575065625,10
  995. abstractive,421,0.0072226320575065625,11
  996. arbitrary,417,0.007154008475012438,9
  997. out_of_domain,417,0.007154008475012438,13
  998. audio,417,0.007154008475012438,5
  999. huge,416,0.007136852579388907,4
  1000. campaign,414,0.007102540788141845,8
  1001. outcome,413,0.007085384892518314,7
  1002. heterogeneous,413,0.007085384892518314,13
  1003. kernel,413,0.007085384892518314,6
  1004. pre_trained_model,413,0.007085384892518314,17
  1005. multiple_language,413,0.007085384892518314,17
  1006. expansion,412,0.007068228996894783,9
  1007. fine_tuned,412,0.007068228996894783,10
  1008. actual,412,0.007068228996894783,6
  1009. contrastive,412,0.007068228996894783,11
  1010. wsd,411,0.0070510731012712515,3
  1011. nous_proposons,411,0.0070510731012712515,14
  1012. unstructured,410,0.007033917205647721,12
  1013. chinese_english,410,0.007033917205647721,15
  1014. well_known,409,0.00701676131002419,10
  1015. formulation,409,0.00701676131002419,11
  1016. adaptive,406,0.0069652936231535964,8
  1017. transliteration,406,0.0069652936231535964,15
  1018. previous_study,405,0.006948137727530066,14
  1019. capture,405,0.006948137727530066,7
  1020. franais,405,0.006948137727530066,7
  1021. categorization,404,0.006930981831906535,14
  1022. encoding,404,0.006930981831906535,8
  1023. chinese_word,403,0.0069138259362830036,12
  1024. largest,402,0.006896670040659473,7
  1025. internal,402,0.006896670040659473,8
  1026. counterpart,402,0.006896670040659473,11
  1027. real_time,402,0.006896670040659473,9
  1028. post_editing,401,0.006879514145035941,12
  1029. index,401,0.006879514145035941,5
  1030. nlg,401,0.006879514145035941,3
  1031. game,401,0.006879514145035941,4
  1032. logic,400,0.006862358249412411,5
  1033. previous_approach,400,0.006862358249412411,17
  1034. iii,399,0.006845202353788879,3
  1035. high_level,399,0.006845202353788879,10
  1036. sparsity,399,0.006845202353788879,8
  1037. talk,398,0.0068280464581653485,4
  1038. conclusion,396,0.006793734666918286,10
  1039. visualization,394,0.006759422875671224,13
  1040. projection,394,0.006759422875671224,10
  1041. iwslt,394,0.006759422875671224,5
  1042. intermediate,393,0.006742266980047693,12
  1043. following,393,0.006742266980047693,9
  1044. task_specific,392,0.006725111084424163,13
  1045. avec,391,0.006707955188800631,4
  1046. intrinsic,391,0.006707955188800631,9
  1047. scoring,389,0.006673643397553569,7
  1048. emotional,389,0.006673643397553569,9
  1049. taxonomy,388,0.006656487501930038,8
  1050. ne,388,0.006656487501930038,2
  1051. natural_language_understanding,388,0.006656487501930038,30
  1052. relies,387,0.006639331606306508,6
  1053. empirical_study,387,0.006639331606306508,15
  1054. mutual,386,0.006622175710682976,6
  1055. scalable,386,0.006622175710682976,8
  1056. political,386,0.006622175710682976,9
  1057. relatedness,386,0.006622175710682976,11
  1058. concern,385,0.0066050198150594455,7
  1059. cet_article,385,0.0066050198150594455,11
  1060. generative_model,385,0.0066050198150594455,16
  1061. fashion,385,0.0066050198150594455,7
  1062. il,384,0.006587863919435914,2
  1063. trend,383,0.006570708023812383,5
  1064. commonsense,383,0.006570708023812383,11
  1065. distinction,382,0.006553552128188852,11
  1066. web_based,382,0.006553552128188852,9
  1067. map,382,0.006553552128188852,3
  1068. subjective,381,0.006536396232565321,10
  1069. synonym,380,0.00651924033694179,7
  1070. multiword,380,0.00651924033694179,9
  1071. life,379,0.006502084441318259,4
  1072. propagation,378,0.006484928545694728,11
  1073. google,376,0.006450616754447666,6
  1074. future_research,376,0.006450616754447666,15
  1075. inherent,375,0.006433460858824135,8
  1076. phonetic,375,0.006433460858824135,8
  1077. korean,375,0.006433460858824135,6
  1078. regular,375,0.006433460858824135,7
  1079. important_role,374,0.006416304963200604,14
  1080. classical,374,0.006416304963200604,9
  1081. transcript,373,0.006399149067577073,10
  1082. simplification,372,0.0063819931719535416,14
  1083. derivation,372,0.0063819931719535416,10
  1084. reasonable,370,0.00634768138070648,10
  1085. high_accuracy,370,0.00634768138070648,13
  1086. edge,369,0.006330525485082949,4
  1087. task_oriented,368,0.006313369589459418,13
  1088. natural_language_inference,368,0.006313369589459418,26
  1089. chain,367,0.0062962136938358865,5
  1090. shift,367,0.0062962136938358865,5
  1091. fluency,367,0.0062962136938358865,7
  1092. rnn,366,0.006279057798212356,3
  1093. collaborative,366,0.006279057798212356,13
  1094. device,366,0.006279057798212356,6
  1095. context_free,365,0.006261901902588824,12
  1096. realistic,364,0.006244746006965294,9
  1097. book,364,0.006244746006965294,4
  1098. dependent,364,0.006244746006965294,9
  1099. overlap,364,0.006244746006965294,7
  1100. website,364,0.006244746006965294,7
  1101. vision,363,0.006227590111341763,6
  1102. sophisticated,363,0.006227590111341763,13
  1103. run,363,0.006227590111341763,3
  1104. opportunity,363,0.006227590111341763,11
  1105. gradient,363,0.006227590111341763,8
  1106. pragmatic,362,0.006210434215718231,9
  1107. capacity,362,0.006210434215718231,8
  1108. short_term,361,0.006193278320094701,10
  1109. linguistic_knowledge,361,0.006193278320094701,20
  1110. introduction,360,0.006176122424471169,12
  1111. perplexity,359,0.0061589665288476385,10
  1112. pilot,359,0.0061589665288476385,5
  1113. linguist,359,0.0061589665288476385,8
  1114. offensive,359,0.0061589665288476385,9
  1115. granularity,358,0.006141810633224108,11
  1116. rapid,358,0.006141810633224108,5
  1117. future_work,358,0.006141810633224108,11
  1118. functional,357,0.006124654737600576,10
  1119. course,357,0.006124654737600576,6
  1120. neural_language,357,0.006124654737600576,15
  1121. weak,355,0.006090342946353514,4
  1122. slot,355,0.006090342946353514,4
  1123. few_shot,355,0.006090342946353514,8
  1124. electronic,354,0.0060731870507299834,10
  1125. perception,353,0.006056031155106452,10
  1126. rare,353,0.006056031155106452,4
  1127. donne,353,0.006056031155106452,5
  1128. textual_entailment,353,0.006056031155106452,18
  1129. partir,352,0.006038875259482921,6
  1130. advanced,352,0.006038875259482921,8
  1131. minimum,351,0.0060217193638593906,7
  1132. voice,351,0.0060217193638593906,5
  1133. fusion,351,0.0060217193638593906,6
  1134. competitive_result,350,0.006004563468235859,18
  1135. ai,350,0.006004563468235859,2
  1136. substitution,348,0.005970251676988797,12
  1137. combine,348,0.005970251676988797,7
  1138. intelligent,348,0.005970251676988797,11
  1139. fragment,348,0.005970251676988797,8
  1140. lm,348,0.005970251676988797,2
  1141. parallel_data,347,0.005953095781365266,13
  1142. mixture,347,0.005953095781365266,7
  1143. salient,346,0.0059359398857417355,7
  1144. correspondence,346,0.0059359398857417355,14
  1145. indicator,345,0.005918783990118204,9
  1146. new_task,345,0.005918783990118204,8
  1147. unlabeled_data,344,0.005901628094494673,14
  1148. cause,344,0.005901628094494673,5
  1149. regularization,344,0.005901628094494673,14
  1150. uncertainty,344,0.005901628094494673,11
  1151. adjective,344,0.005901628094494673,9
  1152. reordering,344,0.005901628094494673,10
  1153. prsente,344,0.005901628094494673,7
  1154. publication,343,0.005884472198871142,11
  1155. fewer,343,0.005884472198871142,5
  1156. semantic_role_labeling,342,0.005867316303247611,22
  1157. keywords,342,0.005867316303247611,8
  1158. metadata,342,0.005867316303247611,8
  1159. filtering,340,0.005833004512000549,9
  1160. suggestion,340,0.005833004512000549,10
  1161. costly,339,0.005815848616377018,6
  1162. massive,339,0.005815848616377018,7
  1163. transition,339,0.005815848616377018,10
  1164. modelling,339,0.005815848616377018,9
  1165. maximum_entropy,339,0.005815848616377018,15
  1166. ten,339,0.005815848616377018,3
  1167. simpler,339,0.005815848616377018,7
  1168. risk,339,0.005815848616377018,4
  1169. applicability,339,0.005815848616377018,13
  1170. mixed,338,0.005798692720753487,5
  1171. analyzer,337,0.005781536825129956,8
  1172. collocation,337,0.005781536825129956,11
  1173. bayes,337,0.005781536825129956,5
  1174. best_performance,337,0.005781536825129956,16
  1175. paragraph,337,0.005781536825129956,9
  1176. conll,337,0.005781536825129956,5
  1177. period,337,0.005781536825129956,6
  1178. cross_domain,336,0.0057643809295064245,12
  1179. part_of_speech_tagging,336,0.0057643809295064245,22
  1180. syntactic_information,336,0.0057643809295064245,21
  1181. encoders,336,0.0057643809295064245,8
  1182. instruction,335,0.005747225033882894,11
  1183. ground,335,0.005747225033882894,6
  1184. named_entity,335,0.005747225033882894,12
  1185. national,335,0.005747225033882894,8
  1186. quantity,334,0.005730069138259363,8
  1187. short_term_memory,332,0.005695757347012301,17
  1188. note,332,0.005695757347012301,4
  1189. transducer,331,0.005678601451388769,10
  1190. reliability,331,0.005678601451388769,11
  1191. library,330,0.005661445555765239,7
  1192. negation,329,0.005644289660141708,8
  1193. newspaper,329,0.005644289660141708,9
  1194. conference,329,0.005644289660141708,10
  1195. lemma,328,0.0056271337645181765,5
  1196. company,328,0.0056271337645181765,7
  1197. shared,328,0.0056271337645181765,6
  1198. best_performing,328,0.0056271337645181765,15
  1199. readability,328,0.0056271337645181765,11
  1200. measurement,328,0.0056271337645181765,11
  1201. easier,328,0.0056271337645181765,6
  1202. challenging_task,327,0.005609977868894646,16
  1203. greater,327,0.005609977868894646,7
  1204. contextualized,327,0.005609977868894646,14
  1205. manual_annotation,327,0.005609977868894646,17
  1206. aux,326,0.005592821973271114,3
  1207. completion,325,0.005575666077647584,10
  1208. behaviour,325,0.005575666077647584,9
  1209. feasibility,325,0.005575666077647584,11
  1210. numerous,325,0.005575666077647584,8
  1211. spoken_dialogue,324,0.005558510182024053,15
  1212. piece,324,0.005558510182024053,5
  1213. inter_annotator,324,0.005558510182024053,15
  1214. grammatical_error,323,0.005541354286400521,17
  1215. customer,323,0.005541354286400521,8
  1216. population,323,0.005541354286400521,10
  1217. discrete,323,0.005541354286400521,8
  1218. judgement,323,0.005541354286400521,9
  1219. second_language,323,0.005541354286400521,15
  1220. region,323,0.005541354286400521,6
  1221. preprocessing,323,0.005541354286400521,13
  1222. i.e.,322,0.005524198390776991,4
  1223. clue,322,0.005524198390776991,4
  1224. linguistic_resource,322,0.005524198390776991,19
  1225. linguistic_information,322,0.005524198390776991,22
  1226. propose,322,0.005524198390776991,7
  1227. self_attention,321,0.005507042495153459,14
  1228. thousand,321,0.005507042495153459,8
  1229. decade,320,0.0054898865995299286,6
  1230. pretraining,320,0.0054898865995299286,11
  1231. compression,319,0.005472730703906397,11
  1232. today,319,0.005472730703906397,5
  1233. czech,319,0.005472730703906397,5
  1234. accessible,319,0.005472730703906397,10
  1235. interpretability,319,0.005472730703906397,16
  1236. bert_based,318,0.005455574808282866,10
  1237. teacher,318,0.005455574808282866,7
  1238. dutch,318,0.005455574808282866,5
  1239. skill,318,0.005455574808282866,5
  1240. pairwise,317,0.005438418912659336,8
  1241. commercial,317,0.005438418912659336,10
  1242. graphical,317,0.005438418912659336,9
  1243. better_result,317,0.005438418912659336,13
  1244. count,316,0.005421263017035804,5
  1245. mandarin,316,0.005421263017035804,8
  1246. assignment,316,0.005421263017035804,10
  1247. marker,316,0.005421263017035804,6
  1248. specialized,316,0.005421263017035804,11
  1249. mthode,316,0.005421263017035804,6
  1250. efficacy,315,0.0054041071214122735,8
  1251. valid,315,0.0054041071214122735,5
  1252. approche,315,0.0054041071214122735,8
  1253. title,314,0.005386951225788742,5
  1254. us,314,0.005386951225788742,2
  1255. notre,314,0.005386951225788742,5
  1256. pa,313,0.005369795330165211,2
  1257. semantic_feature,313,0.005369795330165211,16
  1258. roberta,313,0.005369795330165211,7
  1259. crosslingual,312,0.005352639434541681,12
  1260. motivation,312,0.005352639434541681,10
  1261. former,311,0.005335483538918149,6
  1262. avon,311,0.005335483538918149,4
  1263. country,311,0.005335483538918149,7
  1264. volume,310,0.005318327643294618,6
  1265. stochastic,310,0.005318327643294618,10
  1266. previous_method,309,0.005301171747671087,15
  1267. nous_avon,309,0.005301171747671087,9
  1268. workflow,309,0.005301171747671087,8
  1269. english_language,309,0.005301171747671087,16
  1270. semantic_analysis,308,0.005284015852047556,17
  1271. expressive,308,0.005284015852047556,10
  1272. extra,308,0.005284015852047556,5
  1273. incorrect,307,0.0052668599564240255,9
  1274. textes,306,0.005249704060800494,6
  1275. realization,306,0.005249704060800494,11
  1276. best_model,306,0.005249704060800494,10
  1277. small_amount,305,0.005232548165176963,12
  1278. neural_architecture,305,0.005232548165176963,19
  1279. statistical_model,305,0.005232548165176963,17
  1280. synthesis,305,0.005232548165176963,9
  1281. reveals,305,0.005232548165176963,7
  1282. neural_language_model,305,0.005232548165176963,21
  1283. intelligence,305,0.005232548165176963,12
  1284. ongoing,305,0.005232548165176963,7
  1285. morphological_analysis,304,0.005215392269553432,22
  1286. deux,304,0.005215392269553432,4
  1287. foreign,304,0.005215392269553432,7
  1288. rouge,303,0.005198236373929901,5
  1289. multi_task_learning,303,0.005198236373929901,19
  1290. regard,303,0.005198236373929901,6
  1291. dense,302,0.00518108047830637,5
  1292. competitive_performance,302,0.00518108047830637,23
  1293. language_specific,302,0.00518108047830637,17
  1294. industry,301,0.005163924582682839,8
  1295. semeval_2020,301,0.005163924582682839,12
  1296. deep_learning_model,301,0.005163924582682839,19
  1297. comparable_corpus,301,0.005163924582682839,17
  1298. finite,301,0.005163924582682839,6
  1299. nlp_application,301,0.005163924582682839,15
  1300. estimate,299,0.005129612791435777,8
  1301. semeval_2020_task,299,0.005129612791435777,17
  1302. multi_document,299,0.005129612791435777,14
  1303. expectation,299,0.005129612791435777,11
  1304. decomposition,299,0.005129612791435777,13
  1305. pretrained_language,299,0.005129612791435777,19
  1306. distributed,299,0.005129612791435777,11
  1307. syntactic_feature,299,0.005129612791435777,17
  1308. suite,298,0.005112456895812246,5
  1309. longer,297,0.0050953010001887145,6
  1310. essay,297,0.0050953010001887145,5
  1311. http,297,0.0050953010001887145,4
  1312. recent_advance,297,0.0050953010001887145,14
  1313. disease,297,0.0050953010001887145,7
  1314. mode,296,0.005078145104565184,4
  1315. cross,296,0.005078145104565184,5
  1316. mental,296,0.005078145104565184,6
  1317. close,296,0.005078145104565184,5
  1318. age,296,0.005078145104565184,3
  1319. extended,296,0.005078145104565184,8
  1320. earlier,295,0.005060989208941653,7
  1321. flexibility,295,0.005060989208941653,11
  1322. static,295,0.005060989208941653,6
  1323. ou,294,0.005043833313318122,2
  1324. nominal,294,0.005043833313318122,7
  1325. approximation,294,0.005043833313318122,13
  1326. specification,294,0.005043833313318122,13
  1327. character_level,294,0.005043833313318122,15
  1328. assistant,292,0.005009521522071059,9
  1329. fixed,292,0.005009521522071059,5
  1330. chinese_word_segmentation,292,0.005009521522071059,25
  1331. performing,291,0.004992365626447529,10
  1332. cadre,290,0.004975209730823998,5
  1333. morpheme,290,0.004975209730823998,8
  1334. textual_similarity,290,0.004975209730823998,18
  1335. spatial,290,0.004975209730823998,7
  1336. virtual,290,0.004975209730823998,7
  1337. adequate,289,0.0049580538352004665,8
  1338. subsequent,289,0.0049580538352004665,10
  1339. sampling,289,0.0049580538352004665,8
  1340. edit,289,0.0049580538352004665,4
  1341. verification,288,0.004940897939576936,12
  1342. integrated,287,0.004923742043953404,10
  1343. functionality,287,0.004923742043953404,13
  1344. pretrained_language_model,286,0.004906586148329874,25
  1345. chunk,286,0.004906586148329874,5
  1346. site,286,0.004906586148329874,4
  1347. repository,286,0.004906586148329874,10
  1348. variational,286,0.004906586148329874,11
  1349. probabilistic_model,286,0.004906586148329874,19
  1350. hence,286,0.004906586148329874,5
  1351. ratio,286,0.004906586148329874,5
  1352. consisting,286,0.004906586148329874,10
  1353. seq2seq,286,0.004906586148329874,7
  1354. intuitive,286,0.004906586148329874,9
  1355. belief,285,0.004889430252706342,6
  1356. movie,285,0.004889430252706342,5
  1357. demand,285,0.004889430252706342,6
  1358. such_model,285,0.004889430252706342,10
  1359. new_domain,285,0.004889430252706342,10
  1360. filter,284,0.0048722743570828115,6
  1361. nli,284,0.0048722743570828115,3
  1362. thesaurus,284,0.0048722743570828115,9
  1363. drop,284,0.0048722743570828115,4
  1364. ablation,283,0.004855118461459281,8
  1365. amazon,283,0.004855118461459281,6
  1366. caption,283,0.004855118461459281,7
  1367. traitement,283,0.004855118461459281,10
  1368. noun_phrase,283,0.004855118461459281,11
  1369. academic,282,0.004837962565835749,8
  1370. feasible,282,0.004837962565835749,8
  1371. bottleneck,282,0.004837962565835749,10
  1372. business,282,0.004837962565835749,8
  1373. status,282,0.004837962565835749,6
  1374. interested,282,0.004837962565835749,10
  1375. nist,281,0.004820806670212219,4
  1376. many_language,281,0.004820806670212219,13
  1377. informal,281,0.004820806670212219,8
  1378. active_learning,281,0.004820806670212219,15
  1379. swedish,281,0.004820806670212219,7
  1380. deeper,281,0.004820806670212219,6
  1381. weakness,280,0.004803650774588687,8
  1382. presentation,280,0.004803650774588687,12
  1383. text_generation,280,0.004803650774588687,15
  1384. large_margin,280,0.004803650774588687,12
  1385. computational_model,280,0.004803650774588687,19
  1386. cross_language,279,0.004786494878965156,14
  1387. financial,279,0.004786494878965156,9
  1388. precise,278,0.004769338983341626,7
  1389. option,278,0.004769338983341626,6
  1390. predictor,278,0.004769338983341626,9
  1391. intuition,278,0.004769338983341626,9
  1392. portion,278,0.004769338983341626,7
  1393. naive,278,0.004769338983341626,5
  1394. linguistic_phenomenon,277,0.004752183087718094,21
  1395. compact,277,0.004752183087718094,7
  1396. body,277,0.004752183087718094,4
  1397. attention_based,277,0.004752183087718094,15
  1398. rhetorical,276,0.0047350271920945635,10
  1399. sound,276,0.0047350271920945635,5
  1400. different_approach,276,0.0047350271920945635,18
  1401. human_language,276,0.0047350271920945635,14
  1402. developer,275,0.004717871296471032,9
  1403. sign,275,0.004717871296471032,4
  1404. causal,275,0.004717871296471032,6
  1405. in_depth,275,0.004717871296471032,8
  1406. stance,275,0.004717871296471032,6
  1407. distillation,274,0.004700715400847501,12
  1408. combined,274,0.004700715400847501,8
  1409. unsupervised_method,273,0.004683559505223971,19
  1410. soft,273,0.004683559505223971,4
  1411. high_precision,273,0.004683559505223971,14
  1412. hour,272,0.004666403609600439,4
  1413. scarce,272,0.004666403609600439,6
  1414. phonological,272,0.004666403609600439,12
  1415. documentation,272,0.004666403609600439,13
  1416. different_level,272,0.004666403609600439,15
  1417. triple,271,0.004649247713976908,6
  1418. million,271,0.004649247713976908,7
  1419. distant_supervision,271,0.004649247713976908,19
  1420. time_consuming,271,0.004649247713976908,14
  1421. multi_word,270,0.004632091818353377,10
  1422. ainsi,270,0.004632091818353377,5
  1423. validity,270,0.004632091818353377,8
  1424. anaphora,270,0.004632091818353377,8
  1425. experiment_result,270,0.004632091818353377,17
  1426. logistic,270,0.004632091818353377,8
  1427. external_knowledge,269,0.004614935922729846,18
  1428. constituency,269,0.004614935922729846,12
  1429. fluent,269,0.004614935922729846,6
  1430. orthographic,269,0.004614935922729846,12
  1431. restriction,268,0.004597780027106315,11
  1432. improves,268,0.004597780027106315,8
  1433. preliminary_result,268,0.004597780027106315,18
  1434. consequence,268,0.004597780027106315,11
  1435. important_task,268,0.004597780027106315,14
  1436. false,268,0.004597780027106315,5
  1437. em,268,0.004597780027106315,2
  1438. tche,268,0.004597780027106315,4
  1439. analyse,268,0.004597780027106315,7
  1440. tre,268,0.004597780027106315,3
  1441. modular,268,0.004597780027106315,7
  1442. hand_crafted,267,0.004580624131482784,12
  1443. stream,267,0.004580624131482784,6
  1444. absence,267,0.004580624131482784,7
  1445. first_time,266,0.004563468235859253,10
  1446. simulation,266,0.004563468235859253,10
  1447. metaphor,265,0.004546312340235722,8
  1448. log,265,0.004546312340235722,3
  1449. langue,265,0.004546312340235722,6
  1450. big,265,0.004546312340235722,3
  1451. straightforward,265,0.004546312340235722,15
  1452. attribution,265,0.004546312340235722,11
  1453. inventory,264,0.004529156444612191,9
  1454. daily,264,0.004529156444612191,5
  1455. spontaneous,264,0.004529156444612191,11
  1456. preposition,264,0.004529156444612191,11
  1457. plausible,264,0.004529156444612191,9
  1458. vast,263,0.00451200054898866,4
  1459. supervised_learning,263,0.00451200054898866,19
  1460. synset,263,0.00451200054898866,6
  1461. lead,263,0.00451200054898866,4
  1462. extract,263,0.00451200054898866,7
  1463. hate,262,0.004494844653365129,4
  1464. transition_based,262,0.004494844653365129,16
  1465. ir,262,0.004494844653365129,2
  1466. indian,262,0.004494844653365129,6
  1467. popularity,261,0.004477688757741598,10
  1468. inclusion,261,0.004477688757741598,9
  1469. impressive,261,0.004477688757741598,10
  1470. multi_label,261,0.004477688757741598,11
  1471. raw_text,261,0.004477688757741598,8
  1472. enhancement,261,0.004477688757741598,11
  1473. movement,261,0.004477688757741598,8
  1474. high_performance,260,0.004460532862118067,16
  1475. mot,260,0.004460532862118067,3
  1476. syntactic_dependency,260,0.004460532862118067,20
  1477. magnitude,260,0.004460532862118067,9
  1478. update,260,0.004460532862118067,6
  1479. user_generated,259,0.004443376966494536,14
  1480. morphosyntactic,259,0.004443376966494536,15
  1481. debate,259,0.004443376966494536,6
  1482. conjunction,258,0.0044262210708710045,11
  1483. best_system,258,0.0044262210708710045,11
  1484. file,258,0.0044262210708710045,4
  1485. good_performance,258,0.0044262210708710045,16
  1486. pronunciation,258,0.0044262210708710045,13
  1487. nlp_system,258,0.0044262210708710045,10
  1488. entre,258,0.0044262210708710045,5
  1489. factual,257,0.004409065175247474,7
  1490. forest,257,0.004409065175247474,6
  1491. block,256,0.004391909279623943,5
  1492. n_best,256,0.004391909279623943,6
  1493. respective,256,0.004391909279623943,10
  1494. neutral,255,0.004374753384000412,7
  1495. matter,255,0.004374753384000412,6
  1496. un_corpus,255,0.004374753384000412,9
  1497. problematic,255,0.004374753384000412,11
  1498. equal_contribution,255,0.004374753384000412,18
  1499. state_of_the_art_system,255,0.004374753384000412,23
  1500. affect,254,0.004357597488376881,6
  1501. multi_modal,254,0.004357597488376881,11
  1502. shortcoming,254,0.004357597488376881,11
  1503. new_model,253,0.0043404415927533494,9
  1504. logistic_regression,253,0.0043404415927533494,19
  1505. character_based,253,0.0043404415927533494,15
  1506. language_independent,253,0.0043404415927533494,20
  1507. legal,253,0.0043404415927533494,5
  1508. controlled,252,0.004323285697129819,10
  1509. reward,252,0.004323285697129819,6
  1510. topical,252,0.004323285697129819,7
  1511. new_language,252,0.004323285697129819,12
  1512. non_native,251,0.004306129801506287,10
  1513. scarcity,251,0.004306129801506287,8
  1514. demonstration,251,0.004306129801506287,13
  1515. comme,251,0.004306129801506287,5
  1516. word2vec,251,0.004306129801506287,8
  1517. profile,250,0.004288973905882757,7
  1518. day,250,0.004288973905882757,3
  1519. human_annotation,250,0.004288973905882757,16
  1520. text_based,250,0.004288973905882757,10
  1521. extrinsic,250,0.004288973905882757,9
  1522. substantial_improvement,250,0.004288973905882757,23
  1523. bound,249,0.004271818010259226,5
  1524. trigger,249,0.004271818010259226,7
  1525. previous_research,249,0.004271818010259226,17
  1526. symbolic,249,0.004271818010259226,8
  1527. beam,249,0.004271818010259226,4
  1528. generalized,249,0.004271818010259226,11
  1529. richer,249,0.004271818010259226,6
  1530. binary_classification,248,0.004254662114635694,21
  1531. limit,248,0.004254662114635694,5
  1532. audience,248,0.004254662114635694,8
  1533. english_german,248,0.004254662114635694,14
  1534. non,248,0.004254662114635694,3
  1535. syntax_based,247,0.004237506219012164,12
  1536. synchronous,247,0.004237506219012164,11
  1537. incomplete,247,0.004237506219012164,10
  1538. divergence,246,0.004220350323388632,10
  1539. scene,246,0.004220350323388632,5
  1540. domaine,246,0.004220350323388632,7
  1541. discourse_relation,245,0.0042031944277651015,18
  1542. inflection,245,0.0042031944277651015,10
  1543. simultaneous,245,0.0042031944277651015,12
  1544. small_number,245,0.0042031944277651015,12
  1545. wide_variety,245,0.0042031944277651015,12
  1546. automatic_metric,245,0.0042031944277651015,16
  1547. phrasal,245,0.0042031944277651015,7
  1548. sub_tasks,245,0.0042031944277651015,9
  1549. attachment,245,0.0042031944277651015,10
  1550. journal,244,0.004186038532141571,7
  1551. growth,244,0.004186038532141571,6
  1552. resulting,244,0.004186038532141571,9
  1553. evolution,244,0.004186038532141571,9
  1554. writer,244,0.004186038532141571,6
  1555. modle,244,0.004186038532141571,5
  1556. education,244,0.004186038532141571,9
  1557. two_stage,244,0.004186038532141571,9
  1558. macro,243,0.004168882636518039,5
  1559. rich_language,243,0.004168882636518039,13
  1560. smantique,243,0.004168882636518039,9
  1561. recording,243,0.004168882636518039,9
  1562. linguistic_analysis,243,0.004168882636518039,19
  1563. unsupervised_approach,243,0.004168882636518039,21
  1564. proposition,243,0.004168882636518039,11
  1565. enhanced,242,0.004151726740894509,8
  1566. aggregation,242,0.004151726740894509,11
  1567. framenet,242,0.004151726740894509,8
  1568. scratch,241,0.004134570845270977,7
  1569. flow,241,0.004134570845270977,4
  1570. httpsgithub.com,241,0.004134570845270977,15
  1571. argumentation,241,0.004134570845270977,13
  1572. general_purpose,241,0.004134570845270977,15
  1573. compositionality,241,0.004134570845270977,16
  1574. truth,240,0.004117414949647446,5
  1575. educational,240,0.004117414949647446,11
  1576. neural_network_architecture,239,0.004100259054023916,27
  1577. question_answering,239,0.004100259054023916,18
  1578. crowdsourcing,239,0.004100259054023916,13
  1579. recent_study,239,0.004100259054023916,12
  1580. montrons,238,0.004083103158400384,8
  1581. rise,238,0.004083103158400384,4
  1582. aware,238,0.004083103158400384,5
  1583. semantic_parser,238,0.004083103158400384,15
  1584. small_set,238,0.004083103158400384,9
  1585. pre_processing,237,0.0040659472627768535,14
  1586. ie,237,0.0040659472627768535,2
  1587. correctness,237,0.0040659472627768535,11
  1588. simplicity,236,0.004048791367153322,10
  1589. attack,236,0.004048791367153322,6
  1590. collaboration,236,0.004048791367153322,13
  1591. insufficient,236,0.004048791367153322,12
  1592. extractor,235,0.004031635471529791,9
  1593. masked,235,0.004031635471529791,6
  1594. trade_off,235,0.004031635471529791,9
  1595. automatic_detection,235,0.004031635471529791,19
  1596. short_text,235,0.004031635471529791,10
  1597. se,235,0.004031635471529791,2
  1598. license,234,0.00401447957590626,7
  1599. ud,234,0.00401447957590626,2
  1600. typology,234,0.00401447957590626,8
  1601. deal,234,0.00401447957590626,4
  1602. testing,234,0.00401447957590626,7
  1603. context_free_grammar,234,0.00401447957590626,20
  1604. distributional_semantics,234,0.00401447957590626,24
  1605. monolingual_data,234,0.00401447957590626,16
  1606. member,233,0.003997323680282729,6
  1607. variability,233,0.003997323680282729,11
  1608. bilingual_dictionary,233,0.003997323680282729,20
  1609. shared_task,233,0.003997323680282729,11
  1610. bag_of_words,232,0.0039801677846591985,12
  1611. out_of_vocabulary,232,0.0039801677846591985,17
  1612. trait,232,0.0039801677846591985,5
  1613. diagnosis,232,0.0039801677846591985,9
  1614. faster,232,0.0039801677846591985,6
  1615. further_research,231,0.003963011889035667,16
  1616. desired,231,0.003963011889035667,7
  1617. protocol,231,0.003963011889035667,8
  1618. window,231,0.003963011889035667,6
  1619. andor,231,0.003963011889035667,5
  1620. creative,231,0.003963011889035667,8
  1621. approximate,231,0.003963011889035667,11
  1622. unknown_word,231,0.003963011889035667,12
  1623. dirichlet,231,0.003963011889035667,9
  1624. different_model,230,0.003945855993412136,15
  1625. brief,230,0.003945855993412136,5
  1626. remarkable,230,0.003945855993412136,10
  1627. unclear,230,0.003945855993412136,7
  1628. semeval_2019,230,0.003945855993412136,12
  1629. human_annotator,230,0.003945855993412136,15
  1630. multi_document_summarization,230,0.003945855993412136,28
  1631. aid,230,0.003945855993412136,3
  1632. mutual_information,229,0.003928700097788605,18
  1633. bootstrapping,229,0.003928700097788605,13
  1634. social_network,229,0.003928700097788605,14
  1635. paraphrasing,229,0.003928700097788605,12
  1636. prosodic,229,0.003928700097788605,8
  1637. literary,228,0.003911544202165074,8
  1638. semeval_2022,228,0.003911544202165074,12
  1639. descriptive,227,0.003894388306541543,11
  1640. abstractive_summarization,227,0.003894388306541543,25
  1641. semeval_2019_task,227,0.003894388306541543,17
  1642. weakly,227,0.003894388306541543,6
  1643. significance,227,0.003894388306541543,12
  1644. associated,226,0.003877232410918012,10
  1645. existence,226,0.003877232410918012,9
  1646. ordering,226,0.003877232410918012,8
  1647. thanks,226,0.003877232410918012,6
  1648. kb,226,0.003877232410918012,2
  1649. foundation,226,0.003877232410918012,10
  1650. deployment,226,0.003877232410918012,10
  1651. hmm,226,0.003877232410918012,3
  1652. intention,226,0.003877232410918012,9
  1653. semeval_2022_task,225,0.0038600765152944807,17
  1654. room,225,0.0038600765152944807,4
  1655. wider,224,0.00384292061967095,5
  1656. _a,224,0.00384292061967095,2
  1657. mobile,224,0.00384292061967095,6
  1658. inter_annotator_agreement,223,0.003825764724047419,25
  1659. word_based,223,0.003825764724047419,10
  1660. superiority,223,0.003825764724047419,11
  1661. semantic_annotation,223,0.003825764724047419,19
  1662. worse,222,0.003808608828423888,5
  1663. tuning,221,0.0037914529328003568,6
  1664. natural_language_text,221,0.0037914529328003568,21
  1665. blog,221,0.0037914529328003568,4
  1666. planning,221,0.0037914529328003568,8
  1667. turkish,221,0.0037914529328003568,7
  1668. neighbor,221,0.0037914529328003568,8
  1669. infrastructure,221,0.0037914529328003568,14
  1670. predicted,220,0.0037742970371768257,9
  1671. spoken_dialogue_system,220,0.0037742970371768257,22
  1672. semantic_model,220,0.0037742970371768257,14
  1673. ressources,220,0.0037742970371768257,10
  1674. learning_based,220,0.0037742970371768257,14
  1675. semeval_2016,220,0.0037742970371768257,12
  1676. call,219,0.003757141141553295,4
  1677. sub_task,219,0.003757141141553295,8
  1678. parallel_text,219,0.003757141141553295,13
  1679. predicate_argument,219,0.003757141141553295,18
  1680. elementary,219,0.003757141141553295,10
  1681. monolingual_corpus,219,0.003757141141553295,18
  1682. srl,219,0.003757141141553295,3
  1683. hybrid_approach,219,0.003757141141553295,15
  1684. cross_lingual_transfer,218,0.003739985245929764,22
  1685. semi_supervised_learning,218,0.003739985245929764,24
  1686. multi_domain,218,0.003739985245929764,12
  1687. moses,218,0.003739985245929764,5
  1688. coefficient,217,0.003722829350306233,11
  1689. convolution,217,0.003722829350306233,11
  1690. uniform,216,0.0037056734546827017,7
  1691. perceptron,216,0.0037056734546827017,10
  1692. refinement,216,0.0037056734546827017,10
  1693. acl,216,0.0037056734546827017,3
  1694. analogy,216,0.0037056734546827017,7
  1695. multitask,216,0.0037056734546827017,9
  1696. long_distance,216,0.0037056734546827017,13
  1697. stable,215,0.0036885175590591706,6
  1698. qualitative_analysis,215,0.0036885175590591706,20
  1699. knowledge_based,215,0.0036885175590591706,15
  1700. tracking,215,0.0036885175590591706,8
  1701. cultural,215,0.0036885175590591706,8
  1702. broader,214,0.0036713616634356395,7
  1703. bilingual_corpus,214,0.0036713616634356395,16
  1704. nmt_model,214,0.0036713616634356395,9
  1705. nous_montrons,214,0.0036713616634356395,13
  1706. contemporary,214,0.0036713616634356395,12
  1707. offensive_language,214,0.0036713616634356395,18
  1708. vital,214,0.0036713616634356395,5
  1709. lexical_feature,214,0.0036713616634356395,15
  1710. intervention,213,0.003654205767812109,12
  1711. inconsistency,213,0.003654205767812109,13
  1712. log_linear,212,0.0036370498721885777,10
  1713. prominent,212,0.0036370498721885777,9
  1714. construct,212,0.0036370498721885777,9
  1715. promise,212,0.0036370498721885777,7
  1716. tude,211,0.0036198939765650466,4
  1717. joint_model,211,0.0036198939765650466,11
  1718. travail,211,0.0036198939765650466,7
  1719. desirable,211,0.0036198939765650466,9
  1720. serious,211,0.0036198939765650466,7
  1721. enough,211,0.0036198939765650466,6
  1722. semi_automatic,211,0.0036198939765650466,14
  1723. native_speaker,210,0.0036027380809415155,14
  1724. connective,210,0.0036027380809415155,10
  1725. lattice,210,0.0036027380809415155,7
  1726. state_of_the_art_approach,210,0.0036027380809415155,25
  1727. xml,210,0.0036027380809415155,3
  1728. deterministic,210,0.0036027380809415155,13
  1729. oracle,210,0.0036027380809415155,6
  1730. manual_evaluation,209,0.0035855821853179844,17
  1731. post_processing,209,0.0035855821853179844,15
  1732. stronger,209,0.0035855821853179844,8
  1733. back_translation,209,0.0035855821853179844,16
  1734. semeval_2016_task,209,0.0035855821853179844,17
  1735. various_type,209,0.0035855821853179844,12
  1736. tokenization,209,0.0035855821853179844,12
  1737. observed,209,0.0035855821853179844,8
  1738. plan,209,0.0035855821853179844,4
  1739. bilingual_lexicon,209,0.0035855821853179844,17
  1740. release,208,0.0035684262896944533,7
  1741. citation,208,0.0035684262896944533,8
  1742. foreign_language,208,0.0035684262896944533,16
  1743. posterior,208,0.0035684262896944533,9
  1744. different_way,208,0.0035684262896944533,13
  1745. encouraging,208,0.0035684262896944533,11
  1746. context_aware,208,0.0035684262896944533,13
  1747. editor,208,0.0035684262896944533,6
  1748. keyword,208,0.0035684262896944533,7
  1749. th,208,0.0035684262896944533,2
  1750. multilingual_model,208,0.0035684262896944533,18
  1751. high_resource,207,0.0035512703940709226,13
  1752. morphological_analyzer,207,0.0035512703940709226,22
  1753. named,207,0.0035512703940709226,5
  1754. constrained,207,0.0035512703940709226,11
  1755. root,207,0.0035512703940709226,4
  1756. concrete,206,0.0035341144984473915,8
  1757. new_feature,206,0.0035341144984473915,11
  1758. confusion,206,0.0035341144984473915,9
  1759. threshold,206,0.0035341144984473915,9
  1760. adequacy,206,0.0035341144984473915,8
  1761. good_result,206,0.0035341144984473915,11
  1762. new_corpus,205,0.0035169586028238604,10
  1763. hundred,205,0.0035169586028238604,7
  1764. feature_based,205,0.0035169586028238604,13
  1765. tendency,205,0.0035169586028238604,8
  1766. subword,205,0.0035169586028238604,7
  1767. translated,204,0.0034998027072003293,10
  1768. ccg,204,0.0034998027072003293,3
  1769. argumentative,204,0.0034998027072003293,13
  1770. bigram,204,0.0034998027072003293,6
  1771. mismatch,204,0.0034998027072003293,8
  1772. symbol,204,0.0034998027072003293,6
  1773. off_the_shelf,204,0.0034998027072003293,13
  1774. bank,204,0.0034998027072003293,4
  1775. emphasis,203,0.0034826468115767982,8
  1776. center,203,0.0034826468115767982,6
  1777. multi_lingual,203,0.0034826468115767982,13
  1778. school,203,0.0034826468115767982,6
  1779. different_task,203,0.0034826468115767982,14
  1780. perform,203,0.0034826468115767982,7
  1781. lightweight,203,0.0034826468115767982,11
  1782. american,203,0.0034826468115767982,8
  1783. pivot,203,0.0034826468115767982,5
  1784. exercise,203,0.0034826468115767982,8
  1785. redundant,202,0.0034654909159532675,9
  1786. l'analyse,202,0.0034654909159532675,9
  1787. redundancy,202,0.0034654909159532675,10
  1788. greedy,202,0.0034654909159532675,6
  1789. acceptable,202,0.0034654909159532675,10
  1790. sota,202,0.0034654909159532675,4
  1791. sarcasm,202,0.0034654909159532675,7
  1792. crfs,202,0.0034654909159532675,4
  1793. prompt,201,0.0034483350203297364,6
  1794. categorial,201,0.0034483350203297364,10
  1795. demo,201,0.0034483350203297364,4
  1796. patent,201,0.0034483350203297364,6
  1797. on_line,201,0.0034483350203297364,7
  1798. syllable,201,0.0034483350203297364,8
  1799. failure,201,0.0034483350203297364,7
  1800. effective_method,201,0.0034483350203297364,16
  1801. finnish,201,0.0034483350203297364,7
  1802. superior_performance,201,0.0034483350203297364,20
  1803. phone,201,0.0034483350203297364,5
  1804. recursive,201,0.0034483350203297364,9
  1805. society,201,0.0034483350203297364,7
  1806. request,201,0.0034483350203297364,7
  1807. nlu,201,0.0034483350203297364,3
  1808. lstms,201,0.0034483350203297364,5
  1809. np,201,0.0034483350203297364,2
  1810. inflectional,200,0.0034311791247062053,12
  1811. token_level,200,0.0034311791247062053,11
  1812. reddit,200,0.0034311791247062053,6
  1813. detailed_analysis,200,0.0034311791247062053,17
  1814. semeval_2018,200,0.0034311791247062053,12
  1815. syntactic_parsing,199,0.0034140232290826742,17
  1816. clean,199,0.0034140232290826742,5
  1817. punctuation,199,0.0034140232290826742,11
  1818. judge,199,0.0034140232290826742,5
  1819. polish,199,0.0034140232290826742,6
  1820. old,199,0.0034140232290826742,3
  1821. literal,198,0.003396867333459143,7
  1822. parallel_sentence,198,0.003396867333459143,17
  1823. psycholinguistic,198,0.003396867333459143,16
  1824. channel,198,0.003396867333459143,7
  1825. recent_research,198,0.003396867333459143,15
  1826. overall_performance,198,0.003396867333459143,19
  1827. largescale,198,0.003396867333459143,10
  1828. percentage,198,0.003396867333459143,10
  1829. predefined,198,0.003396867333459143,10
  1830. covid_19,198,0.003396867333459143,8
  1831. cosine,198,0.003396867333459143,6
  1832. antecedent,197,0.003379711437835612,10
  1833. langues,197,0.003379711437835612,7
  1834. identity,197,0.003379711437835612,8
  1835. restaurant,197,0.003379711437835612,10
  1836. isolation,197,0.003379711437835612,9
  1837. da,197,0.003379711437835612,2
  1838. proportion,197,0.003379711437835612,10
  1839. intensity,197,0.003379711437835612,9
  1840. known,196,0.0033625555422120814,5
  1841. mwes,196,0.0033625555422120814,4
  1842. tamil,196,0.0033625555422120814,5
  1843. compatible,196,0.0033625555422120814,10
  1844. text_summarization,196,0.0033625555422120814,18
  1845. stylistic,196,0.0033625555422120814,9
  1846. care,196,0.0033625555422120814,4
  1847. robot,196,0.0033625555422120814,5
  1848. complement,195,0.0033453996465885503,10
  1849. different_method,195,0.0033453996465885503,16
  1850. comparable_performance,195,0.0033453996465885503,22
  1851. empirical_evaluation,195,0.0033453996465885503,20
  1852. sentiment_analysis,195,0.0033453996465885503,18
  1853. current_state,195,0.0033453996465885503,13
  1854. stanford,195,0.0033453996465885503,8
  1855. irrelevant,195,0.0033453996465885503,10
  1856. newswire,195,0.0033453996465885503,8
  1857. native_language,195,0.0033453996465885503,15
  1858. dual,195,0.0033453996465885503,4
  1859. indian_language,194,0.003328243750965019,15
  1860. amr,194,0.003328243750965019,3
  1861. canonical,194,0.003328243750965019,9
  1862. closed,194,0.003328243750965019,6
  1863. state_of_the_art_baseline,194,0.003328243750965019,25
  1864. long_term,194,0.003328243750965019,9
  1865. adversarial_training,194,0.003328243750965019,20
  1866. unsupervised_learning,194,0.003328243750965019,21
  1867. mt_system,194,0.003328243750965019,9
  1868. split,193,0.003311087855341488,5
  1869. numerical,193,0.003311087855341488,9
  1870. inconsistent,193,0.003311087855341488,12
  1871. semeval_2018_task,193,0.003311087855341488,17
  1872. code_mixed,193,0.003311087855341488,10
  1873. fine,192,0.003293931959717957,4
  1874. spelling,192,0.003293931959717957,8
  1875. picture,192,0.003293931959717957,7
  1876. single_word,192,0.003293931959717957,11
  1877. thorough,192,0.003293931959717957,8
  1878. task_oriented_dialogue,192,0.003293931959717957,22
  1879. nlp_model,192,0.003293931959717957,9
  1880. lexical_information,191,0.003276776064094426,19
  1881. abstraction,191,0.003276776064094426,11
  1882. galement,191,0.003276776064094426,8
  1883. classic,191,0.003276776064094426,7
  1884. diffrents,191,0.003276776064094426,9
  1885. many_application,191,0.003276776064094426,16
  1886. further_improvement,191,0.003276776064094426,19
  1887. widespread,191,0.003276776064094426,10
  1888. recognizer,191,0.003276776064094426,10
  1889. biomedical_text,191,0.003276776064094426,15
  1890. mistake,190,0.003259620168470895,7
  1891. real_life,190,0.003259620168470895,9
  1892. snippet,190,0.003259620168470895,7
  1893. linking,190,0.003259620168470895,7
  1894. demographic,189,0.003242464272847364,11
  1895. productivity,189,0.003242464272847364,12
  1896. discrimination,189,0.003242464272847364,14
  1897. leur,189,0.003242464272847364,4
  1898. automatic_extraction,188,0.003225308377223833,20
  1899. syntactic_analysis,188,0.003225308377223833,18
  1900. peut,188,0.003225308377223833,4
  1901. proficiency,188,0.003225308377223833,11
  1902. mind,187,0.003208152481600302,4
  1903. transformer_based_model,187,0.003208152481600302,23
  1904. contrary,187,0.003208152481600302,8
  1905. suffers,187,0.003208152481600302,7
  1906. satisfactory,187,0.003208152481600302,12
  1907. modified,187,0.003208152481600302,8
  1908. fourth,187,0.003208152481600302,6
  1909. reranking,187,0.003208152481600302,9
  1910. human_performance,187,0.003208152481600302,17
  1911. grammatical_error_correction,186,0.0031909965859767708,28
  1912. syntaxique,186,0.0031909965859767708,10
  1913. self_supervised,186,0.0031909965859767708,15
  1914. train,185,0.00317384069035324,5
  1915. inductive,185,0.00317384069035324,9
  1916. logical_form,185,0.00317384069035324,12
  1917. drawback,185,0.00317384069035324,8
  1918. so_called,185,0.00317384069035324,9
  1919. depth,185,0.00317384069035324,5
  1920. artificial_intelligence,185,0.00317384069035324,23
  1921. speech_recognition,185,0.00317384069035324,18
  1922. none,184,0.003156684794729709,4
  1923. transduction,184,0.003156684794729709,12
  1924. upper,184,0.003156684794729709,5
  1925. english_text,184,0.003156684794729709,12
  1926. semeval_2021,184,0.003156684794729709,12
  1927. autoencoder,184,0.003156684794729709,11
  1928. bottom_up,184,0.003156684794729709,9
  1929. density,184,0.003156684794729709,7
  1930. consistent_improvement,184,0.003156684794729709,22
  1931. temporal_relation,184,0.003156684794729709,17
  1932. lda,183,0.003139528899106178,3
  1933. figure,183,0.003139528899106178,6
  1934. experimental_evaluation,183,0.003139528899106178,23
  1935. tutorial,183,0.003139528899106178,8
  1936. contexte,183,0.003139528899106178,8
  1937. semeval_2021_task,183,0.003139528899106178,17
  1938. unannotated,183,0.003139528899106178,11
  1939. diagnostic,183,0.003139528899106178,10
  1940. identifier,183,0.003139528899106178,10
  1941. lexicalized,183,0.003139528899106178,11
  1942. broad_coverage,182,0.003122373003482647,14
  1943. dependency_based,182,0.003122373003482647,16
  1944. government,182,0.003122373003482647,10
  1945. human_judgement,182,0.003122373003482647,15
  1946. semantic_structure,182,0.003122373003482647,18
  1947. lowresource,182,0.003122373003482647,11
  1948. competitive_baseline,182,0.003122373003482647,20
  1949. integer,182,0.003122373003482647,7
  1950. l2,182,0.003122373003482647,2
  1951. variance,182,0.003122373003482647,8
  1952. supervised_machine,181,0.0031052171078591157,18
  1953. bad,181,0.0031052171078591157,3
  1954. biomedical_domain,181,0.0031052171078591157,17
  1955. meeting,181,0.0031052171078591157,7
  1956. offline,181,0.0031052171078591157,7
  1957. german_english,181,0.0031052171078591157,14
  1958. ter,181,0.0031052171078591157,3
  1959. thing,181,0.0031052171078591157,5
  1960. diachronic,181,0.0031052171078591157,10
  1961. statistical_method,181,0.0031052171078591157,18
  1962. operator,180,0.0030880612122355846,8
  1963. reconstruction,180,0.0030880612122355846,14
  1964. navigation,180,0.0030880612122355846,10
  1965. aligned,180,0.0030880612122355846,7
  1966. lexical_item,180,0.0030880612122355846,12
  1967. referential,180,0.0030880612122355846,11
  1968. iteration,180,0.0030880612122355846,9
  1969. institute,180,0.0030880612122355846,9
  1970. hidden_markov,180,0.0030880612122355846,13
  1971. human_like,180,0.0030880612122355846,10
  1972. allocation,180,0.0030880612122355846,10
  1973. different_feature,180,0.0030880612122355846,17
  1974. wrong,180,0.0030880612122355846,5
  1975. drug,180,0.0030880612122355846,4
  1976. equivalence,180,0.0030880612122355846,11
  1977. present_result,180,0.0030880612122355846,14
  1978. pretrained_model,179,0.003070905316612054,16
  1979. semeval_2017,179,0.003070905316612054,12
  1980. two_step,179,0.003070905316612054,8
  1981. grounding,179,0.003070905316612054,9
  1982. social_medium_platform,179,0.003070905316612054,22
  1983. categorial_grammar,179,0.003070905316612054,18
  1984. suffix,179,0.003070905316612054,6
  1985. traduction,179,0.003070905316612054,10
  1986. coarse_grained,179,0.003070905316612054,14
  1987. semantic_space,179,0.003070905316612054,14
  1988. differs,179,0.003070905316612054,7
  1989. affective,179,0.003070905316612054,9
  1990. duration,179,0.003070905316612054,8
  1991. subjectivity,179,0.003070905316612054,12
  1992. revision,178,0.003053749420988523,8
  1993. expertise,178,0.003053749420988523,9
  1994. obstacle,178,0.003053749420988523,8
  1995. whereas,178,0.003053749420988523,7
  1996. low_resource_setting,178,0.003053749420988523,20
  1997. synthetic_data,178,0.003053749420988523,14
  1998. gaussian,178,0.003053749420988523,8
  1999. specificity,178,0.003053749420988523,11
  2000. l'utilisation,178,0.003053749420988523,13
  2001. usability,177,0.0030365935253649917,9
  2002. automatic_identification,177,0.0030365935253649917,24
  2003. guidance,177,0.0030365935253649917,8
  2004. mechanical,177,0.0030365935253649917,10
  2005. exchange,177,0.0030365935253649917,8
  2006. organizer,177,0.0030365935253649917,9
  2007. chat,177,0.0030365935253649917,4
  2008. market,177,0.0030365935253649917,6
  2009. perturbation,177,0.0030365935253649917,12
  2010. formation,177,0.0030365935253649917,9
  2011. extractive_summarization,177,0.0030365935253649917,24
  2012. prior_knowledge,176,0.0030194376297414606,15
  2013. phoneme,176,0.0030194376297414606,7
  2014. specific_domain,176,0.0030194376297414606,15
  2015. session,176,0.0030194376297414606,7
  2016. single_model,176,0.0030194376297414606,12
  2017. ontological,176,0.0030194376297414606,11
  2018. different_datasets,176,0.0030194376297414606,18
  2019. phrase_based_smt,176,0.0030194376297414606,16
  2020. semantic_relatedness,176,0.0030194376297414606,20
  2021. calculation,176,0.0030194376297414606,11
  2022. discrepancy,175,0.0030022817341179295,11
  2023. barrier,175,0.0030022817341179295,7
  2024. pruning,175,0.0030022817341179295,7
  2025. headline,175,0.0030022817341179295,8
  2026. initiative,175,0.0030022817341179295,10
  2027. kg,175,0.0030022817341179295,2
  2028. asian,175,0.0030022817341179295,5
  2029. large_set,175,0.0030022817341179295,9
  2030. free_text,175,0.0030022817341179295,9
  2031. modifier,174,0.0029851258384943984,8
  2032. psychological,174,0.0029851258384943984,13
  2033. practitioner,173,0.0029679699428708677,12
  2034. excellent,173,0.0029679699428708677,9
  2035. utilisant,173,0.0029679699428708677,9
  2036. textual_data,173,0.0029679699428708677,12
  2037. voting,173,0.0029679699428708677,6
  2038. coordination,173,0.0029679699428708677,12
  2039. indexing,173,0.0029679699428708677,8
  2040. mthodes,173,0.0029679699428708677,7
  2041. versus,173,0.0029679699428708677,6
  2042. under_resourced,172,0.0029508140472473366,15
  2043. semeval_2017_task,172,0.0029508140472473366,17
  2044. local_context,172,0.0029508140472473366,13
  2045. physical,172,0.0029508140472473366,8
  2046. disorder,172,0.0029508140472473366,8
  2047. reaction,172,0.0029508140472473366,8
  2048. rnns,172,0.0029508140472473366,4
  2049. self_training,172,0.0029508140472473366,13
  2050. novel_framework,171,0.0029336581516238055,15
  2051. api,171,0.0029336581516238055,3
  2052. targeted,171,0.0029336581516238055,8
  2053. linguistic_annotation,171,0.0029336581516238055,21
  2054. dominant,171,0.0029336581516238055,8
  2055. latest,171,0.0029336581516238055,6
  2056. texte,171,0.0029336581516238055,5
  2057. smantiques,171,0.0029336581516238055,10
  2058. large_collection,171,0.0029336581516238055,16
  2059. communicative,171,0.0029336581516238055,13
  2060. different_aspect,170,0.0029165022560002744,16
  2061. different_word,170,0.0029165022560002744,14
  2062. referent,170,0.0029165022560002744,8
  2063. httpsgithub,170,0.0029165022560002744,11
  2064. relative_improvement,170,0.0029165022560002744,20
  2065. linguistiques,170,0.0029165022560002744,13
  2066. regularity,170,0.0029165022560002744,10
  2067. such_system,170,0.0029165022560002744,11
  2068. replacement,169,0.0028993463603767433,11
  2069. induced,169,0.0028993463603767433,7
  2070. leaderboard,169,0.0028993463603767433,11
  2071. semantic_knowledge,169,0.0028993463603767433,18
  2072. exploitation,169,0.0028993463603767433,12
  2073. lexical_semantics,169,0.0028993463603767433,17
  2074. norm,169,0.0028993463603767433,4
  2075. major_challenge,169,0.0028993463603767433,15
  2076. perfect,168,0.0028821904647532122,7
  2077. spectrum,168,0.0028821904647532122,8
  2078. premise,168,0.0028821904647532122,7
  2079. principled,168,0.0028821904647532122,10
  2080. ideal,168,0.0028821904647532122,5
  2081. crowdsourced,168,0.0028821904647532122,12
  2082. augmented,167,0.0028650345691296816,9
  2083. ace,167,0.0028650345691296816,3
  2084. masked_language,167,0.0028650345691296816,15
  2085. chinese_to_english,167,0.0028650345691296816,18
  2086. vowel,167,0.0028650345691296816,5
  2087. viable,167,0.0028650345691296816,6
  2088. several_language,167,0.0028650345691296816,16
  2089. pearson,166,0.0028478786735061505,7
  2090. significant_performance,166,0.0028478786735061505,23
  2091. flat,166,0.0028478786735061505,4
  2092. novelty,166,0.0028478786735061505,7
  2093. trained_model,166,0.0028478786735061505,13
  2094. une_approche,166,0.0028478786735061505,12
  2095. sensitivity,166,0.0028478786735061505,11
  2096. permet,166,0.0028478786735061505,6
  2097. personality,166,0.0028478786735061505,11
  2098. disagreement,166,0.0028478786735061505,12
  2099. adoption,165,0.0028307227778826194,8
  2100. labelling,165,0.0028307227778826194,9
  2101. turk,165,0.0028307227778826194,4
  2102. compte,165,0.0028307227778826194,6
  2103. hypernym,165,0.0028307227778826194,8
  2104. normal,165,0.0028307227778826194,6
  2105. ont,164,0.0028135668822590883,3
  2106. mechanical_turk,164,0.0028135668822590883,15
  2107. permettant,164,0.0028135668822590883,10
  2108. python,164,0.0028135668822590883,6
  2109. convolutional_network,164,0.0028135668822590883,21
  2110. degradation,164,0.0028135668822590883,11
  2111. dialectal,164,0.0028135668822590883,9
  2112. question_answer,164,0.0028135668822590883,15
  2113. typological,164,0.0028135668822590883,11
  2114. preliminary_experiment,164,0.0028135668822590883,22
  2115. innovation,164,0.0028135668822590883,10
  2116. relevant_information,163,0.002796410986635557,20
  2117. statistical_approach,163,0.002796410986635557,20
  2118. conversational_agent,163,0.002796410986635557,20
  2119. century,163,0.002796410986635557,7
  2120. objective_function,163,0.002796410986635557,18
  2121. linguistic_structure,163,0.002796410986635557,20
  2122. polysemy,163,0.002796410986635557,8
  2123. pseudo,163,0.002796410986635557,6
  2124. naive_bayes,163,0.002796410986635557,11
  2125. multi_hop,163,0.002796410986635557,9
  2126. theme,163,0.002796410986635557,5
  2127. law,162,0.0027792550910120265,3
  2128. simulated,162,0.0027792550910120265,9
  2129. weighting,162,0.0027792550910120265,9
  2130. latency,162,0.0027792550910120265,7
  2131. enable,162,0.0027792550910120265,6
  2132. franccais,162,0.0027792550910120265,9
  2133. extensible,162,0.0027792550910120265,10
  2134. first_attempt,162,0.0027792550910120265,13
  2135. mathematical,162,0.0027792550910120265,12
  2136. parole,162,0.0027792550910120265,6
  2137. difficult_task,162,0.0027792550910120265,14
  2138. hidden_markov_model,162,0.0027792550910120265,19
  2139. phrase_based_translation,162,0.0027792550910120265,24
  2140. sparseness,161,0.0027620991953884954,10
  2141. net,161,0.0027620991953884954,3
  2142. linguistique,161,0.0027620991953884954,12
  2143. ibm,161,0.0027620991953884954,3
  2144. innovative,161,0.0027620991953884954,10
  2145. multi_class,161,0.0027620991953884954,11
  2146. premier,161,0.0027620991953884954,7
  2147. glue,161,0.0027620991953884954,4
  2148. attractive,161,0.0027620991953884954,10
  2149. ranked,161,0.0027620991953884954,6
  2150. fake,160,0.0027449432997649643,4
  2151. ml,160,0.0027449432997649643,2
  2152. contains,160,0.0027449432997649643,8
  2153. modern_standard,160,0.0027449432997649643,15
  2154. everyday,160,0.0027449432997649643,8
  2155. automatiquement,160,0.0027449432997649643,15
  2156. finite_state_transducer,160,0.0027449432997649643,23
  2157. useful_information,160,0.0027449432997649643,18
  2158. edition,160,0.0027449432997649643,7
  2159. particle,160,0.0027449432997649643,8
  2160. dynamic_programming,160,0.0027449432997649643,19
  2161. black_box,159,0.002727787404141433,9
  2162. sts,159,0.002727787404141433,3
  2163. related_language,159,0.002727787404141433,16
  2164. bilstm,159,0.002727787404141433,6
  2165. varies,159,0.002727787404141433,6
  2166. email,159,0.002727787404141433,5
  2167. tf_idf,159,0.002727787404141433,6
  2168. consensus,159,0.002727787404141433,9
  2169. incorporation,159,0.002727787404141433,13
  2170. batch,159,0.002727787404141433,5
  2171. hpsg,159,0.002727787404141433,4
  2172. finetuning,158,0.002710631508517902,10
  2173. automatic_translation,158,0.002710631508517902,21
  2174. bi_directional,158,0.002710631508517902,14
  2175. latent_dirichlet,158,0.002710631508517902,16
  2176. structural_information,158,0.002710631508517902,22
  2177. scalability,158,0.002710631508517902,11
  2178. wide_coverage,158,0.002710631508517902,13
  2179. general_domain,158,0.002710631508517902,14
  2180. intensive,158,0.002710631508517902,9
  2181. facebook,157,0.002693475612894371,8
  2182. recherche,157,0.002693475612894371,9
  2183. subtle,157,0.002693475612894371,6
  2184. automatic_generation,157,0.002693475612894371,20
  2185. scientific_paper,157,0.002693475612894371,16
  2186. minority,157,0.002693475612894371,8
  2187. pre_trained_word,157,0.002693475612894371,16
  2188. letter,157,0.002693475612894371,6
  2189. main_contribution,157,0.002693475612894371,17
  2190. compare,157,0.002693475612894371,7
  2191. e_commerce,157,0.002693475612894371,10
  2192. mwe,157,0.002693475612894371,3
  2193. decrease,156,0.0026763197172708403,8
  2194. characterization,156,0.0026763197172708403,16
  2195. plain,156,0.0026763197172708403,5
  2196. satisfaction,156,0.0026763197172708403,12
  2197. automaton,156,0.0026763197172708403,9
  2198. afin,156,0.0026763197172708403,4
  2199. external_resource,156,0.0026763197172708403,17
  2200. ad,156,0.0026763197172708403,2
  2201. simple_method,156,0.0026763197172708403,13
  2202. archive,156,0.0026763197172708403,7
  2203. experimentation,155,0.002659163821647309,15
  2204. preparation,155,0.002659163821647309,11
  2205. lemmatization,155,0.002659163821647309,13
  2206. exploratory,155,0.002659163821647309,11
  2207. n_gram_language,155,0.002659163821647309,15
  2208. elmo,155,0.002659163821647309,4
  2209. preservation,155,0.002659163821647309,12
  2210. look,155,0.002659163821647309,4
  2211. bag,155,0.002659163821647309,3
  2212. standardized,155,0.002659163821647309,12
  2213. linguistic_data,155,0.002659163821647309,15
  2214. prevalent,155,0.002659163821647309,9
  2215. careful,154,0.002642007926023778,7
  2216. thread,154,0.002642007926023778,6
  2217. thematic,154,0.002642007926023778,8
  2218. re_ranking,154,0.002642007926023778,10
  2219. humanity,154,0.002642007926023778,8
  2220. new_data,154,0.002642007926023778,8
  2221. peuvent,154,0.002642007926023778,7
  2222. hierarchical_structure,154,0.002642007926023778,22
  2223. trainable,154,0.002642007926023778,9
  2224. latent_dirichlet_allocation,154,0.002642007926023778,27
  2225. higher_level,154,0.002642007926023778,12
  2226. vers,154,0.002642007926023778,4
  2227. attitude,153,0.002624852030400247,8
  2228. biological,153,0.002624852030400247,10
  2229. comparative_study,153,0.002624852030400247,17
  2230. exhibit,153,0.002624852030400247,7
  2231. english_french,153,0.002624852030400247,14
  2232. abundant,153,0.002624852030400247,8
  2233. strict,153,0.002624852030400247,6
  2234. auxiliary_task,153,0.002624852030400247,14
  2235. chunking,153,0.002624852030400247,8
  2236. temporal_information,152,0.002607696134776716,20
  2237. identical,152,0.002607696134776716,9
  2238. effective_approach,152,0.002607696134776716,18
  2239. nave,152,0.002607696134776716,4
  2240. shorter,152,0.002607696134776716,7
  2241. independence,152,0.002607696134776716,12
  2242. different_kind,152,0.002607696134776716,14
  2243. chinese_character,152,0.002607696134776716,17
  2244. closer,152,0.002607696134776716,6
  2245. oov,151,0.002590540239153185,3
  2246. consumer,151,0.002590540239153185,8
  2247. aspect_based,151,0.002590540239153185,12
  2248. consists,151,0.002590540239153185,8
  2249. cross_linguistic,151,0.002590540239153185,16
  2250. d'information,151,0.002590540239153185,13
  2251. clinical_text,151,0.002590540239153185,13
  2252. simplified,151,0.002590540239153185,10
  2253. common_sense,151,0.002590540239153185,12
  2254. squad,151,0.002590540239153185,5
  2255. montrent,151,0.002590540239153185,8
  2256. privacy,151,0.002590540239153185,7
  2257. intended,151,0.002590540239153185,8
  2258. son,151,0.002590540239153185,3
  2259. explainable,151,0.002590540239153185,11
  2260. other_domain,151,0.002590540239153185,12
  2261. rest,151,0.002590540239153185,4
  2262. current_approach,151,0.002590540239153185,16
  2263. microsoft,150,0.002573384343529654,9
  2264. semantic_class,150,0.002573384343529654,14
  2265. sharing,150,0.002573384343529654,7
  2266. repetition,150,0.002573384343529654,10
  2267. lab,150,0.002573384343529654,3
  2268. predicate_argument_structure,150,0.002573384343529654,28
  2269. worker,150,0.002573384343529654,6
  2270. boost,150,0.002573384343529654,5
  2271. correlate,150,0.002573384343529654,9
  2272. crowd,150,0.002573384343529654,5
  2273. first_order,150,0.002573384343529654,11
  2274. insertion,149,0.002556228447906123,9
  2275. examination,149,0.002556228447906123,11
  2276. detector,149,0.002556228447906123,8
  2277. automatic_method,149,0.002556228447906123,16
  2278. social_medium_text,149,0.002556228447906123,18
  2279. existing,149,0.002556228447906123,8
  2280. selectional,149,0.002556228447906123,11
  2281. distributional_similarity,149,0.002556228447906123,25
  2282. better_understanding,149,0.002556228447906123,20
  2283. ubiquitous,149,0.002556228447906123,10
  2284. trs,149,0.002556228447906123,3
  2285. generate,148,0.002539072552282592,8
  2286. non_english,148,0.002539072552282592,11
  2287. constant,148,0.002539072552282592,8
  2288. woman,148,0.002539072552282592,5
  2289. developed,148,0.002539072552282592,9
  2290. identifies,148,0.002539072552282592,10
  2291. multi_level,148,0.002539072552282592,11
  2292. convergence,148,0.002539072552282592,11
  2293. slow,148,0.002539072552282592,4
  2294. modern_standard_arabic,147,0.002521916656659061,22
  2295. advancement,147,0.002521916656659061,11
  2296. abbreviation,147,0.002521916656659061,12
  2297. reprsentation,147,0.002521916656659061,13
  2298. wer,147,0.002521916656659061,3
  2299. semantic_dependency,147,0.002521916656659061,19
  2300. new_word,147,0.002521916656659061,8
  2301. orientation,147,0.002521916656659061,11
  2302. non_standard,147,0.002521916656659061,12
  2303. cognate,147,0.002521916656659061,7
  2304. unable,147,0.002521916656659061,6
  2305. abusive,147,0.002521916656659061,7
  2306. non_trivial,147,0.002521916656659061,11
  2307. factorization,146,0.0025047607610355297,13
  2308. chart,146,0.0025047607610355297,5
  2309. psychology,146,0.0025047607610355297,10
  2310. party,146,0.0025047607610355297,5
  2311. erroneous,146,0.0025047607610355297,9
  2312. enrichment,146,0.0025047607610355297,10
  2313. rationale,146,0.0025047607610355297,9
  2314. une_mthode,146,0.0025047607610355297,10
  2315. valuation,146,0.0025047607610355297,9
  2316. concise,146,0.0025047607610355297,7
  2317. diffrentes,146,0.0025047607610355297,10
  2318. context_sensitive,146,0.0025047607610355297,17
  2319. humor,145,0.002487604865411999,5
  2320. phrase_based_machine,145,0.002487604865411999,20
  2321. neural_approach,145,0.002487604865411999,15
  2322. multiple_choice,145,0.002487604865411999,15
  2323. multilingual_bert,145,0.002487604865411999,17
  2324. web_search,145,0.002487604865411999,10
  2325. human_annotated,145,0.002487604865411999,15
  2326. network_based,145,0.002487604865411999,13
  2327. indirect,145,0.002487604865411999,8
  2328. mais,145,0.002487604865411999,4
  2329. human_translation,145,0.002487604865411999,17
  2330. unrestricted,145,0.002487604865411999,12
  2331. gloss,145,0.002487604865411999,5
  2332. top_down,144,0.002470448969788468,8
  2333. sentential,144,0.002470448969788468,10
  2334. gpt_2,144,0.002470448969788468,5
  2335. awareness,144,0.002470448969788468,9
  2336. tm,144,0.002470448969788468,2
  2337. lecture,144,0.002470448969788468,7
  2338. effective_way,144,0.002470448969788468,13
  2339. automatic_classification,144,0.002470448969788468,24
  2340. long_range,144,0.002470448969788468,10
  2341. modles,144,0.002470448969788468,6
  2342. half,144,0.002470448969788468,4
  2343. nearest,143,0.002453293074164937,7
  2344. domainspecific,143,0.002453293074164937,14
  2345. latin,143,0.002453293074164937,5
  2346. phrase_based_machine_translation,143,0.002453293074164937,32
  2347. curriculum,143,0.002453293074164937,10
  2348. st,143,0.002453293074164937,2
  2349. tal,143,0.002453293074164937,3
  2350. manager,143,0.002453293074164937,7
  2351. higher_accuracy,143,0.002453293074164937,15
  2352. langage,143,0.002453293074164937,7
  2353. statistical_mt,143,0.002453293074164937,14
  2354. assistance,143,0.002453293074164937,10
  2355. adjacent,142,0.0024361371785414057,8
  2356. start,142,0.0024361371785414057,5
  2357. other_method,142,0.0024361371785414057,12
  2358. gesture,142,0.0024361371785414057,7
  2359. plusieurs,142,0.0024361371785414057,9
  2360. extreme,142,0.0024361371785414057,7
  2361. dtection,142,0.0024361371785414057,8
  2362. morpho_syntactic,142,0.0024361371785414057,16
  2363. code_switching,142,0.0024361371785414057,14
  2364. eye,142,0.0024361371785414057,3
  2365. text_to_speech,142,0.0024361371785414057,14
  2366. formula,141,0.0024189812829178746,7
  2367. n_gram_language_model,141,0.0024189812829178746,21
  2368. probable,141,0.0024189812829178746,8
  2369. idiom,141,0.0024189812829178746,5
  2370. present_paper,141,0.0024189812829178746,13
  2371. _the,140,0.0024018253872943435,4
  2372. si,140,0.0024018253872943435,2
  2373. personalized,140,0.0024018253872943435,12
  2374. grammaticality,140,0.0024018253872943435,14
  2375. partner,140,0.0024018253872943435,7
  2376. automatic_text,140,0.0024018253872943435,14
  2377. balanced,140,0.0024018253872943435,8
  2378. such_data,140,0.0024018253872943435,9
  2379. symptom,140,0.0024018253872943435,7
  2380. additional_information,140,0.0024018253872943435,22
  2381. greek,140,0.0024018253872943435,5
  2382. tense,140,0.0024018253872943435,5
  2383. automatic_evaluation_metric,140,0.0024018253872943435,27
  2384. varied,140,0.0024018253872943435,6
  2385. reconnaissance,140,0.0024018253872943435,14
  2386. much_attention,140,0.0024018253872943435,14
  2387. understood,139,0.002384669491670813,10
  2388. english_word,139,0.002384669491670813,12
  2389. teaching,139,0.002384669491670813,8
  2390. identifying,139,0.002384669491670813,11
  2391. rapport,139,0.002384669491670813,7
  2392. proof,139,0.002384669491670813,5
  2393. perceptual,139,0.002384669491670813,10
  2394. healthcare,139,0.002384669491670813,10
  2395. computational_cost,139,0.002384669491670813,18
  2396. balance,139,0.002384669491670813,7
  2397. distributional_model,139,0.002384669491670813,20
  2398. inflected,139,0.002384669491670813,9
  2399. mental_health,139,0.002384669491670813,13
  2400. custom,139,0.002384669491670813,6
  2401. systmes,138,0.0023675135960472818,7
  2402. trivial,138,0.0023675135960472818,7
  2403. prefix,138,0.0023675135960472818,6
  2404. fair,138,0.0023675135960472818,4
  2405. trec,138,0.0023675135960472818,4
  2406. svms,138,0.0023675135960472818,4
  2407. usable,138,0.0023675135960472818,6
  2408. fit,138,0.0023675135960472818,3
  2409. pcfg,138,0.0023675135960472818,4
  2410. further_analysis,138,0.0023675135960472818,16
  2411. stability,138,0.0023675135960472818,9
  2412. rhetorical_structure,138,0.0023675135960472818,20
  2413. vanilla,138,0.0023675135960472818,7
  2414. stem,138,0.0023675135960472818,4
  2415. devlin,138,0.0023675135960472818,6
  2416. listener,138,0.0023675135960472818,8
  2417. copy,137,0.0023503577004237507,4
  2418. unstructured_text,137,0.0023503577004237507,17
  2419. fraction,137,0.0023503577004237507,8
  2420. utilise,137,0.0023503577004237507,7
  2421. romanian,137,0.0023503577004237507,8
  2422. medical_domain,137,0.0023503577004237507,14
  2423. oral,137,0.0023503577004237507,4
  2424. street,137,0.0023503577004237507,6
  2425. captioning,137,0.0023503577004237507,10
  2426. brazilian,137,0.0023503577004237507,9
  2427. city,137,0.0023503577004237507,4
  2428. other_word,137,0.0023503577004237507,10
  2429. main_challenge,137,0.0023503577004237507,14
  2430. distributed_representation,137,0.0023503577004237507,26
  2431. rule_based_system,137,0.0023503577004237507,17
  2432. chinese_language,137,0.0023503577004237507,16
  2433. learn,137,0.0023503577004237507,5
  2434. previous_model,136,0.0023332018048002195,14
  2435. different_source,136,0.0023332018048002195,16
  2436. text_simplification,136,0.0023332018048002195,19
  2437. complicated,136,0.0023332018048002195,11
  2438. authorship,136,0.0023332018048002195,10
  2439. opposite,136,0.0023332018048002195,8
  2440. morphological_feature,136,0.0023332018048002195,21
  2441. reviewer,136,0.0023332018048002195,8
  2442. extrinsic_evaluation,136,0.0023332018048002195,20
  2443. spoken_language_translation,136,0.0023332018048002195,27
  2444. origin,136,0.0023332018048002195,6
  2445. semantic_relationship,136,0.0023332018048002195,21
  2446. english_chinese,136,0.0023332018048002195,15
  2447. sa,136,0.0023332018048002195,2
  2448. chinese_text,136,0.0023332018048002195,12
  2449. significant_gain,136,0.0023332018048002195,16
  2450. combinatory,135,0.0023160459091766884,11
  2451. disfluency,135,0.0023160459091766884,10
  2452. nlp_research,135,0.0023160459091766884,12
  2453. pure,135,0.0023160459091766884,4
  2454. similar_language,135,0.0023160459091766884,16
  2455. scientist,135,0.0023160459091766884,9
  2456. box,135,0.0023160459091766884,3
  2457. alternation,135,0.0023160459091766884,11
  2458. prone,135,0.0023160459091766884,5
  2459. novel_model,135,0.0023160459091766884,11
  2460. severe,135,0.0023160459091766884,6
  2461. related_task,134,0.0022988900135531573,12
  2462. spurious,134,0.0022988900135531573,8
  2463. european_language,134,0.0022988900135531573,17
  2464. orthography,134,0.0022988900135531573,11
  2465. grounded,134,0.0022988900135531573,8
  2466. behavioral,134,0.0022988900135531573,10
  2467. ca,134,0.0022988900135531573,2
  2468. required,134,0.0022988900135531573,8
  2469. strong_performance,134,0.0022988900135531573,18
  2470. social_science,134,0.0022988900135531573,14
  2471. derivational,134,0.0022988900135531573,12
  2472. bitext,134,0.0022988900135531573,6
  2473. anaphoric,134,0.0022988900135531573,9
  2474. novel_task,134,0.0022988900135531573,10
  2475. restricted,134,0.0022988900135531573,10
  2476. english_sentence,134,0.0022988900135531573,16
  2477. vietnamese,134,0.0022988900135531573,10
  2478. polysemous,134,0.0022988900135531573,10
  2479. medicine,134,0.0022988900135531573,8
  2480. anaphora_resolution,133,0.0022817341179296267,19
  2481. responsible,133,0.0022817341179296267,11
  2482. initialization,133,0.0022817341179296267,14
  2483. several_baseline,133,0.0022817341179296267,16
  2484. transcribed,133,0.0022817341179296267,11
  2485. checking,133,0.0022817341179296267,8
  2486. human_human,133,0.0022817341179296267,11
  2487. culture,133,0.0022817341179296267,7
  2488. proposed,133,0.0022817341179296267,8
  2489. harder,133,0.0022817341179296267,6
  2490. tches,133,0.0022817341179296267,5
  2491. viewpoint,133,0.0022817341179296267,9
  2492. first_stage,133,0.0022817341179296267,11
  2493. bengali,132,0.0022645782223060956,7
  2494. quantifier,132,0.0022645782223060956,10
  2495. human_judge,132,0.0022645782223060956,11
  2496. lexicale,132,0.0022645782223060956,8
  2497. ensemble_model,132,0.0022645782223060956,14
  2498. cohesion,132,0.0022645782223060956,8
  2499. interview,132,0.0022645782223060956,9
  2500. last_year,132,0.0022645782223060956,9
  2501. propbank,132,0.0022645782223060956,8
  2502. spontaneous_speech,132,0.0022645782223060956,18
  2503. acoustic_model,132,0.0022645782223060956,14
  2504. informativeness,132,0.0022645782223060956,15
  2505. few_year,131,0.0022474223266825645,8
  2506. industrial,131,0.0022474223266825645,10
  2507. refers,131,0.0022474223266825645,6
  2508. cooccurrence,131,0.0022474223266825645,12
  2509. cell,131,0.0022474223266825645,4
  2510. keyphrase,131,0.0022474223266825645,9
  2511. modest,131,0.0022474223266825645,6
  2512. brown,131,0.0022474223266825645,5
  2513. d'apprentissage,131,0.0022474223266825645,15
  2514. human_translator,131,0.0022474223266825645,16
  2515. chance,131,0.0022474223266825645,6
  2516. adult,131,0.0022474223266825645,5
  2517. tone,131,0.0022474223266825645,4
  2518. offer,130,0.0022302664310590334,5
  2519. example_based,130,0.0022302664310590334,13
  2520. obvious,130,0.0022302664310590334,7
  2521. individual_word,130,0.0022302664310590334,15
  2522. discriminator,130,0.0022302664310590334,13
  2523. absolute_improvement,130,0.0022302664310590334,20
  2524. handling,130,0.0022302664310590334,8
  2525. wall,130,0.0022302664310590334,4
  2526. principal,130,0.0022302664310590334,9
  2527. imbalance,130,0.0022302664310590334,9
  2528. autoregressive,130,0.0022302664310590334,14
  2529. concatenation,130,0.0022302664310590334,13
  2530. other_type,130,0.0022302664310590334,10
  2531. positional,130,0.0022302664310590334,10
  2532. french_english,130,0.0022302664310590334,14
  2533. lesson,130,0.0022302664310590334,6
  2534. valence,130,0.0022302664310590334,7
  2535. cat,129,0.0022131105354355023,3
  2536. proxy,129,0.0022131105354355023,5
  2537. markup,129,0.0022131105354355023,6
  2538. face,129,0.0022131105354355023,4
  2539. unified_framework,129,0.0022131105354355023,17
  2540. general_framework,129,0.0022131105354355023,17
  2541. edits,129,0.0022131105354355023,5
  2542. live,129,0.0022131105354355023,4
  2543. outperform,129,0.0022131105354355023,10
  2544. trigram,129,0.0022131105354355023,7
  2545. provider,128,0.0021959546398119716,8
  2546. consist,128,0.0021959546398119716,7
  2547. private,128,0.0021959546398119716,7
  2548. discus,128,0.0021959546398119716,6
  2549. latent_variable,128,0.0021959546398119716,15
  2550. arabic_english,128,0.0021959546398119716,14
  2551. aspect_based_sentiment,128,0.0021959546398119716,22
  2552. dcrivons,128,0.0021959546398119716,8
  2553. significant_difference,128,0.0021959546398119716,22
  2554. fuzzy,128,0.0021959546398119716,5
  2555. additional_feature,128,0.0021959546398119716,18
  2556. travel,128,0.0021959546398119716,6
  2557. dimensionality,128,0.0021959546398119716,14
  2558. wsj,128,0.0021959546398119716,3
  2559. diverse_set,128,0.0021959546398119716,11
  2560. beginning,128,0.0021959546398119716,9
  2561. supervised_model,127,0.0021787987441884405,16
  2562. pre_defined,127,0.0021787987441884405,11
  2563. secondary,127,0.0021787987441884405,9
  2564. lexical_unit,127,0.0021787987441884405,12
  2565. practical_application,127,0.0021787987441884405,21
  2566. adversarial_attack,127,0.0021787987441884405,18
  2567. multimedia,127,0.0021787987441884405,10
  2568. shape,127,0.0021787987441884405,5
  2569. log_linear_model,127,0.0021787987441884405,16
  2570. indicative,127,0.0021787987441884405,10
  2571. chaque,126,0.0021616428485649094,6
  2572. ngram,126,0.0021616428485649094,5
  2573. better_translation,126,0.0021616428485649094,18
  2574. multi_layer,126,0.0021616428485649094,11
  2575. temp,126,0.0021616428485649094,4
  2576. basque,126,0.0021616428485649094,6
  2577. unrelated,126,0.0021616428485649094,9
  2578. various_language,126,0.0021616428485649094,16
  2579. semantic_frame,126,0.0021616428485649094,14
  2580. multi_word_expression,126,0.0021616428485649094,21
  2581. broadcast,126,0.0021616428485649094,9
  2582. activation,126,0.0021616428485649094,10
  2583. necessity,126,0.0021616428485649094,9
  2584. approches,126,0.0021616428485649094,9
  2585. hope,126,0.0021616428485649094,4
  2586. motivated,126,0.0021616428485649094,9
  2587. n_gram_model,126,0.0021616428485649094,12
  2588. un_systme,125,0.0021444869529413783,9
  2589. little_attention,125,0.0021444869529413783,16
  2590. expriences,125,0.0021444869529413783,10
  2591. adverse,125,0.0021444869529413783,7
  2592. discipline,125,0.0021444869529413783,10
  2593. default,125,0.0021444869529413783,7
  2594. ambiguous_word,125,0.0021444869529413783,14
  2595. devlin_et,125,0.0021444869529413783,9
  2596. fait,125,0.0021444869529413783,4
  2597. unsupervised_word,125,0.0021444869529413783,17
  2598. l'extraction,125,0.0021444869529413783,12
  2599. weak_supervision,125,0.0021444869529413783,16
  2600. compilation,125,0.0021444869529413783,11
  2601. human_effort,125,0.0021444869529413783,12
  2602. automation,125,0.0021444869529413783,10
  2603. player,125,0.0021444869529413783,6
  2604. immediate,125,0.0021444869529413783,9
  2605. impossible,124,0.002127331057317847,10
  2606. public_datasets,124,0.002127331057317847,15
  2607. meteor,124,0.002127331057317847,6
  2608. computer_assisted,124,0.002127331057317847,17
  2609. dont,124,0.002127331057317847,4
  2610. package,124,0.002127331057317847,7
  2611. open_domain_question,124,0.002127331057317847,20
  2612. bakeoff,124,0.002127331057317847,7
  2613. bionlp,124,0.002127331057317847,6
  2614. single_sentence,124,0.002127331057317847,15
  2615. gene,124,0.002127331057317847,4
  2616. manipulation,124,0.002127331057317847,12
  2617. scientific_article,124,0.002127331057317847,18
  2618. devlin_et_al.,124,0.002127331057317847,13
  2619. average_precision,124,0.002127331057317847,17
  2620. provided,124,0.002127331057317847,8
  2621. mesure,124,0.002127331057317847,6
  2622. lexique,123,0.002110175161694316,7
  2623. context_dependent,123,0.002110175161694316,17
  2624. leverage,123,0.002110175161694316,8
  2625. selon,123,0.002110175161694316,5
  2626. large_datasets,123,0.002110175161694316,14
  2627. tagset,123,0.002110175161694316,6
  2628. nowadays,123,0.002110175161694316,8
  2629. intersection,123,0.002110175161694316,12
  2630. conflict,123,0.002110175161694316,8
  2631. middle,123,0.002110175161694316,6
  2632. cross_lingual_word,123,0.002110175161694316,18
  2633. spread,122,0.0020930192660707854,6
  2634. low_level,122,0.0020930192660707854,9
  2635. subtitle,122,0.0020930192660707854,8
  2636. minute,122,0.0020930192660707854,6
  2637. empirical_evidence,122,0.0020930192660707854,18
  2638. comparable_result,122,0.0020930192660707854,17
  2639. domain_independent,122,0.0020930192660707854,18
  2640. danish,122,0.0020930192660707854,6
  2641. linguistic_property,122,0.0020930192660707854,19
  2642. terminological,122,0.0020930192660707854,14
  2643. dependence,122,0.0020930192660707854,10
  2644. generalizability,122,0.0020930192660707854,16
  2645. etc,122,0.0020930192660707854,3
  2646. client,122,0.0020930192660707854,6
  2647. intrinsic_evaluation,122,0.0020930192660707854,20
  2648. segmenter,122,0.0020930192660707854,9
  2649. cascade,122,0.0020930192660707854,7
  2650. walk,122,0.0020930192660707854,4
  2651. coding,122,0.0020930192660707854,6
  2652. social_medium_data,122,0.0020930192660707854,18
  2653. such_information,122,0.0020930192660707854,16
  2654. full_text,122,0.0020930192660707854,9
  2655. exponential,122,0.0020930192660707854,11
  2656. lors,122,0.0020930192660707854,4
  2657. in_depth_analysis,121,0.0020758633704472543,17
  2658. surprising,121,0.0020758633704472543,10
  2659. cloze,121,0.0020758633704472543,5
  2660. microblog,121,0.0020758633704472543,9
  2661. tv,121,0.0020758633704472543,2
  2662. nmt_system,121,0.0020758633704472543,10
  2663. controllable,121,0.0020758633704472543,12
  2664. attentive,121,0.0020758633704472543,9
  2665. machine_learning,121,0.0020758633704472543,16
  2666. emergence,121,0.0020758633704472543,9
  2667. recovery,121,0.0020758633704472543,8
  2668. generates,121,0.0020758633704472543,9
  2669. backbone,121,0.0020758633704472543,8
  2670. unlabelled,121,0.0020758633704472543,10
  2671. something,121,0.0020758633704472543,9
  2672. computational_approach,121,0.0020758633704472543,22
  2673. processus,121,0.0020758633704472543,9
  2674. problme,121,0.0020758633704472543,7
  2675. bien,120,0.002058707474823723,4
  2676. fine_tune,120,0.002058707474823723,9
  2677. fasttext,120,0.002058707474823723,8
  2678. github,120,0.002058707474823723,6
  2679. quantification,120,0.002058707474823723,14
  2680. supervised_approach,120,0.002058707474823723,19
  2681. ontonotes,120,0.002058707474823723,9
  2682. d'analyse,120,0.002058707474823723,9
  2683. in_domain_data,120,0.002058707474823723,14
  2684. selectional_preference,120,0.002058707474823723,22
  2685. exhaustive,119,0.002041551579200192,10
  2686. united,119,0.002041551579200192,6
  2687. main_goal,119,0.002041551579200192,9
  2688. spectral,119,0.002041551579200192,8
  2689. institution,119,0.002041551579200192,11
  2690. simple_approach,119,0.002041551579200192,15
  2691. projet,119,0.002041551579200192,6
  2692. higher_quality,119,0.002041551579200192,14
  2693. multiple_source,119,0.002041551579200192,15
  2694. discriminative_model,119,0.002041551579200192,20
  2695. dimensional,119,0.002041551579200192,11
  2696. prosody,119,0.002041551579200192,7
  2697. arabic_language,119,0.002041551579200192,15
  2698. notable,119,0.002041551579200192,7
  2699. guide,119,0.002041551579200192,5
  2700. increased,119,0.002041551579200192,9
  2701. aspect_based_sentiment_analysis,119,0.002041551579200192,31
  2702. figurative,118,0.002024395683576661,10
  2703. scholar,118,0.002024395683576661,7
  2704. brain,118,0.002024395683576661,5
  2705. higher_order,118,0.002024395683576661,12
  2706. internship,118,0.002024395683576661,10
  2707. toxic,118,0.002024395683576661,5
  2708. syntaxiques,118,0.002024395683576661,11
  2709. diverse_language,118,0.002024395683576661,16
  2710. command,118,0.002024395683576661,7
  2711. hebrew,118,0.002024395683576661,6
  2712. salience,118,0.002024395683576661,8
  2713. other_approach,118,0.002024395683576661,14
  2714. trial,118,0.002024395683576661,5
  2715. labor,118,0.002024395683576661,5
  2716. unigram,118,0.002024395683576661,7
  2717. algorithmic,118,0.002024395683576661,11
  2718. pre_trained_transformer,118,0.002024395683576661,23
  2719. nous_dcrivons,117,0.00200723978795313,13
  2720. localization,117,0.00200723978795313,12
  2721. clinical_note,117,0.00200723978795313,13
  2722. suitability,117,0.00200723978795313,11
  2723. evaluator,117,0.00200723978795313,9
  2724. synonymy,117,0.00200723978795313,8
  2725. laboratory,117,0.00200723978795313,10
  2726. pas,117,0.00200723978795313,3
  2727. empirical_analysis,117,0.00200723978795313,18
  2728. bidirectional_encoder,117,0.00200723978795313,21
  2729. storage,117,0.00200723978795313,7
  2730. sum,117,0.00200723978795313,3
  2731. categorical,116,0.0019900838923295992,11
  2732. transparent,116,0.0019900838923295992,11
  2733. splitting,116,0.0019900838923295992,9
  2734. d'valuation,116,0.0019900838923295992,11
  2735. minor,116,0.0019900838923295992,5
  2736. premire,116,0.0019900838923295992,7
  2737. speedup,116,0.0019900838923295992,7
  2738. niveau,116,0.0019900838923295992,6
  2739. selective,116,0.0019900838923295992,9
  2740. agglutinative,116,0.0019900838923295992,13
  2741. deletion,116,0.0019900838923295992,8
  2742. maintenance,116,0.0019900838923295992,11
  2743. mask,116,0.0019900838923295992,4
  2744. coarse,116,0.0019900838923295992,6
  2745. accessibility,116,0.0019900838923295992,13
  2746. analytics,116,0.0019900838923295992,9
  2747. pointer,116,0.0019900838923295992,7
  2748. lexical_database,116,0.0019900838923295992,16
  2749. multilingual_language,116,0.0019900838923295992,21
  2750. n_best_list,116,0.0019900838923295992,11
  2751. held_out,116,0.0019900838923295992,8
  2752. determination,116,0.0019900838923295992,13
  2753. multi_turn,115,0.001972927996706068,10
  2754. quantitative_analysis,115,0.001972927996706068,21
  2755. bidirectional_encoder_representation,115,0.001972927996706068,36
  2756. under_resourced_language,115,0.001972927996706068,24
  2757. plms,115,0.001972927996706068,4
  2758. ba,115,0.001972927996706068,2
  2759. different_corpus,115,0.001972927996706068,16
  2760. familiar,115,0.001972927996706068,8
  2761. engagement,115,0.001972927996706068,10
  2762. spanish_english,115,0.001972927996706068,15
  2763. fonction,115,0.001972927996706068,8
  2764. single_document,115,0.001972927996706068,15
  2765. bulgarian,115,0.001972927996706068,9
  2766. morphological_segmentation,115,0.001972927996706068,26
  2767. highlight,115,0.001972927996706068,9
  2768. fake_news,115,0.001972927996706068,9
  2769. reality,115,0.001972927996706068,7
  2770. qe,115,0.001972927996706068,2
  2771. bilingual_word,115,0.001972927996706068,14
  2772. board,115,0.001972927996706068,5
  2773. holistic,115,0.001972927996706068,8
  2774. realworld,114,0.001955772101082537,9
  2775. meme,114,0.001955772101082537,4
  2776. visual_question,114,0.001955772101082537,15
  2777. utilizes,114,0.001955772101082537,8
  2778. methodological,114,0.001955772101082537,14
  2779. address,114,0.001955772101082537,7
  2780. facility,114,0.001955772101082537,8
  2781. recipe,114,0.001955772101082537,6
  2782. domain_adaptation,114,0.001955772101082537,17
  2783. most_case,114,0.001955772101082537,9
  2784. text_classification_task,114,0.001955772101082537,24
  2785. mainstream,114,0.001955772101082537,10
  2786. play,114,0.001955772101082537,4
  2787. stress,114,0.001955772101082537,6
  2788. distinctive,114,0.001955772101082537,11
  2789. mt_evaluation,114,0.001955772101082537,13
  2790. part_ofspeech,114,0.001955772101082537,13
  2791. encoderdecoder,114,0.001955772101082537,14
  2792. automatic_summarization,113,0.001938616205459006,23
  2793. part_of_speech_tag,113,0.001938616205459006,18
  2794. left,113,0.001938616205459006,4
  2795. limited_amount,113,0.001938616205459006,14
  2796. lexical_knowledge,113,0.001938616205459006,17
  2797. underspecified,113,0.001938616205459006,14
  2798. nested,113,0.001938616205459006,6
  2799. l'valuation,113,0.001938616205459006,11
  2800. typed,113,0.001938616205459006,5
  2801. rule_based_approach,113,0.001938616205459006,19
  2802. month,113,0.001938616205459006,5
  2803. human_computer,113,0.001938616205459006,14
  2804. car,113,0.001938616205459006,3
  2805. natural_language_question,113,0.001938616205459006,25
  2806. check,113,0.001938616205459006,5
  2807. available_data,113,0.001938616205459006,14
  2808. blind,113,0.001938616205459006,5
  2809. integral,113,0.001938616205459006,8
  2810. large_dataset,113,0.001938616205459006,13
  2811. additional_training,113,0.001938616205459006,19
  2812. large_scale_corpus,113,0.001938616205459006,18
  2813. normalized,112,0.001921460309835475,10
  2814. poetry,112,0.001921460309835475,6
  2815. java,112,0.001921460309835475,4
  2816. low_dimensional,112,0.001921460309835475,15
  2817. non_local,112,0.001921460309835475,9
  2818. pre_trained_word_embeddings,112,0.001921460309835475,27
  2819. contrastive_learning,112,0.001921460309835475,20
  2820. japanese_english,112,0.001921460309835475,16
  2821. affix,112,0.001921460309835475,5
  2822. summarizer,112,0.001921460309835475,10
  2823. linear_programming,112,0.001921460309835475,18
  2824. mark,112,0.001921460309835475,4
  2825. human_machine,112,0.001921460309835475,13
  2826. gazetteer,112,0.001921460309835475,9
  2827. maximization,111,0.001904304414211944,12
  2828. gec,111,0.001904304414211944,3
  2829. highquality,111,0.001904304414211944,11
  2830. music,111,0.001904304414211944,5
  2831. productive,111,0.001904304414211944,10
  2832. prcision,111,0.001904304414211944,8
  2833. microblogs,111,0.001904304414211944,10
  2834. depression,111,0.001904304414211944,10
  2835. msa,111,0.001904304414211944,3
  2836. lexical_sample,111,0.001904304414211944,14
  2837. broad_range,111,0.001904304414211944,11
  2838. textual_information,111,0.001904304414211944,19
  2839. visual_information,111,0.001904304414211944,18
  2840. job,111,0.001904304414211944,3
  2841. chinese_treebank,111,0.001904304414211944,16
  2842. rst,110,0.0018871485185884128,3
  2843. smart,110,0.0018871485185884128,5
  2844. lexicales,110,0.0018871485185884128,9
  2845. hybrid_model,110,0.0018871485185884128,12
  2846. graphical_model,110,0.0018871485185884128,15
  2847. key_idea,110,0.0018871485185884128,8
  2848. convention,110,0.0018871485185884128,10
  2849. expected,110,0.0018871485185884128,8
  2850. penalty,110,0.0018871485185884128,7
  2851. discontinuous,110,0.0018871485185884128,13
  2852. bidirectional_lstm,110,0.0018871485185884128,18
  2853. mme,110,0.0018871485185884128,3
  2854. ocr,110,0.0018871485185884128,3
  2855. pose,110,0.0018871485185884128,4
  2856. implement,110,0.0018871485185884128,9
  2857. labelled,110,0.0018871485185884128,8
  2858. multi_party,110,0.0018871485185884128,11
  2859. lexical_entry,110,0.0018871485185884128,13
  2860. triplet,110,0.0018871485185884128,7
  2861. merit,110,0.0018871485185884128,5
  2862. hungarian,110,0.0018871485185884128,9
  2863. interlocutor,110,0.0018871485185884128,12
  2864. tree_based,110,0.0018871485185884128,10
  2865. used,110,0.0018871485185884128,4
  2866. real_world_datasets,110,0.0018871485185884128,19
  2867. europarl,109,0.001869992622964882,8
  2868. unification,109,0.001869992622964882,11
  2869. summarisation,109,0.001869992622964882,13
  2870. syntactic_parser,109,0.001869992622964882,16
  2871. south,109,0.001869992622964882,5
  2872. agnostic,109,0.001869992622964882,8
  2873. uncertain,109,0.001869992622964882,9
  2874. usual,109,0.001869992622964882,5
  2875. build,109,0.001869992622964882,5
  2876. portal,109,0.001869992622964882,6
  2877. prototypical,109,0.001869992622964882,12
  2878. mrc,109,0.001869992622964882,3
  2879. key_component,109,0.001869992622964882,13
  2880. several_method,109,0.001869992622964882,14
  2881. utilization,109,0.001869992622964882,11
  2882. collective,109,0.001869992622964882,10
  2883. arabic_dialect,109,0.001869992622964882,14
  2884. linear_model,109,0.001869992622964882,12
  2885. upper_bound,109,0.001869992622964882,11
  2886. semantic_network,109,0.001869992622964882,16
  2887. overall_accuracy,109,0.001869992622964882,16
  2888. contextual_word,109,0.001869992622964882,15
  2889. termes,109,0.001869992622964882,6
  2890. chatbot,109,0.001869992622964882,7
  2891. syntactic_annotation,108,0.0018528367273413508,20
  2892. portable,108,0.0018528367273413508,8
  2893. masked_language_model,108,0.0018528367273413508,21
  2894. original_text,108,0.0018528367273413508,13
  2895. spoken_language_understanding,108,0.0018528367273413508,29
  2896. genetic,108,0.0018528367273413508,7
  2897. obtained,108,0.0018528367273413508,8
  2898. source_side,108,0.0018528367273413508,11
  2899. urdu,108,0.0018528367273413508,4
  2900. move,108,0.0018528367273413508,4
  2901. scientific_literature,108,0.0018528367273413508,21
  2902. anchor,108,0.0018528367273413508,6
  2903. viability,108,0.0018528367273413508,9
  2904. pour_le,108,0.0018528367273413508,7
  2905. new_framework,108,0.0018528367273413508,13
  2906. semantic_property,108,0.0018528367273413508,17
  2907. unsupervised_model,108,0.0018528367273413508,18
  2908. phrasebased,108,0.0018528367273413508,11
  2909. monitoring,108,0.0018528367273413508,10
  2910. glove,108,0.0018528367273413508,5
  2911. low_frequency,107,0.0018356808317178197,13
  2912. d'extraction,107,0.0018356808317178197,12
  2913. social_medium_post,107,0.0018356808317178197,18
  2914. rich_feature,107,0.0018356808317178197,12
  2915. alternative_approach,107,0.0018356808317178197,20
  2916. model_based,107,0.0018356808317178197,11
  2917. representational,107,0.0018356808317178197,16
  2918. reliance,107,0.0018356808317178197,8
  2919. making,107,0.0018356808317178197,6
  2920. ellipsis,107,0.0018356808317178197,8
  2921. specific_task,107,0.0018356808317178197,13
  2922. current_research,107,0.0018356808317178197,16
  2923. part_of_speech_tagger,107,0.0018356808317178197,21
  2924. contextual_feature,107,0.0018356808317178197,18
  2925. ordinary,107,0.0018356808317178197,8
  2926. represent,107,0.0018356808317178197,9
  2927. english_tweet,107,0.0018356808317178197,13
  2928. lexica,107,0.0018356808317178197,6
  2929. pour_la,107,0.0018356808317178197,7
  2930. traditional_approach,107,0.0018356808317178197,20
  2931. many_case,106,0.0018185249360942889,9
  2932. handcrafted,106,0.0018185249360942889,11
  2933. syntactic_tree,106,0.0018185249360942889,14
  2934. widely_used,106,0.0018185249360942889,11
  2935. editing,106,0.0018185249360942889,7
  2936. eu,106,0.0018185249360942889,2
  2937. bi_lstm,106,0.0018185249360942889,7
  2938. marginal,106,0.0018185249360942889,8
  2939. human_expert,106,0.0018185249360942889,12
  2940. nlp_tool,106,0.0018185249360942889,8
  2941. joint_learning,106,0.0018185249360942889,14
  2942. pool,106,0.0018185249360942889,4
  2943. other_task,106,0.0018185249360942889,10
  2944. wall_street,106,0.0018185249360942889,11
  2945. temporal_expression,106,0.0018185249360942889,19
  2946. working,106,0.0018185249360942889,7
  2947. execution,106,0.0018185249360942889,9
  2948. interoperability,106,0.0018185249360942889,16
  2949. aussi,106,0.0018185249360942889,5
  2950. sou,106,0.0018185249360942889,3
  2951. visual_feature,106,0.0018185249360942889,14
  2952. tree_structure,106,0.0018185249360942889,14
  2953. considers,106,0.0018185249360942889,9
  2954. ease,106,0.0018185249360942889,4
  2955. runtime,106,0.0018185249360942889,7
  2956. multi_head,106,0.0018185249360942889,10
  2957. parent,106,0.0018185249360942889,6
  2958. stock,106,0.0018185249360942889,5
  2959. spite,105,0.0018013690404707578,5
  2960. rl,105,0.0018013690404707578,2
  2961. phrase_based_system,105,0.0018013690404707578,19
  2962. locality,105,0.0018013690404707578,8
  2963. annotated_dataset,105,0.0018013690404707578,17
  2964. acceptability,105,0.0018013690404707578,13
  2965. rigorous,105,0.0018013690404707578,8
  2966. non_native_speaker,105,0.0018013690404707578,18
  2967. idiomatic,105,0.0018013690404707578,9
  2968. testbed,105,0.0018013690404707578,7
  2969. proximity,105,0.0018013690404707578,9
  2970. data_driven_approach,105,0.0018013690404707578,20
  2971. new_state,105,0.0018013690404707578,9
  2972. neighborhood,105,0.0018013690404707578,12
  2973. related_work,105,0.0018013690404707578,12
  2974. non_projective,105,0.0018013690404707578,14
  2975. ancient,105,0.0018013690404707578,7
  2976. aligner,105,0.0018013690404707578,7
  2977. quick,105,0.0018013690404707578,5
  2978. filling,105,0.0018013690404707578,7
  2979. end_toend,105,0.0018013690404707578,9
  2980. large_data,105,0.0018013690404707578,10
  2981. cnns,105,0.0018013690404707578,4
  2982. key_challenge,105,0.0018013690404707578,13
  2983. protein,105,0.0018013690404707578,7
  2984. sarcastic,105,0.0018013690404707578,9
  2985. chatbots,105,0.0018013690404707578,8
  2986. souvent,105,0.0018013690404707578,7
  2987. l1,105,0.0018013690404707578,2
  2988. first_result,105,0.0018013690404707578,12
  2989. display,104,0.0017842131448472266,7
  2990. server,104,0.0017842131448472266,6
  2991. creative_common,104,0.0017842131448472266,15
  2992. discourse_level,104,0.0017842131448472266,15
  2993. notamment,104,0.0017842131448472266,9
  2994. connaissances,104,0.0017842131448472266,13
  2995. timeline,104,0.0017842131448472266,8
  2996. first_step_towards,104,0.0017842131448472266,18
  2997. available_resource,104,0.0017842131448472266,18
  2998. zero,104,0.0017842131448472266,4
  2999. organisation,104,0.0017842131448472266,12
  3000. compatibility,104,0.0017842131448472266,13
  3001. moderate,104,0.0017842131448472266,8
  3002. adverb,104,0.0017842131448472266,6
  3003. text_to_text,104,0.0017842131448472266,12
  3004. english_data,104,0.0017842131448472266,12
  3005. generality,104,0.0017842131448472266,10
  3006. guarantee,104,0.0017842131448472266,9
  3007. similar_word,104,0.0017842131448472266,12
  3008. other_system,104,0.0017842131448472266,12
  3009. relevant_document,103,0.0017670572492236958,17
  3010. imbalanced,103,0.0017670572492236958,10
  3011. finegrained,103,0.0017670572492236958,11
  3012. plot,103,0.0017670572492236958,4
  3013. pandemic,103,0.0017670572492236958,8
  3014. motion,103,0.0017670572492236958,6
  3015. few_shot_learning,103,0.0017670572492236958,17
  3016. avenue,103,0.0017670572492236958,6
  3017. hidden_state,103,0.0017670572492236958,12
  3018. prepositional,103,0.0017670572492236958,13
  3019. multilingual_corpus,103,0.0017670572492236958,19
  3020. directed,103,0.0017670572492236958,8
  3021. removal,103,0.0017670572492236958,7
  3022. different_data,103,0.0017670572492236958,14
  3023. cross_modal,103,0.0017670572492236958,11
  3024. starting,103,0.0017670572492236958,8
  3025. text_representation,103,0.0017670572492236958,19
  3026. home,103,0.0017670572492236958,4
  3027. tt,103,0.0017670572492236958,2
  3028. tradition,103,0.0017670572492236958,9
  3029. bayesian_model,103,0.0017670572492236958,14
  3030. electronic_health,103,0.0017670572492236958,17
  3031. phonology,103,0.0017670572492236958,9
  3032. competence,103,0.0017670572492236958,10
  3033. contain,102,0.0017499013536001647,7
  3034. bridge,102,0.0017499013536001647,6
  3035. predict,102,0.0017499013536001647,7
  3036. inverse,102,0.0017499013536001647,7
  3037. computational_complexity,102,0.0017499013536001647,24
  3038. neural_network_language,102,0.0017499013536001647,23
  3039. electronic_health_record,102,0.0017499013536001647,24
  3040. correspond,102,0.0017499013536001647,10
  3041. estimator,102,0.0017499013536001647,9
  3042. iv,102,0.0017499013536001647,2
  3043. lexicon_based,102,0.0017499013536001647,13
  3044. cycle,102,0.0017499013536001647,5
  3045. heavy,102,0.0017499013536001647,5
  3046. double,102,0.0017499013536001647,6
  3047. union,102,0.0017499013536001647,5
  3048. moment,102,0.0017499013536001647,6
  3049. convenient,102,0.0017499013536001647,10
  3050. thesis,102,0.0017499013536001647,6
  3051. meta_learning,102,0.0017499013536001647,13
  3052. multi_source,102,0.0017499013536001647,12
  3053. statistical_language,102,0.0017499013536001647,20
  3054. statistical_analysis,102,0.0017499013536001647,20
  3055. smoothing,102,0.0017499013536001647,9
  3056. lexical_substitution,102,0.0017499013536001647,20
  3057. sans,102,0.0017499013536001647,4
  3058. syntactic_pattern,102,0.0017499013536001647,17
  3059. particulier,102,0.0017499013536001647,11
  3060. semisupervised,102,0.0017499013536001647,14
  3061. tagged,102,0.0017499013536001647,6
  3062. large_language,102,0.0017499013536001647,14
  3063. une_tche,101,0.0017327454579766338,8
  3064. skip_gram,101,0.0017327454579766338,9
  3065. singular,101,0.0017327454579766338,8
  3066. readable,101,0.0017327454579766338,8
  3067. enormous,101,0.0017327454579766338,8
  3068. keyphrases,101,0.0017327454579766338,10
  3069. nous_intressons,101,0.0017327454579766338,15
  3070. small_corpus,101,0.0017327454579766338,12
  3071. translate,101,0.0017327454579766338,9
  3072. gate,101,0.0017327454579766338,4
  3073. data_to_text,101,0.0017327454579766338,12
  3074. new_type,101,0.0017327454579766338,8
  3075. artifact,101,0.0017327454579766338,8
  3076. backtranslation,101,0.0017327454579766338,15
  3077. multi_label_classification,101,0.0017327454579766338,26
  3078. new_algorithm,101,0.0017327454579766338,13
  3079. interval,101,0.0017327454579766338,8
  3080. forme,101,0.0017327454579766338,5
  3081. tensor,101,0.0017327454579766338,6
  3082. intressons,101,0.0017327454579766338,10
  3083. text_categorization,101,0.0017327454579766338,19
  3084. reproducibility,101,0.0017327454579766338,15
  3085. crucial_role,101,0.0017327454579766338,12
  3086. english_corpus,101,0.0017327454579766338,14
  3087. female,101,0.0017327454579766338,6
  3088. endto_end,101,0.0017327454579766338,9
  3089. causality,101,0.0017327454579766338,9
  3090. array,101,0.0017327454579766338,5
  3091. automatic_annotation,101,0.0017327454579766338,20
  3092. gated,101,0.0017327454579766338,5
  3093. tree_kernel,101,0.0017327454579766338,11
  3094. id,101,0.0017327454579766338,2
  3095. fundamental_task,101,0.0017327454579766338,16
  3096. various_task,100,0.0017155895623531027,12
  3097. best_practice,100,0.0017155895623531027,13
  3098. curve,100,0.0017155895623531027,5
  3099. complex_task,100,0.0017155895623531027,12
  3100. open_information,100,0.0017155895623531027,16
  3101. correct_answer,100,0.0017155895623531027,14
  3102. well_formed,100,0.0017155895623531027,11
  3103. enables,100,0.0017155895623531027,7
  3104. contextual_embeddings,100,0.0017155895623531027,21
  3105. peu,100,0.0017155895623531027,3
  3106. ensemble_method,100,0.0017155895623531027,15
  3107. extensive_evaluation,100,0.0017155895623531027,20
  3108. task_oriented_dialogue_system,100,0.0017155895623531027,29
  3109. unreliable,100,0.0017155895623531027,10
  3110. open_data,100,0.0017155895623531027,9
  3111. princeton,100,0.0017155895623531027,9
  3112. reverse,100,0.0017155895623531027,7
  3113. tant,100,0.0017155895623531027,4
  3114. sentencelevel,100,0.0017155895623531027,13
  3115. exists,100,0.0017155895623531027,6
  3116. other_model,100,0.0017155895623531027,11
  3117. traditional_method,100,0.0017155895623531027,18
  3118. mass,100,0.0017155895623531027,4
  3119. register,100,0.0017155895623531027,8
  3120. bert_model,99,0.0016984336667295716,10
  3121. factoid,99,0.0016984336667295716,7
  3122. centre,99,0.0016984336667295716,6
  3123. semantic_change,99,0.0016984336667295716,15
  3124. important_step,99,0.0016984336667295716,14
  3125. textual_feature,99,0.0016984336667295716,15
  3126. store,99,0.0016984336667295716,5
  3127. annotated_training,99,0.0016984336667295716,18
  3128. applied,99,0.0016984336667295716,7
  3129. exploit,99,0.0016984336667295716,7
  3130. smt_system,99,0.0016984336667295716,10
  3131. generated_text,99,0.0016984336667295716,14
  3132. textual_content,99,0.0016984336667295716,15
  3133. typing,99,0.0016984336667295716,6
  3134. unsupervised_manner,99,0.0016984336667295716,19
  3135. question_answer_pair,99,0.0016984336667295716,20
  3136. introduces,99,0.0016984336667295716,10
  3137. viterbi,99,0.0016984336667295716,7
  3138. agency,99,0.0016984336667295716,6
  3139. checker,99,0.0016984336667295716,7
  3140. spoken_dialog,99,0.0016984336667295716,13
  3141. important_information,99,0.0016984336667295716,21
  3142. state_of_art,99,0.0016984336667295716,12
  3143. plausibility,99,0.0016984336667295716,12
  3144. exposure,99,0.0016984336667295716,8
  3145. lexicographic,99,0.0016984336667295716,13
  3146. india,99,0.0016984336667295716,5
  3147. u.s.,99,0.0016984336667295716,4
  3148. cl,99,0.0016984336667295716,2
  3149. complex_word,98,0.0016812777711060407,12
  3150. open_information_extraction,98,0.0016812777711060407,27
  3151. deep_learning_method,98,0.0016812777711060407,20
  3152. low_resource_scenario,98,0.0016812777711060407,21
  3153. subcategorization,98,0.0016812777711060407,17
  3154. trois,98,0.0016812777711060407,5
  3155. deficiency,98,0.0016812777711060407,10
  3156. informed,98,0.0016812777711060407,8
  3157. hindi_english,98,0.0016812777711060407,13
  3158. inner,98,0.0016812777711060407,5
  3159. statistique,98,0.0016812777711060407,11
  3160. structured_prediction,98,0.0016812777711060407,21
  3161. budget,98,0.0016812777711060407,6
  3162. retrieved,98,0.0016812777711060407,9
  3163. comparative_analysis,98,0.0016812777711060407,20
  3164. briefly,98,0.0016812777711060407,7
  3165. prerequisite,98,0.0016812777711060407,12
  3166. new_challenge,98,0.0016812777711060407,13
  3167. price,98,0.0016812777711060407,5
  3168. croatian,98,0.0016812777711060407,8
  3169. important_aspect,98,0.0016812777711060407,16
  3170. presented,98,0.0016812777711060407,9
  3171. small_scale,98,0.0016812777711060407,11
  3172. tuples,98,0.0016812777711060407,6
  3173. generalizable,98,0.0016812777711060407,13
  3174. prevalence,98,0.0016812777711060407,10
  3175. large_scale_dataset,98,0.0016812777711060407,19
  3176. important_part,98,0.0016812777711060407,14
  3177. declarative,98,0.0016812777711060407,11
  3178. rich_set,98,0.0016812777711060407,8
  3179. vulnerable,98,0.0016812777711060407,10
  3180. semantic_content,98,0.0016812777711060407,16
  3181. cependant,98,0.0016812777711060407,9
  3182. sentiment_classification,97,0.0016641218754825096,24
  3183. different_strategy,97,0.0016641218754825096,18
  3184. separation,97,0.0016641218754825096,10
  3185. transformer_based_language,97,0.0016641218754825096,26
  3186. aforementioned,97,0.0016641218754825096,14
  3187. stack,97,0.0016641218754825096,5
  3188. second_stage,97,0.0016641218754825096,12
  3189. lookup,97,0.0016641218754825096,6
  3190. more_data,97,0.0016641218754825096,9
  3191. large_language_model,97,0.0016641218754825096,20
  3192. different_context,97,0.0016641218754825096,17
  3193. food,97,0.0016641218754825096,4
  3194. non_linear,97,0.0016641218754825096,10
  3195. grammaires,97,0.0016641218754825096,10
  3196. focused,97,0.0016641218754825096,7
  3197. consiste,97,0.0016641218754825096,8
  3198. such_method,97,0.0016641218754825096,11
  3199. new_resource,97,0.0016641218754825096,12
  3200. ground_truth,97,0.0016641218754825096,12
  3201. burden,97,0.0016641218754825096,6
  3202. present_work,97,0.0016641218754825096,12
  3203. biased,97,0.0016641218754825096,6
  3204. nearest_neighbor,97,0.0016641218754825096,16
  3205. current_model,97,0.0016641218754825096,13
  3206. hashtags,97,0.0016641218754825096,8
  3207. black,96,0.0016469659798589785,5
  3208. present_experiment,96,0.0016469659798589785,18
  3209. user_generated_content,96,0.0016469659798589785,22
  3210. malayalam,96,0.0016469659798589785,9
  3211. reuse,96,0.0016469659798589785,5
  3212. grand,96,0.0016469659798589785,5
  3213. british,96,0.0016469659798589785,7
  3214. faithful,96,0.0016469659798589785,8
  3215. transformer_based_language_model,96,0.0016469659798589785,32
  3216. dropout,96,0.0016469659798589785,7
  3217. vice,96,0.0016469659798589785,4
  3218. isolated,96,0.0016469659798589785,8
  3219. percent,96,0.0016469659798589785,7
  3220. probe,96,0.0016469659798589785,5
  3221. high_degree,96,0.0016469659798589785,11
  3222. hyperparameters,96,0.0016469659798589785,15
  3223. stimulus,96,0.0016469659798589785,8
  3224. semeval_2015,96,0.0016469659798589785,12
  3225. chinese_english_translation,96,0.0016469659798589785,27
  3226. resource_poor,96,0.0016469659798589785,13
  3227. semantic_web,96,0.0016469659798589785,12
  3228. gaze,96,0.0016469659798589785,4
  3229. geographical,96,0.0016469659798589785,12
  3230. analyser,96,0.0016469659798589785,8
  3231. regime,96,0.0016469659798589785,6
  3232. recent_approach,96,0.0016469659798589785,15
  3233. partof_speech,96,0.0016469659798589785,13
  3234. tape,96,0.0016469659798589785,4
  3235. rare_word,96,0.0016469659798589785,9
  3236. professional_translator,96,0.0016469659798589785,23
  3237. offensive_language_identification,95,0.0016298100842354476,33
  3238. utilized,95,0.0016298100842354476,8
  3239. adversarial_example,95,0.0016298100842354476,19
  3240. taiwan,95,0.0016298100842354476,6
  3241. cloud,95,0.0016298100842354476,5
  3242. tradeoff,95,0.0016298100842354476,8
  3243. multiple_domain,95,0.0016298100842354476,15
  3244. f_scores,95,0.0016298100842354476,8
  3245. questionnaire,95,0.0016298100842354476,13
  3246. grid,95,0.0016298100842354476,4
  3247. l'objectif,95,0.0016298100842354476,10
  3248. bart,95,0.0016298100842354476,4
  3249. indispensable,95,0.0016298100842354476,13
  3250. atomic,95,0.0016298100842354476,6
  3251. first_place,95,0.0016298100842354476,11
  3252. nave_bayes,95,0.0016298100842354476,10
  3253. coordinate,95,0.0016298100842354476,10
  3254. filler,95,0.0016298100842354476,6
  3255. improved_performance,95,0.0016298100842354476,20
  3256. economic,95,0.0016298100842354476,8
  3257. trajectory,95,0.0016298100842354476,10
  3258. richness,95,0.0016298100842354476,8
  3259. future_direction,95,0.0016298100842354476,16
  3260. rfrence,95,0.0016298100842354476,7
  3261. *_work,95,0.0016298100842354476,6
  3262. preliminary_evaluation,95,0.0016298100842354476,22
  3263. portability,95,0.0016298100842354476,11
  3264. reduced,95,0.0016298100842354476,7
  3265. distortion,95,0.0016298100842354476,10
  3266. text_corpus,95,0.0016298100842354476,11
  3267. novel_feature,95,0.0016298100842354476,13
  3268. present_study,95,0.0016298100842354476,13
  3269. orthogonal,95,0.0016298100842354476,10
  3270. open_ended,95,0.0016298100842354476,10
  3271. semantic_resource,95,0.0016298100842354476,17
  3272. exception,95,0.0016298100842354476,9
  3273. norwegian,95,0.0016298100842354476,9
  3274. english_spanish,95,0.0016298100842354476,15
  3275. memory_based,95,0.0016298100842354476,12
  3276. adapted,95,0.0016298100842354476,7
  3277. surprise,95,0.0016298100842354476,8
  3278. asian_language,95,0.0016298100842354476,14
  3279. d'etection,95,0.0016298100842354476,10
  3280. speaking,95,0.0016298100842354476,8
  3281. cela,94,0.0016126541886119165,4
  3282. dveloppement,94,0.0016126541886119165,12
  3283. low_quality,94,0.0016126541886119165,11
  3284. thought,94,0.0016126541886119165,7
  3285. named_entity_recognition,94,0.0016126541886119165,24
  3286. semi_structured,94,0.0016126541886119165,15
  3287. differentiable,94,0.0016126541886119165,14
  3288. li,94,0.0016126541886119165,2
  3289. lexical_semantic,94,0.0016126541886119165,16
  3290. brazilian_portuguese,94,0.0016126541886119165,20
  3291. curation,94,0.0016126541886119165,8
  3292. inductive_bias,94,0.0016126541886119165,14
  3293. infrequent,94,0.0016126541886119165,10
  3294. naturalness,94,0.0016126541886119165,11
  3295. force,94,0.0016126541886119165,5
  3296. metaphorical,94,0.0016126541886119165,12
  3297. new_evaluation,94,0.0016126541886119165,14
  3298. operational,94,0.0016126541886119165,11
  3299. understanding_task,94,0.0016126541886119165,18
  3300. different_system,94,0.0016126541886119165,16
  3301. encouraging_result,94,0.0016126541886119165,18
  3302. neural_mt,94,0.0016126541886119165,9
  3303. slight,94,0.0016126541886119165,6
  3304. china,94,0.0016126541886119165,5
  3305. freebase,94,0.0016126541886119165,8
  3306. actor,94,0.0016126541886119165,5
  3307. irony,94,0.0016126541886119165,5
  3308. thai,94,0.0016126541886119165,4
  3309. unavailable,94,0.0016126541886119165,11
  3310. facet,94,0.0016126541886119165,5
  3311. bert_based_model,94,0.0016126541886119165,16
  3312. new_benchmark,94,0.0016126541886119165,13
  3313. left_to_right,93,0.0015954982929883854,13
  3314. rdf,93,0.0015954982929883854,3
  3315. softmax,93,0.0015954982929883854,7
  3316. ted,93,0.0015954982929883854,3
  3317. target_side,93,0.0015954982929883854,11
  3318. code_switched,93,0.0015954982929883854,13
  3319. pitch,93,0.0015954982929883854,5
  3320. such_resource,93,0.0015954982929883854,13
  3321. important_problem,93,0.0015954982929883854,17
  3322. semantic_interpretation,93,0.0015954982929883854,23
  3323. adaptable,93,0.0015954982929883854,9
  3324. clarification,93,0.0015954982929883854,13
  3325. latent_space,93,0.0015954982929883854,12
  3326. apr,93,0.0015954982929883854,3
  3327. unambiguous,93,0.0015954982929883854,11
  3328. biomedical_literature,93,0.0015954982929883854,21
  3329. binary_classifier,93,0.0015954982929883854,17
  3330. composite,93,0.0015954982929883854,9
  3331. t5,93,0.0015954982929883854,2
  3332. statistical_parser,93,0.0015954982929883854,18
  3333. harmful,93,0.0015954982929883854,7
  3334. accent,93,0.0015954982929883854,6
  3335. era,93,0.0015954982929883854,3
  3336. transferability,93,0.0015954982929883854,15
  3337. current_method,93,0.0015954982929883854,14
  3338. several_experiment,93,0.0015954982929883854,18
  3339. sort,93,0.0015954982929883854,4
  3340. speech_to_speech,92,0.0015783423973648545,16
  3341. inefficient,92,0.0015783423973648545,11
  3342. grade,92,0.0015783423973648545,5
  3343. color,92,0.0015783423973648545,5
  3344. ultimate,92,0.0015783423973648545,8
  3345. current_work,92,0.0015783423973648545,12
  3346. interpolation,92,0.0015783423973648545,13
  3347. cross_document,92,0.0015783423973648545,14
  3348. contact,92,0.0015783423973648545,7
  3349. cross_entropy,92,0.0015783423973648545,13
  3350. substitute,92,0.0015783423973648545,10
  3351. novel_way,92,0.0015783423973648545,9
  3352. various_feature,92,0.0015783423973648545,15
  3353. more_attention,92,0.0015783423973648545,14
  3354. second_order,92,0.0015783423973648545,12
  3355. submitted,92,0.0015783423973648545,9
  3356. natural_language_sentence,92,0.0015783423973648545,25
  3357. mi,92,0.0015783423973648545,2
  3358. several_approach,92,0.0015783423973648545,16
  3359. decision_making,92,0.0015783423973648545,15
  3360. implemented,92,0.0015783423973648545,11
  3361. travaux,91,0.0015611865017413234,7
  3362. englishgerman,91,0.0015611865017413234,13
  3363. male,91,0.0015611865017413234,4
  3364. rhetorical_structure_theory,91,0.0015611865017413234,27
  3365. l'apprentissage,91,0.0015611865017413234,15
  3366. umls,91,0.0015611865017413234,4
  3367. little_work,91,0.0015611865017413234,11
  3368. systeme,91,0.0015611865017413234,7
  3369. best_performing_model,91,0.0015611865017413234,21
  3370. first_approach,91,0.0015611865017413234,14
  3371. comparative_evaluation,91,0.0015611865017413234,22
  3372. great_success,91,0.0015611865017413234,13
  3373. mbert,91,0.0015611865017413234,5
  3374. parsed,91,0.0015611865017413234,6
  3375. discriminative_training,91,0.0015611865017413234,23
  3376. verbnet,91,0.0015611865017413234,7
  3377. indication,91,0.0015611865017413234,10
  3378. combinatorial,91,0.0015611865017413234,13
  3379. utilizing,91,0.0015611865017413234,9
  3380. available_datasets,91,0.0015611865017413234,18
  3381. linear_time,91,0.0015611865017413234,11
  3382. appropriateness,91,0.0015611865017413234,15
  3383. dramatic,91,0.0015611865017413234,8
  3384. detecting,91,0.0015611865017413234,9
  3385. dictionary_based,91,0.0015611865017413234,16
  3386. proper_name,91,0.0015611865017413234,11
  3387. rte,91,0.0015611865017413234,3
  3388. statistical_translation,90,0.0015440306061177923,23
  3389. sql,90,0.0015440306061177923,3
  3390. race,90,0.0015440306061177923,4
  3391. versa,90,0.0015440306061177923,5
  3392. counterfactual,90,0.0015440306061177923,14
  3393. bleu_score,90,0.0015440306061177923,10
  3394. morphological_information,90,0.0015440306061177923,25
  3395. hybrid_system,90,0.0015440306061177923,13
  3396. post_edited,90,0.0015440306061177923,11
  3397. content_selection,90,0.0015440306061177923,17
  3398. l'aide,90,0.0015440306061177923,6
  3399. geographic,90,0.0015440306061177923,10
  3400. important_component,90,0.0015440306061177923,19
  3401. real_world_application,90,0.0015440306061177923,22
  3402. permettent,90,0.0015440306061177923,10
  3403. geometric,90,0.0015440306061177923,9
  3404. embedding_based,90,0.0015440306061177923,15
  3405. sm,90,0.0015440306061177923,2
  3406. cheap,90,0.0015440306061177923,5
  3407. lfg,90,0.0015440306061177923,3
  3408. huge_amount,90,0.0015440306061177923,11
  3409. labeled_training,90,0.0015440306061177923,16
  3410. out_of_domain_data,90,0.0015440306061177923,18
  3411. same_language,90,0.0015440306061177923,13
  3412. dialect_identification,90,0.0015440306061177923,22
  3413. doctor,90,0.0015440306061177923,6
  3414. available_corpus,90,0.0015440306061177923,16
  3415. overhead,90,0.0015440306061177923,8
  3416. cognition,90,0.0015440306061177923,9
  3417. certaines,90,0.0015440306061177923,9
  3418. task_based,90,0.0015440306061177923,10
  3419. polynomial,90,0.0015440306061177923,10
  3420. semantic_type,90,0.0015440306061177923,13
  3421. architectural,90,0.0015440306061177923,13
  3422. scholarly,89,0.0015268747104942614,9
  3423. sighan,89,0.0015268747104942614,6
  3424. grammar_based,89,0.0015268747104942614,13
  3425. phrase_level,89,0.0015268747104942614,12
  3426. non_expert,89,0.0015268747104942614,10
  3427. novel_dataset,89,0.0015268747104942614,13
  3428. hypernymy,89,0.0015268747104942614,9
  3429. morphological_inflection,89,0.0015268747104942614,24
  3430. dravidian,89,0.0015268747104942614,9
  3431. propaganda,89,0.0015268747104942614,10
  3432. sport,89,0.0015268747104942614,5
  3433. large_volume,89,0.0015268747104942614,12
  3434. autoencoders,89,0.0015268747104942614,12
  3435. abusive_language,89,0.0015268747104942614,16
  3436. europe,89,0.0015268747104942614,6
  3437. acyclic,89,0.0015268747104942614,7
  3438. figurative_language,89,0.0015268747104942614,19
  3439. semeval_2014,88,0.0015097188148707303,12
  3440. persian,88,0.0015097188148707303,7
  3441. unexplored,88,0.0015097188148707303,10
  3442. pervasive,88,0.0015097188148707303,9
  3443. dedicated,88,0.0015097188148707303,9
  3444. tremendous,88,0.0015097188148707303,10
  3445. alors,88,0.0015097188148707303,5
  3446. same_data,88,0.0015097188148707303,9
  3447. preliminary_study,88,0.0015097188148707303,17
  3448. _score,88,0.0015097188148707303,6
  3449. poor_performance,88,0.0015097188148707303,16
  3450. friend,88,0.0015097188148707303,6
  3451. many_task,88,0.0015097188148707303,9
  3452. realisation,88,0.0015097188148707303,11
  3453. added,88,0.0015097188148707303,5
  3454. multiple_sentence,88,0.0015097188148707303,17
  3455. different_language_pair,88,0.0015097188148707303,23
  3456. lexeme,88,0.0015097188148707303,6
  3457. resource_rich,88,0.0015097188148707303,13
  3458. transparency,88,0.0015097188148707303,12
  3459. significant_margin,88,0.0015097188148707303,18
  3460. identified,88,0.0015097188148707303,10
  3461. caractristiques,88,0.0015097188148707303,15
  3462. liu,88,0.0015097188148707303,3
  3463. conduct,88,0.0015097188148707303,7
  3464. technological,88,0.0015097188148707303,13
  3465. non_autoregressive,88,0.0015097188148707303,18
  3466. read,87,0.0014925629192471992,4
  3467. regular_expression,87,0.0014925629192471992,18
  3468. stereotype,87,0.0014925629192471992,10
  3469. nlp_community,87,0.0014925629192471992,13
  3470. benchmark_datasets,87,0.0014925629192471992,18
  3471. chosen,87,0.0014925629192471992,6
  3472. biology,87,0.0014925629192471992,7
  3473. ngrams,87,0.0014925629192471992,6
  3474. xlnet,87,0.0014925629192471992,5
  3475. bit,87,0.0014925629192471992,3
  3476. english_hindi,87,0.0014925629192471992,13
  3477. single_task,87,0.0014925629192471992,11
  3478. well_established,87,0.0014925629192471992,16
  3479. all_words,87,0.0014925629192471992,9
  3480. meta,87,0.0014925629192471992,4
  3481. arc,87,0.0014925629192471992,3
  3482. automatic_post_editing,87,0.0014925629192471992,22
  3483. semantic_graph,87,0.0014925629192471992,14
  3484. new_way,87,0.0014925629192471992,7
  3485. telugu,87,0.0014925629192471992,6
  3486. regional,87,0.0014925629192471992,8
  3487. cross_validation,87,0.0014925629192471992,16
  3488. disadvantage,87,0.0014925629192471992,12
  3489. indonesian,87,0.0014925629192471992,10
  3490. couple,87,0.0014925629192471992,6
  3491. apprentissage,87,0.0014925629192471992,13
  3492. dcrit,86,0.0014754070236236683,5
  3493. egyptian,86,0.0014754070236236683,8
  3494. commentary,86,0.0014754070236236683,10
  3495. medline,86,0.0014754070236236683,7
  3496. trust,86,0.0014754070236236683,5
  3497. procedural,86,0.0014754070236236683,10
  3498. security,86,0.0014754070236236683,8
  3499. maximal,86,0.0014754070236236683,7
  3500. syntactic_relation,86,0.0014754070236236683,18
  3501. load,86,0.0014754070236236683,4
  3502. court,86,0.0014754070236236683,5
  3503. try,86,0.0014754070236236683,3
  3504. long_document,86,0.0014754070236236683,13
  3505. multidimensional,86,0.0014754070236236683,16
  3506. abstract_meaning,86,0.0014754070236236683,16
  3507. eye_tracking,86,0.0014754070236236683,12
  3508. multilingual_language_model,86,0.0014754070236236683,27
  3509. semantic_category,86,0.0014754070236236683,17
  3510. pattern_based,86,0.0014754070236236683,13
  3511. additional_data,86,0.0014754070236236683,15
  3512. end_to_end_model,86,0.0014754070236236683,16
  3513. random_forest,86,0.0014754070236236683,13
  3514. faire,86,0.0014754070236236683,5
  3515. valency,86,0.0014754070236236683,7
  3516. chinese_sentence,86,0.0014754070236236683,16
  3517. wiktionary,86,0.0014754070236236683,10
  3518. modal,86,0.0014754070236236683,5
  3519. layout,86,0.0014754070236236683,6
  3520. collected,86,0.0014754070236236683,9
  3521. standard_datasets,86,0.0014754070236236683,17
  3522. run_time,86,0.0014754070236236683,8
  3523. unconstrained,85,0.0014582511280001372,13
  3524. standalone,85,0.0014582511280001372,10
  3525. cqa,85,0.0014582511280001372,3
  3526. multilingual_setting,85,0.0014582511280001372,20
  3527. nuanced,85,0.0014582511280001372,7
  3528. explosion,85,0.0014582511280001372,9
  3529. analytical,85,0.0014582511280001372,10
  3530. crowd_sourced,85,0.0014582511280001372,13
  3531. constraint_based,85,0.0014582511280001372,16
  3532. new_state_of_the_art,85,0.0014582511280001372,20
  3533. ungrammatical,85,0.0014582511280001372,13
  3534. exact_match,85,0.0014582511280001372,11
  3535. indomain,85,0.0014582511280001372,8
  3536. stacked,85,0.0014582511280001372,7
  3537. learned_representation,85,0.0014582511280001372,22
  3538. additive,85,0.0014582511280001372,8
  3539. context_information,85,0.0014582511280001372,19
  3540. se_meval,85,0.0014582511280001372,8
  3541. english_wikipedia,85,0.0014582511280001372,17
  3542. first_study,85,0.0014582511280001372,11
  3543. recent_progress,85,0.0014582511280001372,15
  3544. influential,85,0.0014582511280001372,11
  3545. first_work,85,0.0014582511280001372,10
  3546. african,85,0.0014582511280001372,7
  3547. enterprise,85,0.0014582511280001372,10
  3548. nouvelle,85,0.0014582511280001372,8
  3549. adverbial,85,0.0014582511280001372,9
  3550. genia,85,0.0014582511280001372,5
  3551. d'annotation,84,0.0014410952323766061,12
  3552. anglais,84,0.0014410952323766061,7
  3553. aggregate,84,0.0014410952323766061,9
  3554. switchboard,84,0.0014410952323766061,11
  3555. pooling,84,0.0014410952323766061,7
  3556. medical_text,84,0.0014410952323766061,12
  3557. maximum_entropy_model,84,0.0014410952323766061,21
  3558. _and,84,0.0014410952323766061,4
  3559. emoji,84,0.0014410952323766061,5
  3560. high_resource_language,84,0.0014410952323766061,22
  3561. vocal,84,0.0014410952323766061,5
  3562. computational_method,84,0.0014410952323766061,20
  3563. anaphor,84,0.0014410952323766061,7
  3564. prague,84,0.0014410952323766061,6
  3565. authentic,84,0.0014410952323766061,9
  3566. transferable,84,0.0014410952323766061,12
  3567. sequence_tosequence,84,0.0014410952323766061,19
  3568. transformer_model,84,0.0014410952323766061,17
  3569. situated,84,0.0014410952323766061,8
  3570. reproducible,84,0.0014410952323766061,12
  3571. controversial,84,0.0014410952323766061,13
  3572. sigmorphon,84,0.0014410952323766061,10
  3573. various_method,84,0.0014410952323766061,14
  3574. inadequate,84,0.0014410952323766061,10
  3575. sur_le,84,0.0014410952323766061,6
  3576. consumption,84,0.0014410952323766061,11
  3577. final_system,84,0.0014410952323766061,12
  3578. united_state,84,0.0014410952323766061,12
  3579. inversion,84,0.0014410952323766061,9
  3580. recent_development,84,0.0014410952323766061,18
  3581. deep_learning_architecture,84,0.0014410952323766061,26
  3582. hand_crafted_feature,83,0.0014239393367530752,20
  3583. learnt,83,0.0014239393367530752,6
  3584. politics,83,0.0014239393367530752,8
  3585. variable_model,83,0.0014239393367530752,14
  3586. construire,83,0.0014239393367530752,10
  3587. fifth,83,0.0014239393367530752,5
  3588. tail,83,0.0014239393367530752,4
  3589. maximum_likelihood,83,0.0014239393367530752,18
  3590. abuse,83,0.0014239393367530752,5
  3591. nombre,83,0.0014239393367530752,6
  3592. random_field,83,0.0014239393367530752,12
  3593. describe,83,0.0014239393367530752,8
  3594. reply,83,0.0014239393367530752,5
  3595. vocabulary_size,83,0.0014239393367530752,15
  3596. priori,83,0.0014239393367530752,6
  3597. linear_regression,83,0.0014239393367530752,17
  3598. instructional,83,0.0014239393367530752,13
  3599. grammaire,83,0.0014239393367530752,9
  3600. linguistic_pattern,83,0.0014239393367530752,18
  3601. most_language,83,0.0014239393367530752,13
  3602. explanatory,83,0.0014239393367530752,11
  3603. late,83,0.0014239393367530752,4
  3604. unlabeled_text,83,0.0014239393367530752,14
  3605. vise,83,0.0014239393367530752,4
  3606. grouping,83,0.0014239393367530752,8
  3607. analyseur,83,0.0014239393367530752,9
  3608. tractable,83,0.0014239393367530752,9
  3609. utiliss,82,0.0014067834411295441,7
  3610. membership,82,0.0014067834411295441,10
  3611. factored,82,0.0014067834411295441,8
  3612. toxicity,82,0.0014067834411295441,8
  3613. nd,82,0.0014067834411295441,2
  3614. youtube,82,0.0014067834411295441,7
  3615. supervised_method,82,0.0014067834411295441,17
  3616. vote,82,0.0014067834411295441,4
  3617. valuable_resource,82,0.0014067834411295441,17
  3618. short_answer,82,0.0014067834411295441,12
  3619. textbook,82,0.0014067834411295441,8
  3620. arabic_text,82,0.0014067834411295441,11
  3621. interpreter,82,0.0014067834411295441,11
  3622. reduces,82,0.0014067834411295441,7
  3623. partition,82,0.0014067834411295441,9
  3624. goal_oriented,82,0.0014067834411295441,13
  3625. intractable,82,0.0014067834411295441,11
  3626. large_text,82,0.0014067834411295441,10
  3627. natural_language_description,82,0.0014067834411295441,28
  3628. continuous_space,82,0.0014067834411295441,16
  3629. main_idea,82,0.0014067834411295441,9
  3630. neural_text,82,0.0014067834411295441,11
  3631. homogeneous,82,0.0014067834411295441,11
  3632. wall_street_journal,82,0.0014067834411295441,19
  3633. lexical_similarity,82,0.0014067834411295441,18
  3634. predictive_model,82,0.0014067834411295441,16
  3635. later,82,0.0014067834411295441,5
  3636. proposed_system,82,0.0014067834411295441,15
  3637. deep_learning_approach,82,0.0014067834411295441,22
  3638. human_written,82,0.0014067834411295441,13
  3639. branch,82,0.0014067834411295441,6
  3640. sub_word,82,0.0014067834411295441,8
  3641. handful,82,0.0014067834411295441,7
  3642. cascaded,82,0.0014067834411295441,8
  3643. multi,82,0.0014067834411295441,5
  3644. rulebased,82,0.0014067834411295441,9
  3645. evaluate,81,0.0013896275455060132,8
  3646. interplay,81,0.0013896275455060132,9
  3647. template_based,81,0.0013896275455060132,14
  3648. cooperative,81,0.0013896275455060132,11
  3649. older,81,0.0013896275455060132,5
  3650. hospital,81,0.0013896275455060132,8
  3651. optimisation,81,0.0013896275455060132,12
  3652. telephone,81,0.0013896275455060132,9
  3653. siamese,81,0.0013896275455060132,7
  3654. factuality,81,0.0013896275455060132,10
  3655. feeling,81,0.0013896275455060132,7
  3656. ethical,81,0.0013896275455060132,7
  3657. omission,81,0.0013896275455060132,8
  3658. complex_sentence,81,0.0013896275455060132,16
  3659. computing,81,0.0013896275455060132,9
  3660. drift,81,0.0013896275455060132,5
  3661. forward,81,0.0013896275455060132,7
  3662. efficient_algorithm,81,0.0013896275455060132,19
  3663. english_translation,81,0.0013896275455060132,19
  3664. indigenous,81,0.0013896275455060132,10
  3665. specific_language,81,0.0013896275455060132,17
  3666. young,81,0.0013896275455060132,5
  3667. conversational_speech,81,0.0013896275455060132,21
  3668. co_reference,81,0.0013896275455060132,12
  3669. well_studied,81,0.0013896275455060132,12
  3670. inappropriate,81,0.0013896275455060132,13
  3671. free_word,81,0.0013896275455060132,9
  3672. recent_success,81,0.0013896275455060132,14
  3673. learns,81,0.0013896275455060132,6
  3674. kappa,81,0.0013896275455060132,5
  3675. embedded,81,0.0013896275455060132,8
  3676. explainability,81,0.0013896275455060132,14
  3677. experimental_study,80,0.0013724716498824821,18
  3678. multiclass,80,0.0013724716498824821,10
  3679. analyze,80,0.0013724716498824821,7
  3680. micro,80,0.0013724716498824821,5
  3681. adjunct,80,0.0013724716498824821,7
  3682. subspace,80,0.0013724716498824821,8
  3683. phrase_based_model,80,0.0013724716498824821,18
  3684. pre_trained_bert,80,0.0013724716498824821,16
  3685. consortium,80,0.0013724716498824821,10
  3686. wang,80,0.0013724716498824821,4
  3687. ressource,80,0.0013724716498824821,9
  3688. contextual_representation,80,0.0013724716498824821,25
  3689. parallel_training,80,0.0013724716498824821,17
  3690. state_ofthe_art_performance,80,0.0013724716498824821,27
  3691. s'emantique,80,0.0013724716498824821,11
  3692. heritage,80,0.0013724716498824821,8
  3693. xlm_roberta,80,0.0013724716498824821,11
  3694. l'approche,80,0.0013724716498824821,10
  3695. hoc,80,0.0013724716498824821,3
  3696. visual_question_answering,80,0.0013724716498824821,25
  3697. feature_rich,80,0.0013724716498824821,12
  3698. treat,80,0.0013724716498824821,5
  3699. valuons,80,0.0013724716498824821,7
  3700. ingredient,80,0.0013724716498824821,10
  3701. energy,80,0.0013724716498824821,6
  3702. word_net,80,0.0013724716498824821,8
  3703. well_defined,80,0.0013724716498824821,12
  3704. creative_common_attribution,80,0.0013724716498824821,27
  3705. preferred,80,0.0013724716498824821,9
  3706. misinformation,80,0.0013724716498824821,14
  3707. human_rating,80,0.0013724716498824821,12
  3708. reveal,80,0.0013724716498824821,6
  3709. inspiration,80,0.0013724716498824821,11
  3710. visualisation,79,0.001355315754258951,13
  3711. achievement,79,0.001355315754258951,11
  3712. significant_progress,79,0.001355315754258951,20
  3713. vast_amount,79,0.001355315754258951,11
  3714. low_resourced,79,0.001355315754258951,13
  3715. cross_lingual_information,79,0.001355315754258951,25
  3716. residual,79,0.001355315754258951,8
  3717. best_performing_system,79,0.001355315754258951,22
  3718. free_word_order,79,0.001355315754258951,15
  3719. donc,79,0.001355315754258951,4
  3720. favor,79,0.001355315754258951,5
  3721. discourse_structure,79,0.001355315754258951,19
  3722. state_of_the,79,0.001355315754258951,12
  3723. repetitive,79,0.001355315754258951,10
  3724. extensive_analysis,79,0.001355315754258951,18
  3725. merging,79,0.001355315754258951,7
  3726. native_language_identification,79,0.001355315754258951,30
  3727. reporting,79,0.001355315754258951,9
  3728. clip,79,0.001355315754258951,4
  3729. open_question,79,0.001355315754258951,13
  3730. automatic_acquisition,79,0.001355315754258951,21
  3731. round,79,0.001355315754258951,5
  3732. such_task,79,0.001355315754258951,9
  3733. prsent,79,0.001355315754258951,6
  3734. pdtb,79,0.001355315754258951,4
  3735. on_going,79,0.001355315754258951,8
  3736. permutation,79,0.001355315754258951,11
  3737. scaling,79,0.001355315754258951,7
  3738. penn_discourse,79,0.001355315754258951,14
  3739. absa,79,0.001355315754258951,4
  3740. perceived,79,0.001355315754258951,9
  3741. alphabet,79,0.001355315754258951,8
  3742. nouveau,79,0.001355315754258951,7
  3743. automatic_analysis,78,0.0013381598586354201,18
  3744. specific_feature,78,0.0013381598586354201,16
  3745. outline,78,0.0013381598586354201,7
  3746. target_language,78,0.0013381598586354201,15
  3747. sarcasm_detection,78,0.0013381598586354201,17
  3748. unexpected,78,0.0013381598586354201,10
  3749. lexico_syntactic,78,0.0013381598586354201,16
  3750. rewriting,78,0.0013381598586354201,9
  3751. um,78,0.0013381598586354201,2
  3752. reprsentations,78,0.0013381598586354201,14
  3753. learnable,78,0.0013381598586354201,9
  3754. supervised_training,78,0.0013381598586354201,19
  3755. fairness,78,0.0013381598586354201,8
  3756. various_aspect,78,0.0013381598586354201,14
  3757. tedious,78,0.0013381598586354201,7
  3758. wikidata,78,0.0013381598586354201,8
  3759. human_subject,78,0.0013381598586354201,13
  3760. transitive,78,0.0013381598586354201,10
  3761. significant_challenge,78,0.0013381598586354201,21
  3762. relative_error,78,0.0013381598586354201,14
  3763. edinburgh,78,0.0013381598586354201,9
  3764. quantitative_evaluation,78,0.0013381598586354201,23
  3765. attentional,78,0.0013381598586354201,11
  3766. contribute,78,0.0013381598586354201,10
  3767. fiction,78,0.0013381598586354201,7
  3768. linguistic_theory,78,0.0013381598586354201,17
  3769. cover,78,0.0013381598586354201,5
  3770. impressive_performance,77,0.001321003963011889,22
  3771. lexicalization,77,0.001321003963011889,14
  3772. real_user,77,0.001321003963011889,9
  3773. semeval_2013,77,0.001321003963011889,12
  3774. estonian,77,0.001321003963011889,8
  3775. adapter,77,0.001321003963011889,7
  3776. bigger,77,0.001321003963011889,6
  3777. official_evaluation,77,0.001321003963011889,19
  3778. quelques,77,0.001321003963011889,8
  3779. probing,77,0.001321003963011889,7
  3780. analytic,77,0.001321003963011889,8
  3781. multinomial,77,0.001321003963011889,11
  3782. sequenceto_sequence,77,0.001321003963011889,19
  3783. sen,77,0.001321003963011889,3
  3784. gru,77,0.001321003963011889,3
  3785. normalisation,77,0.001321003963011889,13
  3786. proceeding,77,0.001321003963011889,10
  3787. differential,77,0.001321003963011889,12
  3788. important_feature,77,0.001321003963011889,17
  3789. iso,77,0.001321003963011889,3
  3790. notation,77,0.001321003963011889,8
  3791. narrow,77,0.001321003963011889,6
  3792. other_feature,77,0.001321003963011889,13
  3793. retrieval_based,77,0.001321003963011889,15
  3794. nuance,77,0.001321003963011889,6
  3795. task_oriented_dialog,77,0.001321003963011889,20
  3796. computational_resource,77,0.001321003963011889,22
  3797. rich_morphology,77,0.001321003963011889,15
  3798. multilayer,77,0.001321003963011889,10
  3799. final_model,77,0.001321003963011889,11
  3800. expressiveness,77,0.001321003963011889,14
  3801. topological,77,0.001321003963011889,11
  3802. co_training,77,0.001321003963011889,11
  3803. interdisciplinary,77,0.001321003963011889,17
  3804. contradiction,77,0.001321003963011889,13
  3805. first_one,77,0.001321003963011889,9
  3806. several_type,77,0.001321003963011889,12
  3807. different_genre,77,0.001321003963011889,15
  3808. select,77,0.001321003963011889,6
  3809. standard_benchmark,77,0.001321003963011889,18
  3810. easy_to_use,77,0.001321003963011889,11
  3811. out_of_vocabulary_word,76,0.001303848067388358,22
  3812. department,76,0.001303848067388358,10
  3813. faithfulness,76,0.001303848067388358,12
  3814. subtrees,76,0.001303848067388358,8
  3815. rd,76,0.001303848067388358,2
  3816. pointwise,76,0.001303848067388358,9
  3817. adjustment,76,0.001303848067388358,10
  3818. utilisation,76,0.001303848067388358,11
  3819. cross_language_information,76,0.001303848067388358,26
  3820. cancer,76,0.001303848067388358,6
  3821. various_kind,76,0.001303848067388358,12
  3822. simultaneous_translation,76,0.001303848067388358,24
  3823. different_translation,76,0.001303848067388358,21
  3824. wmt14,76,0.001303848067388358,5
  3825. slu,76,0.001303848067388358,3
  3826. formalization,76,0.001303848067388358,13
  3827. consonant,76,0.001303848067388358,9
  3828. global_context,76,0.001303848067388358,14
  3829. previous_system,76,0.001303848067388358,15
  3830. national_corpus,76,0.001303848067388358,15
  3831. semeval_2010,76,0.001303848067388358,12
  3832. quadratic,76,0.001303848067388358,9
  3833. simple_model,76,0.001303848067388358,12
  3834. aggressive,76,0.001303848067388358,10
  3835. medication,76,0.001303848067388358,10
  3836. d'amliorer,76,0.001303848067388358,10
  3837. comprehensive_experiment,76,0.001303848067388358,24
  3838. encoder_decoder_model,76,0.001303848067388358,21
  3839. poem,76,0.001303848067388358,4
  3840. solver,76,0.001303848067388358,6
  3841. nlg_system,76,0.001303848067388358,10
  3842. weakly_supervised,76,0.001303848067388358,17
  3843. language_agnostic,76,0.001303848067388358,17
  3844. beam_search,76,0.001303848067388358,11
  3845. qualit,76,0.001303848067388358,6
  3846. appearance,76,0.001303848067388358,10
  3847. ebmt,76,0.001303848067388358,4
  3848. synonymous,76,0.001303848067388358,10
  3849. last_decade,76,0.001303848067388358,11
  3850. relaxation,76,0.001303848067388358,10
  3851. imperfect,76,0.001303848067388358,9
  3852. adapt,76,0.001303848067388358,5
  3853. inaccurate,76,0.001303848067388358,10
  3854. instantiation,76,0.001303848067388358,13
  3855. chinese_corpus,76,0.001303848067388358,14
  3856. fact_checking,76,0.001303848067388358,13
  3857. consecutive,76,0.001303848067388358,11
  3858. strong_result,76,0.001303848067388358,13
  3859. binary_classification_task,76,0.001303848067388358,26
  3860. determiner,76,0.001303848067388358,10
  3861. return,76,0.001303848067388358,6
  3862. standard_evaluation,76,0.001303848067388358,19
  3863. lr,76,0.001303848067388358,2
  3864. higher_performance,76,0.001303848067388358,18
  3865. marking,76,0.001303848067388358,7
  3866. grammatical_relation,76,0.001303848067388358,20
  3867. spearman,75,0.001286692171764827,8
  3868. une_analyse,75,0.001286692171764827,11
  3869. mood,75,0.001286692171764827,4
  3870. tac,75,0.001286692171764827,3
  3871. semantic_processing,75,0.001286692171764827,19
  3872. macro_averaged,75,0.001286692171764827,14
  3873. current_system,75,0.001286692171764827,14
  3874. primitive,75,0.001286692171764827,9
  3875. second_step,75,0.001286692171764827,11
  3876. route,75,0.001286692171764827,5
  3877. unbalanced,75,0.001286692171764827,10
  3878. applies,75,0.001286692171764827,7
  3879. gpu,75,0.001286692171764827,3
  3880. refined,75,0.001286692171764827,7
  3881. ed,75,0.001286692171764827,2
  3882. allows,75,0.001286692171764827,6
  3883. duc,75,0.001286692171764827,3
  3884. ape,75,0.001286692171764827,3
  3885. wmt19,75,0.001286692171764827,5
  3886. complex_question,75,0.001286692171764827,16
  3887. noisy_data,75,0.001286692171764827,10
  3888. online_review,75,0.001286692171764827,13
  3889. invariant,75,0.001286692171764827,9
  3890. most_work,75,0.001286692171764827,9
  3891. pronominal,75,0.001286692171764827,10
  3892. assertion,75,0.001286692171764827,9
  3893. canada,75,0.001286692171764827,6
  3894. example_based_machine_translation,75,0.001286692171764827,33
  3895. international_workshop,75,0.001286692171764827,22
  3896. particulirement,75,0.001286692171764827,15
  3897. suboptimal,75,0.001286692171764827,10
  3898. optimized,75,0.001286692171764827,9
  3899. gnration,75,0.001286692171764827,8
  3900. current_study,75,0.001286692171764827,13
  3901. historical_text,74,0.001269536276141296,15
  3902. lexical_sample_task,74,0.001269536276141296,19
  3903. apparent,74,0.001269536276141296,8
  3904. average_accuracy,74,0.001269536276141296,16
  3905. advent,74,0.001269536276141296,6
  3906. utilis,74,0.001269536276141296,6
  3907. suggested,74,0.001269536276141296,9
  3908. projective,74,0.001269536276141296,10
  3909. lexicographer,74,0.001269536276141296,13
  3910. loop,74,0.001269536276141296,4
  3911. speech_to_speech_translation,74,0.001269536276141296,28
  3912. contextualized_word,74,0.001269536276141296,19
  3913. acceptance,74,0.001269536276141296,10
  3914. surprisal,74,0.001269536276141296,9
  3915. related_word,74,0.001269536276141296,12
  3916. colloquial,74,0.001269536276141296,10
  3917. passive,74,0.001269536276141296,7
  3918. prepositional_phrase,74,0.001269536276141296,20
  3919. programme,74,0.001269536276141296,9
  3920. multilingual_word,74,0.001269536276141296,17
  3921. wat,74,0.001269536276141296,3
  3922. final_result,74,0.001269536276141296,12
  3923. d'informations,74,0.001269536276141296,14
  3924. same_meaning,74,0.001269536276141296,12
  3925. sketch,74,0.001269536276141296,6
  3926. noisy_channel,74,0.001269536276141296,13
  3927. zeroshot,74,0.001269536276141296,8
  3928. new_annotation,74,0.001269536276141296,14
  3929. context_based,74,0.001269536276141296,13
  3930. literary_text,74,0.001269536276141296,13
  3931. example_based_machine,74,0.001269536276141296,21
  3932. threat,74,0.001269536276141296,6
  3933. qa_system,74,0.001269536276141296,9
  3934. romance,74,0.001269536276141296,7
  3935. similar_performance,74,0.001269536276141296,19
  3936. good_quality,74,0.001269536276141296,12
  3937. state_of_the_art_accuracy,74,0.001269536276141296,25
  3938. retriever,74,0.001269536276141296,9
  3939. limited_data,74,0.001269536276141296,12
  3940. equation,74,0.001269536276141296,8
  3941. processor,74,0.001269536276141296,9
  3942. resumo,74,0.001269536276141296,6
  3943. c'est,74,0.001269536276141296,5
  3944. pause,74,0.001269536276141296,5
  3945. non_parallel,74,0.001269536276141296,12
  3946. formality,73,0.0012523803805177649,9
  3947. domaines,73,0.0012523803805177649,8
  3948. pedagogical,73,0.0012523803805177649,11
  3949. academia,73,0.0012523803805177649,8
  3950. user_interface,73,0.0012523803805177649,14
  3951. online_discussion,73,0.0012523803805177649,17
  3952. l'identification,73,0.0012523803805177649,16
  3953. benchmarking,73,0.0012523803805177649,12
  3954. multiple_datasets,73,0.0012523803805177649,17
  3955. inexpensive,73,0.0012523803805177649,11
  3956. english_speaker,73,0.0012523803805177649,15
  3957. encyclopedia,73,0.0012523803805177649,12
  3958. integral_part,73,0.0012523803805177649,13
  3959. expense,73,0.0012523803805177649,7
  3960. statistical_parsing,73,0.0012523803805177649,19
  3961. new_datasets,73,0.0012523803805177649,12
  3962. ensuite,73,0.0012523803805177649,7
  3963. violation,73,0.0012523803805177649,9
  3964. suicide,73,0.0012523803805177649,7
  3965. syntactic_category,73,0.0012523803805177649,18
  3966. predictive_power,73,0.0012523803805177649,16
  3967. propositional,73,0.0012523803805177649,13
  3968. same_domain,73,0.0012523803805177649,11
  3969. psycholinguistics,73,0.0012523803805177649,17
  3970. comprhension,73,0.0012523803805177649,12
  3971. overall_quality,73,0.0012523803805177649,15
  3972. outil,73,0.0012523803805177649,5
  3973. annotated_training_data,73,0.0012523803805177649,23
  3974. semantic_meaning,73,0.0012523803805177649,16
  3975. detailed_description,73,0.0012523803805177649,20
  3976. scientific_publication,73,0.0012523803805177649,22
  3977. societal,73,0.0012523803805177649,8
  3978. investment,73,0.0012523803805177649,10
  3979. high_dimensional,73,0.0012523803805177649,16
  3980. multiple_task,73,0.0012523803805177649,13
  3981. transformerbased,73,0.0012523803805177649,16
  3982. definite,73,0.0012523803805177649,8
  3983. deviation,73,0.0012523803805177649,9
  3984. el,73,0.0012523803805177649,2
  3985. gigaword,73,0.0012523803805177649,8
  3986. emergent,73,0.0012523803805177649,8
  3987. abstract_meaning_representation,73,0.0012523803805177649,31
  3988. semantic_level,73,0.0012523803805177649,14
  3989. non_parametric,73,0.0012523803805177649,14
  3990. l'annotation,73,0.0012523803805177649,12
  3991. naturalistic,72,0.001235224484894234,12
  3992. statistiques,72,0.001235224484894234,12
  3993. information_theoretic,72,0.001235224484894234,21
  3994. internal_structure,72,0.001235224484894234,18
  3995. nl,72,0.001235224484894234,2
  3996. n_gram_feature,72,0.001235224484894234,14
  3997. sanskrit,72,0.001235224484894234,8
  3998. rule_based_machine,72,0.001235224484894234,18
  3999. anger,72,0.001235224484894234,5
  4000. english_japanese,72,0.001235224484894234,16
  4001. semantic_classification,72,0.001235224484894234,23
  4002. optional,72,0.001235224484894234,8
  4003. syntactic_knowledge,72,0.001235224484894234,19
  4004. cognitive_science,72,0.001235224484894234,17
  4005. chinese_to_english_translation,72,0.001235224484894234,30
  4006. stateof_the_art_performance,72,0.001235224484894234,27
  4007. special_case,72,0.001235224484894234,12
  4008. ainsi_que,72,0.001235224484894234,9
  4009. hotel,72,0.001235224484894234,5
  4010. clinical_domain,72,0.001235224484894234,15
  4011. near,72,0.001235224484894234,4
  4012. travers,72,0.001235224484894234,7
  4013. clir,72,0.001235224484894234,4
  4014. boundary_detection,72,0.001235224484894234,18
  4015. key_role,72,0.001235224484894234,8
  4016. puis,72,0.001235224484894234,4
  4017. neural_sequence,72,0.001235224484894234,15
  4018. nonparametric,72,0.001235224484894234,13
  4019. user_friendly,72,0.001235224484894234,13
  4020. york,72,0.001235224484894234,4
  4021. new_york,72,0.001235224484894234,8
  4022. generalisation,72,0.001235224484894234,14
  4023. large_quantity,72,0.001235224484894234,14
  4024. such_approach,72,0.001235224484894234,13
  4025. masking,72,0.001235224484894234,7
  4026. partie,72,0.001235224484894234,6
  4027. predominant,72,0.001235224484894234,11
  4028. progressive,72,0.001235224484894234,11
  4029. dbpedia,72,0.001235224484894234,7
  4030. proliferation,72,0.001235224484894234,13
  4031. early_stage,72,0.001235224484894234,11
  4032. initial_experiment,72,0.001235224484894234,18
  4033. smm4h,72,0.001235224484894234,5
  4034. pro,72,0.001235224484894234,3
  4035. textual_description,72,0.001235224484894234,19
  4036. spoken_dialog_system,72,0.001235224484894234,20
  4037. xlm_r,72,0.001235224484894234,5
  4038. zero_shot_setting,72,0.001235224484894234,17
  4039. negative_example,71,0.0012180685892707029,16
  4040. transition_based_dependency,71,0.0012180685892707029,27
  4041. supplementary,71,0.0012180685892707029,13
  4042. variational_autoencoder,71,0.0012180685892707029,23
  4043. text_analysis,71,0.0012180685892707029,13
  4044. math,71,0.0012180685892707029,4
  4045. state_ofthe_art_result,71,0.0012180685892707029,22
  4046. associative,71,0.0012180685892707029,11
  4047. signature,71,0.0012180685892707029,9
  4048. k_means,71,0.0012180685892707029,7
  4049. dnn,71,0.0012180685892707029,3
  4050. surge,71,0.0012180685892707029,5
  4051. asymmetric,71,0.0012180685892707029,10
  4052. second_place,71,0.0012180685892707029,12
  4053. predictable,71,0.0012180685892707029,11
  4054. lexical_choice,71,0.0012180685892707029,14
  4055. local_feature,71,0.0012180685892707029,13
  4056. persuasive,71,0.0012180685892707029,10
  4057. wmt16,71,0.0012180685892707029,5
  4058. multilingual_translation,71,0.0012180685892707029,24
  4059. promising_performance,71,0.0012180685892707029,21
  4060. entits,71,0.0012180685892707029,6
  4061. elicitation,71,0.0012180685892707029,11
  4062. men,71,0.0012180685892707029,3
  4063. limited_training,71,0.0012180685892707029,16
  4064. human_robot,71,0.0012180685892707029,11
  4065. feed_forward,71,0.0012180685892707029,12
  4066. wordlevel,71,0.0012180685892707029,9
  4067. bilingual_lexicon_induction,71,0.0012180685892707029,27
  4068. different_machine,71,0.0012180685892707029,17
  4069. supervised_system,71,0.0012180685892707029,17
  4070. ilp,71,0.0012180685892707029,3
  4071. text_normalization,71,0.0012180685892707029,18
  4072. official_test,71,0.0012180685892707029,13
  4073. mix,71,0.0012180685892707029,3
  4074. shift_reduce,71,0.0012180685892707029,12
  4075. bilingual_data,71,0.0012180685892707029,14
  4076. descent,71,0.0012180685892707029,7
  4077. comparaison,71,0.0012180685892707029,11
  4078. anonymous,71,0.0012180685892707029,9
  4079. landscape,71,0.0012180685892707029,9
  4080. humorous,71,0.0012180685892707029,8
  4081. imitation,71,0.0012180685892707029,9
  4082. syntactic_representation,71,0.0012180685892707029,24
  4083. spell,71,0.0012180685892707029,5
  4084. manuellement,71,0.0012180685892707029,12
  4085. recommender,71,0.0012180685892707029,11
  4086. linguistic_research,71,0.0012180685892707029,19
  4087. suggest,71,0.0012180685892707029,7
  4088. state_of_theart_performance,71,0.0012180685892707029,27
  4089. rapid_development,71,0.0012180685892707029,17
  4090. multilingue,71,0.0012180685892707029,11
  4091. various_domain,71,0.0012180685892707029,14
  4092. second_approach,71,0.0012180685892707029,15
  4093. abstractive_summary,71,0.0012180685892707029,19
  4094. reusable,70,0.0012009126936471718,8
  4095. single_language,70,0.0012009126936471718,15
  4096. transition_based_parser,70,0.0012009126936471718,23
  4097. cooperation,70,0.0012009126936471718,11
  4098. automatic_approach,70,0.0012009126936471718,18
  4099. pre_existing,70,0.0012009126936471718,12
  4100. word_aligned,70,0.0012009126936471718,12
  4101. novel_algorithm,70,0.0012009126936471718,15
  4102. japan,70,0.0012009126936471718,5
  4103. multiple_choice_question,70,0.0012009126936471718,24
  4104. classroom,70,0.0012009126936471718,9
  4105. high_frequency,70,0.0012009126936471718,14
  4106. full_sentence,70,0.0012009126936471718,13
  4107. accordance,70,0.0012009126936471718,10
  4108. minimization,70,0.0012009126936471718,12
  4109. practical_use,70,0.0012009126936471718,13
  4110. justification,70,0.0012009126936471718,13
  4111. latent_representation,70,0.0012009126936471718,21
  4112. automatic_system,70,0.0012009126936471718,16
  4113. noun_compound,70,0.0012009126936471718,13
  4114. circumstance,70,0.0012009126936471718,12
  4115. crisis,70,0.0012009126936471718,6
  4116. tudions,70,0.0012009126936471718,7
  4117. digital_humanity,70,0.0012009126936471718,16
  4118. understandable,70,0.0012009126936471718,14
  4119. syntactical,70,0.0012009126936471718,11
  4120. ranker,70,0.0012009126936471718,6
  4121. past_work,70,0.0012009126936471718,9
  4122. low_cost,70,0.0012009126936471718,8
  4123. enfin,70,0.0012009126936471718,5
  4124. indo_european,70,0.0012009126936471718,13
  4125. bible,70,0.0012009126936471718,5
  4126. rule_based_method,70,0.0012009126936471718,17
  4127. comparons,70,0.0012009126936471718,9
  4128. pp,70,0.0012009126936471718,2
  4129. competitor,70,0.0012009126936471718,10
  4130. require,70,0.0012009126936471718,7
  4131. slavic,70,0.0012009126936471718,6
  4132. atis,70,0.0012009126936471718,4
  4133. code_mixing,70,0.0012009126936471718,11
  4134. joint_training,70,0.0012009126936471718,14
  4135. derived,70,0.0012009126936471718,7
  4136. nlp_pipeline,70,0.0012009126936471718,12
  4137. web_scale,70,0.0012009126936471718,9
  4138. gf,69,0.0011837567980236409,2
  4139. man,69,0.0011837567980236409,3
  4140. limited_number,69,0.0011837567980236409,14
  4141. unseen_word,69,0.0011837567980236409,11
  4142. distant_language,69,0.0011837567980236409,16
  4143. solid,69,0.0011837567980236409,5
  4144. data_to_text_generation,69,0.0011837567980236409,23
  4145. constitution,69,0.0011837567980236409,12
  4146. several_model,69,0.0011837567980236409,13
  4147. joint_inference,69,0.0011837567980236409,15
  4148. conversational_system,69,0.0011837567980236409,21
  4149. corpus_based_approach,69,0.0011837567980236409,21
  4150. impressive_result,69,0.0011837567980236409,17
  4151. fonde,69,0.0011837567980236409,5
  4152. dravidian_language,69,0.0011837567980236409,18
  4153. human_reference,69,0.0011837567980236409,15
  4154. semi_supervised_approach,69,0.0011837567980236409,24
  4155. lexical_simplification,69,0.0011837567980236409,22
  4156. natural_question,69,0.0011837567980236409,16
  4157. exemple,69,0.0011837567980236409,7
  4158. specialist,69,0.0011837567980236409,10
  4159. current_state_of_the_art,69,0.0011837567980236409,24
  4160. various_way,69,0.0011837567980236409,11
  4161. clinician,69,0.0011837567980236409,9
  4162. shortage,69,0.0011837567980236409,8
  4163. nous_prsentons_dans,69,0.0011837567980236409,19
  4164. real_data,69,0.0011837567980236409,9
  4165. disparate,69,0.0011837567980236409,9
  4166. vqa,69,0.0011837567980236409,3
  4167. unsupervised_system,69,0.0011837567980236409,19
  4168. first_experiment,69,0.0011837567980236409,16
  4169. considerable_improvement,69,0.0011837567980236409,24
  4170. safety,69,0.0011837567980236409,6
  4171. main_task,69,0.0011837567980236409,9
  4172. efficient_method,69,0.0011837567980236409,16
  4173. mise,69,0.0011837567980236409,4
  4174. rule_based_machine_translation,69,0.0011837567980236409,30
  4175. b.,69,0.0011837567980236409,2
  4176. utilises,68,0.0011666009024001098,8
  4177. summarizers,68,0.0011666009024001098,11
  4178. human_language_technology,68,0.0011666009024001098,25
  4179. semantic_vector,68,0.0011666009024001098,15
  4180. daily_life,68,0.0011666009024001098,10
  4181. rgles,68,0.0011666009024001098,5
  4182. text_only,68,0.0011666009024001098,9
  4183. wikipedia_article,68,0.0011666009024001098,17
  4184. ad_hoc,68,0.0011666009024001098,6
  4185. large_improvement,68,0.0011666009024001098,17
  4186. manual_effort,68,0.0011666009024001098,13
  4187. a.,68,0.0011666009024001098,2
  4188. plural,68,0.0011666009024001098,6
  4189. traditional_machine,68,0.0011666009024001098,19
  4190. rsum,68,0.0011666009024001098,4
  4191. hierarchical_model,68,0.0011666009024001098,18
  4192. interlingua,68,0.0011666009024001098,11
  4193. unigrams,68,0.0011666009024001098,8
  4194. week,68,0.0011666009024001098,4
  4195. amliorer,68,0.0011666009024001098,8
  4196. impairment,68,0.0011666009024001098,10
  4197. veracity,68,0.0011666009024001098,8
  4198. other_baseline,68,0.0011666009024001098,14
  4199. preprocessing_step,68,0.0011666009024001098,18
  4200. dozen,68,0.0011666009024001098,5
  4201. web_page,68,0.0011666009024001098,8
  4202. enriched,68,0.0011666009024001098,8
  4203. sub_optimal,68,0.0011666009024001098,11
  4204. para,68,0.0011666009024001098,4
  4205. human_generated,68,0.0011666009024001098,15
  4206. grapheme_to_phoneme,68,0.0011666009024001098,19
  4207. important_research,68,0.0011666009024001098,18
  4208. strong_correlation,68,0.0011666009024001098,18
  4209. en_de,68,0.0011666009024001098,5
  4210. lsa,68,0.0011666009024001098,3
  4211. unlabeled_corpus,68,0.0011666009024001098,16
  4212. germanenglish,68,0.0011666009024001098,13
  4213. north,68,0.0011666009024001098,5
  4214. more_language,68,0.0011666009024001098,13
  4215. abundance,68,0.0011666009024001098,9
  4216. d'autres,68,0.0011666009024001098,8
  4217. sd,68,0.0011666009024001098,2
  4218. dsambigusation,68,0.0011666009024001098,14
  4219. facial,68,0.0011666009024001098,6
  4220. absent,68,0.0011666009024001098,6
  4221. initial_result,68,0.0011666009024001098,14
  4222. versatile,68,0.0011666009024001098,9
  4223. phonemic,68,0.0011666009024001098,8
  4224. une_valuation,67,0.0011494450067765787,13
  4225. tight,67,0.0011494450067765787,5
  4226. implicit_discourse,67,0.0011494450067765787,18
  4227. footprint,67,0.0011494450067765787,9
  4228. semeval_2007,67,0.0011494450067765787,12
  4229. significant_performance_improvement,67,0.0011494450067765787,35
  4230. descriptor,67,0.0011494450067765787,10
  4231. vardial,67,0.0011494450067765787,7
  4232. chapter,67,0.0011494450067765787,7
  4233. different_part,67,0.0011494450067765787,14
  4234. lowest,67,0.0011494450067765787,6
  4235. studied,67,0.0011494450067765787,7
  4236. pubmed,67,0.0011494450067765787,6
  4237. multi_sentence,67,0.0011494450067765787,14
  4238. new_technique,67,0.0011494450067765787,13
  4239. persona,67,0.0011494450067765787,7
  4240. valuable_information,67,0.0011494450067765787,20
  4241. recursion,67,0.0011494450067765787,9
  4242. strongest,67,0.0011494450067765787,9
  4243. large_text_corpus,67,0.0011494450067765787,17
  4244. specific_information,67,0.0011494450067765787,20
  4245. instructor,67,0.0011494450067765787,10
  4246. neural_based,67,0.0011494450067765787,12
  4247. speech_translation,67,0.0011494450067765787,18
  4248. user_feedback,67,0.0011494450067765787,13
  4249. multiwoz,67,0.0011494450067765787,8
  4250. chemical,67,0.0011494450067765787,8
  4251. observable,67,0.0011494450067765787,10
  4252. l'information,67,0.0011494450067765787,13
  4253. deception,67,0.0011494450067765787,9
  4254. different_modality,67,0.0011494450067765787,18
  4255. align,67,0.0011494450067765787,5
  4256. spcifiques,67,0.0011494450067765787,10
  4257. reported,67,0.0011494450067765787,8
  4258. environmental,67,0.0011494450067765787,13
  4259. statistical_language_model,67,0.0011494450067765787,26
  4260. new_information,67,0.0011494450067765787,15
  4261. college,67,0.0011494450067765787,7
  4262. grande,66,0.0011322891111530478,6
  4263. outside,66,0.0011322891111530478,7
  4264. wmt20,66,0.0011322891111530478,5
  4265. two_level,66,0.0011322891111530478,9
  4266. linguistic_expression,66,0.0011322891111530478,21
  4267. previous_result,66,0.0011322891111530478,15
  4268. effet,66,0.0011322891111530478,5
  4269. office,66,0.0011322891111530478,6
  4270. hot,66,0.0011322891111530478,3
  4271. open_source_software,66,0.0011322891111530478,20
  4272. tracker,66,0.0011322891111530478,7
  4273. nous_valuons,66,0.0011322891111530478,12
  4274. url,66,0.0011322891111530478,3
  4275. worth,66,0.0011322891111530478,5
  4276. lstm_based,66,0.0011322891111530478,10
  4277. shortest,66,0.0011322891111530478,8
  4278. factoid_question,66,0.0011322891111530478,16
  4279. browser,66,0.0011322891111530478,7
  4280. division,66,0.0011322891111530478,8
  4281. various_approach,66,0.0011322891111530478,16
  4282. catalan,66,0.0011322891111530478,7
  4283. grce,66,0.0011322891111530478,4
  4284. potential_application,66,0.0011322891111530478,21
  4285. gaussian_mixture,66,0.0011322891111530478,16
  4286. structural_feature,66,0.0011322891111530478,18
  4287. interlingual,66,0.0011322891111530478,12
  4288. natural_language_interface,66,0.0011322891111530478,26
  4289. semantic_composition,66,0.0011322891111530478,20
  4290. supervised_machine_learning,66,0.0011322891111530478,27
  4291. common_approach,66,0.0011322891111530478,15
  4292. victim,66,0.0011322891111530478,6
  4293. latent_topic,66,0.0011322891111530478,12
  4294. song,66,0.0011322891111530478,4
  4295. intelligibility,66,0.0011322891111530478,15
  4296. ltag,66,0.0011322891111530478,4
  4297. manuscript,66,0.0011322891111530478,10
  4298. authorship_attribution,66,0.0011322891111530478,22
  4299. long_sentence,66,0.0011322891111530478,13
  4300. medical_record,66,0.0011322891111530478,14
  4301. fear,66,0.0011322891111530478,4
  4302. lens,66,0.0011322891111530478,4
  4303. nous_tudions,66,0.0011322891111530478,12
  4304. automatic_construction,66,0.0011322891111530478,22
  4305. giza++,66,0.0011322891111530478,6
  4306. public_health,66,0.0011322891111530478,13
  4307. discourse_representation,66,0.0011322891111530478,24
  4308. unstable,66,0.0011322891111530478,8
  4309. le_corpus,66,0.0011322891111530478,9
  4310. monolingual_model,66,0.0011322891111530478,17
  4311. neural_method,66,0.0011322891111530478,13
  4312. undesirable,66,0.0011322891111530478,11
  4313. optical,66,0.0011322891111530478,7
  4314. prospect,66,0.0011322891111530478,8
  4315. possible_solution,66,0.0011322891111530478,17
  4316. such_feature,66,0.0011322891111530478,12
  4317. fmeasure,66,0.0011322891111530478,8
  4318. contextualized_representation,66,0.0011322891111530478,29
  4319. unique_challenge,65,0.0011151332155295167,16
  4320. commonality,65,0.0011151332155295167,11
  4321. maximum_entropy_classifier,65,0.0011151332155295167,26
  4322. great_deal,65,0.0011151332155295167,10
  4323. parliament,65,0.0011151332155295167,10
  4324. agglutinative_language,65,0.0011151332155295167,22
  4325. same_topic,65,0.0011151332155295167,10
  4326. high_coverage,65,0.0011151332155295167,13
  4327. ligne,65,0.0011151332155295167,5
  4328. previous_state,65,0.0011151332155295167,14
  4329. dvelopp,65,0.0011151332155295167,7
  4330. rich_source,65,0.0011151332155295167,11
  4331. content_based,65,0.0011151332155295167,13
  4332. multidocument,65,0.0011151332155295167,13
  4333. press,65,0.0011151332155295167,5
  4334. much_work,65,0.0011151332155295167,9
  4335. automatic_word,65,0.0011151332155295167,14
  4336. qualitative_evaluation,65,0.0011151332155295167,22
  4337. customization,65,0.0011151332155295167,13
  4338. adjective_noun,65,0.0011151332155295167,14
  4339. open_domain_dialogue,65,0.0011151332155295167,20
  4340. developmental,65,0.0011151332155295167,13
  4341. exam,65,0.0011151332155295167,4
  4342. rational,65,0.0011151332155295167,8
  4343. pitfall,65,0.0011151332155295167,7
  4344. available_online,65,0.0011151332155295167,16
  4345. tabular,65,0.0011151332155295167,7
  4346. n'est,65,0.0011151332155295167,5
  4347. interact,65,0.0011151332155295167,8
  4348. labeled_training_data,65,0.0011151332155295167,21
  4349. continuation,65,0.0011151332155295167,12
  4350. personal_name,65,0.0011151332155295167,13
  4351. source_language,65,0.0011151332155295167,15
  4352. relative_clause,65,0.0011151332155295167,15
  4353. multi_head_attention,65,0.0011151332155295167,20
  4354. acronym,65,0.0011151332155295167,7
  4355. specified,65,0.0011151332155295167,9
  4356. contenu,65,0.0011151332155295167,7
  4357. optimum,65,0.0011151332155295167,7
  4358. intermediate_representation,65,0.0011151332155295167,27
  4359. complex_language,65,0.0011151332155295167,16
  4360. yahoo,65,0.0011151332155295167,5
  4361. ted_talk,65,0.0011151332155295167,8
  4362. various_level,65,0.0011151332155295167,13
  4363. global_information,65,0.0011151332155295167,18
  4364. different_setting,65,0.0011151332155295167,17
  4365. such_corpus,65,0.0011151332155295167,11
  4366. aspect_term,65,0.0011151332155295167,11
  4367. user_utterance,65,0.0011151332155295167,14
  4368. long_text,65,0.0011151332155295167,9
  4369. online_news,65,0.0011151332155295167,11
  4370. choix,65,0.0011151332155295167,5
  4371. zero_shot_learning,64,0.0010979773199059858,18
  4372. pre_trained_embeddings,64,0.0010979773199059858,22
  4373. automatic_recognition,64,0.0010979773199059858,21
  4374. fewer_parameter,64,0.0010979773199059858,15
  4375. bot,64,0.0010979773199059858,3
  4376. available_training,64,0.0010979773199059858,18
  4377. dissemination,64,0.0010979773199059858,13
  4378. qu'il,64,0.0010979773199059858,5
  4379. long_tail,64,0.0010979773199059858,9
  4380. distributional_representation,64,0.0010979773199059858,29
  4381. specific_type,64,0.0010979773199059858,13
  4382. vast_majority,64,0.0010979773199059858,13
  4383. cross_lingual_word_embeddings,64,0.0010979773199059858,29
  4384. hmms,64,0.0010979773199059858,4
  4385. important_factor,64,0.0010979773199059858,16
  4386. macro_f1,64,0.0010979773199059858,8
  4387. white,64,0.0010979773199059858,5
  4388. election,64,0.0010979773199059858,8
  4389. catastrophic,64,0.0010979773199059858,12
  4390. divergent,64,0.0010979773199059858,9
  4391. repair,64,0.0010979773199059858,6
  4392. polynomial_time,64,0.0010979773199059858,15
  4393. tree_adjoining,64,0.0010979773199059858,14
  4394. optical_character,64,0.0010979773199059858,17
  4395. volunteer,64,0.0010979773199059858,9
  4396. bpe,64,0.0010979773199059858,3
  4397. neural_system,64,0.0010979773199059858,13
  4398. phrase_based_smt_system,64,0.0010979773199059858,23
  4399. trick,64,0.0010979773199059858,5
  4400. standard_approach,64,0.0010979773199059858,17
  4401. compositional_semantics,64,0.0010979773199059858,23
  4402. joy,64,0.0010979773199059858,3
  4403. semi_supervised_method,64,0.0010979773199059858,22
  4404. inspection,64,0.0010979773199059858,10
  4405. utilisons,64,0.0010979773199059858,9
  4406. reformulation,64,0.0010979773199059858,13
  4407. nous_utilisons,64,0.0010979773199059858,14
  4408. impractical,64,0.0010979773199059858,11
  4409. human_user,64,0.0010979773199059858,10
  4410. permis,64,0.0010979773199059858,6
  4411. finance,64,0.0010979773199059858,7
  4412. sentiment_lexicon,64,0.0010979773199059858,17
  4413. lexico_semantic,64,0.0010979773199059858,15
  4414. concreteness,64,0.0010979773199059858,12
  4415. hateful,64,0.0010979773199059858,7
  4416. higher_correlation,64,0.0010979773199059858,18
  4417. freedom,64,0.0010979773199059858,7
  4418. adverse_drug,64,0.0010979773199059858,12
  4419. cws,64,0.0010979773199059858,3
  4420. resource_poor_language,64,0.0010979773199059858,22
  4421. contributes,64,0.0010979773199059858,11
  4422. dissimilar,64,0.0010979773199059858,10
  4423. sein,64,0.0010979773199059858,4
  4424. multilingual_text,64,0.0010979773199059858,17
  4425. cfg,64,0.0010979773199059858,3
  4426. different_technique,64,0.0010979773199059858,19
  4427. jeu,64,0.0010979773199059858,3
  4428. heart,64,0.0010979773199059858,5
  4429. relaxed,64,0.0010979773199059858,7
  4430. multi_dimensional,63,0.0010808214242824547,17
  4431. arithmetic,63,0.0010808214242824547,10
  4432. levenshtein,63,0.0010808214242824547,11
  4433. hierarchical_attention,63,0.0010808214242824547,22
  4434. conception,63,0.0010808214242824547,10
  4435. dictionnaire,63,0.0010808214242824547,12
  4436. variational_inference,63,0.0010808214242824547,21
  4437. feed,63,0.0010808214242824547,4
  4438. html,63,0.0010808214242824547,4
  4439. networking,63,0.0010808214242824547,10
  4440. grammatical_structure,63,0.0010808214242824547,21
  4441. common_practice,63,0.0010808214242824547,15
  4442. que_le,63,0.0010808214242824547,6
  4443. formal_language,63,0.0010808214242824547,15
  4444. john,63,0.0010808214242824547,4
  4445. montre,63,0.0010808214242824547,6
  4446. wealth,63,0.0010808214242824547,6
  4447. lyric,63,0.0010808214242824547,5
  4448. albert,63,0.0010808214242824547,6
  4449. customized,63,0.0010808214242824547,10
  4450. analogous,63,0.0010808214242824547,9
  4451. more_information,63,0.0010808214242824547,16
  4452. toolkits,63,0.0010808214242824547,8
  4453. empathy,63,0.0010808214242824547,7
  4454. many_study,63,0.0010808214242824547,10
  4455. successive,63,0.0010808214242824547,10
  4456. annotated_data,63,0.0010808214242824547,14
  4457. profiling,63,0.0010808214242824547,9
  4458. calibration,63,0.0010808214242824547,11
  4459. ontology_based,63,0.0010808214242824547,14
  4460. multi_step,63,0.0010808214242824547,10
  4461. genuine,63,0.0010808214242824547,7
  4462. hallucination,63,0.0010808214242824547,13
  4463. d'obtenir,63,0.0010808214242824547,9
  4464. opendomain,63,0.0010808214242824547,10
  4465. penn_discourse_treebank,63,0.0010808214242824547,23
  4466. indic,63,0.0010808214242824547,5
  4467. journalist,63,0.0010808214242824547,10
  4468. few_shot_setting,63,0.0010808214242824547,16
  4469. rbmt,63,0.0010808214242824547,4
  4470. best_translation,63,0.0010808214242824547,16
  4471. fall,63,0.0010808214242824547,4
  4472. machine_readable,63,0.0010808214242824547,16
  4473. contextualized_embeddings,63,0.0010808214242824547,25
  4474. campagne,63,0.0010808214242824547,8
  4475. senseval_2,63,0.0010808214242824547,10
  4476. encode,63,0.0010808214242824547,6
  4477. mail,63,0.0010808214242824547,4
  4478. detect,63,0.0010808214242824547,6
  4479. unlikely,63,0.0010808214242824547,8
  4480. meet,63,0.0010808214242824547,4
  4481. less_resourced,63,0.0010808214242824547,14
  4482. labeler,63,0.0010808214242824547,7
  4483. closed_track,63,0.0010808214242824547,12
  4484. disability,63,0.0010808214242824547,10
  4485. japanese_language,62,0.0010636655286589236,17
  4486. conditional_probability,62,0.0010636655286589236,23
  4487. neural_network_approach,62,0.0010636655286589236,23
  4488. fidelity,62,0.0010636655286589236,8
  4489. end_to_end_system,62,0.0010636655286589236,17
  4490. d'entits,62,0.0010636655286589236,8
  4491. different_combination,62,0.0010636655286589236,21
  4492. graphic,62,0.0010636655286589236,7
  4493. taxonomic,62,0.0010636655286589236,9
  4494. morphologique,62,0.0010636655286589236,13
  4495. adversarial_network,62,0.0010636655286589236,19
  4496. fever,62,0.0010636655286589236,5
  4497. peer,62,0.0010636655286589236,4
  4498. calcul,62,0.0010636655286589236,6
  4499. linear_classifier,62,0.0010636655286589236,17
  4500. text_to_sql,62,0.0010636655286589236,11
  4501. different_granularity,62,0.0010636655286589236,21
  4502. noisy_text,62,0.0010636655286589236,10
  4503. specialised,62,0.0010636655286589236,11
  4504. ptb,62,0.0010636655286589236,3
  4505. fscore,62,0.0010636655286589236,6
  4506. lexical_complexity,62,0.0010636655286589236,18
  4507. substring,62,0.0010636655286589236,9
  4508. vague,62,0.0010636655286589236,5
  4509. licence,62,0.0010636655286589236,7
  4510. longitudinal,62,0.0010636655286589236,12
  4511. turn_taking,62,0.0010636655286589236,11
  4512. healthy,62,0.0010636655286589236,7
  4513. taskspecific,62,0.0010636655286589236,12
  4514. uas,62,0.0010636655286589236,3
  4515. continual,62,0.0010636655286589236,9
  4516. imperative,62,0.0010636655286589236,10
  4517. vector_space,62,0.0010636655286589236,12
  4518. involvement,62,0.0010636655286589236,11
  4519. effective_feature,62,0.0010636655286589236,17
  4520. text_document,62,0.0010636655286589236,13
  4521. stateof_the_art_result,62,0.0010636655286589236,22
  4522. nlp_researcher,62,0.0010636655286589236,14
  4523. same_task,62,0.0010636655286589236,9
  4524. le_attention,62,0.0010636655286589236,12
  4525. exemplar,62,0.0010636655286589236,8
  4526. large_model,62,0.0010636655286589236,11
  4527. offense,62,0.0010636655286589236,7
  4528. fine_grained_entity,62,0.0010636655286589236,19
  4529. new_system,62,0.0010636655286589236,10
  4530. full_use,62,0.0010636655286589236,8
  4531. localisation,62,0.0010636655286589236,12
  4532. sadness,62,0.0010636655286589236,7
  4533. tree_structured,62,0.0010636655286589236,15
  4534. unseen_data,62,0.0010636655286589236,11
  4535. senseval_3,62,0.0010636655286589236,10
  4536. systematic_study,62,0.0010636655286589236,16
  4537. conventional_method,62,0.0010636655286589236,19
  4538. adversarial_learning,62,0.0010636655286589236,20
  4539. relative_error_reduction,62,0.0010636655286589236,24
  4540. end_user,62,0.0010636655286589236,8
  4541. paired,62,0.0010636655286589236,6
  4542. well,62,0.0010636655286589236,4
  4543. f1_measure,62,0.0010636655286589236,10
  4544. forgetting,62,0.0010636655286589236,10
  4545. unnecessary,62,0.0010636655286589236,11
  4546. multi_view,62,0.0010636655286589236,10
  4547. disponibles,61,0.0010465096330353927,11
  4548. illness,61,0.0010465096330353927,7
  4549. semantic_unit,61,0.0010465096330353927,13
  4550. correct_translation,61,0.0010465096330353927,19
  4551. differ,61,0.0010465096330353927,6
  4552. monolingual_text,61,0.0010465096330353927,16
  4553. noun_noun,61,0.0010465096330353927,9
  4554. cpu,61,0.0010465096330353927,3
  4555. open_problem,61,0.0010465096330353927,12
  4556. significant_amount,61,0.0010465096330353927,18
  4557. light_verb,61,0.0010465096330353927,10
  4558. infeasible,61,0.0010465096330353927,10
  4559. out_ofdomain,61,0.0010465096330353927,12
  4560. distributional_information,61,0.0010465096330353927,26
  4561. wild,61,0.0010465096330353927,4
  4562. someone,61,0.0010465096330353927,7
  4563. leurs,61,0.0010465096330353927,5
  4564. user_generated_text,61,0.0010465096330353927,19
  4565. deceptive,61,0.0010465096330353927,9
  4566. keyboard,61,0.0010465096330353927,8
  4567. second_language_learner,61,0.0010465096330353927,23
  4568. algorithme,61,0.0010465096330353927,10
  4569. advice,61,0.0010465096330353927,6
  4570. regardless,61,0.0010465096330353927,10
  4571. mesures,61,0.0010465096330353927,7
  4572. symmetric,61,0.0010465096330353927,9
  4573. described,61,0.0010465096330353927,9
  4574. cleaning,61,0.0010465096330353927,8
  4575. deft,61,0.0010465096330353927,4
  4576. raters,61,0.0010465096330353927,6
  4577. con,61,0.0010465096330353927,3
  4578. tree_adjoining_grammar,61,0.0010465096330353927,22
  4579. annot,61,0.0010465096330353927,5
  4580. framing,61,0.0010465096330353927,7
  4581. offensive_language_detection,61,0.0010465096330353927,28
  4582. state_of_theart_result,61,0.0010465096330353927,22
  4583. similarity_based,61,0.0010465096330353927,16
  4584. neural_word,61,0.0010465096330353927,11
  4585. final_submission,61,0.0010465096330353927,16
  4586. recognizers,61,0.0010465096330353927,11
  4587. disaster,61,0.0010465096330353927,8
  4588. automatiques,61,0.0010465096330353927,12
  4589. lexical_relation,61,0.0010465096330353927,16
  4590. annual,61,0.0010465096330353927,6
  4591. suffer,61,0.0010465096330353927,6
  4592. mert,61,0.0010465096330353927,4
  4593. optical_character_recognition,61,0.0010465096330353927,29
  4594. carlo,61,0.0010465096330353927,5
  4595. real_world_scenario,61,0.0010465096330353927,19
  4596. emoticon,61,0.0010465096330353927,8
  4597. l'tude,61,0.0010465096330353927,6
  4598. harm,61,0.0010465096330353927,4
  4599. such_knowledge,61,0.0010465096330353927,14
  4600. animal,61,0.0010465096330353927,6
  4601. certain_type,61,0.0010465096330353927,12
  4602. trace,61,0.0010465096330353927,5
  4603. scientific_document,61,0.0010465096330353927,19
  4604. documentlevel,61,0.0010465096330353927,13
  4605. anthology,61,0.0010465096330353927,9
  4606. updated,61,0.0010465096330353927,7
  4607. reranker,61,0.0010465096330353927,8
  4608. encyclopedic,61,0.0010465096330353927,12
  4609. interannotator,60,0.0010293537374118616,14
  4610. computational_linguist,60,0.0010293537374118616,22
  4611. driven,60,0.0010293537374118616,6
  4612. gibbs,60,0.0010293537374118616,5
  4613. overt,60,0.0010293537374118616,5
  4614. mobile_device,60,0.0010293537374118616,13
  4615. human_level,60,0.0010293537374118616,11
  4616. c.,60,0.0010293537374118616,2
  4617. mitigation,60,0.0010293537374118616,10
  4618. acoustic_feature,60,0.0010293537374118616,16
  4619. empty,60,0.0010293537374118616,5
  4620. different_meaning,60,0.0010293537374118616,17
  4621. model_agnostic,60,0.0010293537374118616,14
  4622. basic_idea,60,0.0010293537374118616,10
  4623. maxent,60,0.0010293537374118616,6
  4624. backward,60,0.0010293537374118616,8
  4625. different_text,60,0.0010293537374118616,14
  4626. best_accuracy,60,0.0010293537374118616,13
  4627. weaker,60,0.0010293537374118616,6
  4628. machine_generated,60,0.0010293537374118616,17
  4629. main_focus,60,0.0010293537374118616,10
  4630. opensource,60,0.0010293537374118616,10
  4631. adversary,60,0.0010293537374118616,9
  4632. long_range_dependency,60,0.0010293537374118616,21
  4633. cosine_similarity,60,0.0010293537374118616,17
  4634. positive_result,60,0.0010293537374118616,15
  4635. expressive_power,60,0.0010293537374118616,16
  4636. alternate,60,0.0010293537374118616,9
  4637. neighbour,60,0.0010293537374118616,9
  4638. large_scale_datasets,60,0.0010293537374118616,20
  4639. scientific_text,60,0.0010293537374118616,15
  4640. paradigmatic,60,0.0010293537374118616,12
  4641. light_weight,60,0.0010293537374118616,12
  4642. multiple_document,60,0.0010293537374118616,17
  4643. such_language,60,0.0010293537374118616,13
  4644. several_technique,60,0.0010293537374118616,17
  4645. thinking,60,0.0010293537374118616,8
  4646. small_training,60,0.0010293537374118616,14
  4647. pronoun_resolution,60,0.0010293537374118616,18
  4648. cross_language_information_retrieval,60,0.0010293537374118616,36
  4649. additional_training_data,60,0.0010293537374118616,24
  4650. physician,60,0.0010293537374118616,9
  4651. inflected_form,60,0.0010293537374118616,14
  4652. instant,60,0.0010293537374118616,7
  4653. ongoing_work,60,0.0010293537374118616,12
  4654. f1_scores,60,0.0010293537374118616,9
  4655. important_issue,60,0.0010293537374118616,15
  4656. unimodal,60,0.0010293537374118616,8
  4657. pbsmt,60,0.0010293537374118616,5
  4658. antonym,60,0.0010293537374118616,7
  4659. informational,60,0.0010293537374118616,13
  4660. subjective_evaluation,60,0.0010293537374118616,21
  4661. ibm_model,60,0.0010293537374118616,9
  4662. syntactic_complexity,60,0.0010293537374118616,20
  4663. promising_approach,60,0.0010293537374118616,18
  4664. pagerank,60,0.0010293537374118616,8
  4665. inquiry,60,0.0010293537374118616,7
  4666. offenseval,60,0.0010293537374118616,10
  4667. uk,60,0.0010293537374118616,2
  4668. subsequence,60,0.0010293537374118616,11
  4669. similar_result,59,0.0010121978417883305,14
  4670. pertinence,59,0.0010121978417883305,10
  4671. idiosyncratic,59,0.0010121978417883305,13
  4672. in_house,59,0.0010121978417883305,8
  4673. new_perspective,59,0.0010121978417883305,15
  4674. stop,59,0.0010121978417883305,4
  4675. various_model,59,0.0010121978417883305,13
  4676. misspelling,59,0.0010121978417883305,11
  4677. experimental_setting,59,0.0010121978417883305,20
  4678. web_interface,59,0.0010121978417883305,13
  4679. code_mixed_text,59,0.0010121978417883305,15
  4680. diver,59,0.0010121978417883305,5
  4681. better_model,59,0.0010121978417883305,12
  4682. completeness,59,0.0010121978417883305,12
  4683. unsupervised_machine,59,0.0010121978417883305,20
  4684. instrument,59,0.0010121978417883305,10
  4685. mtl,59,0.0010121978417883305,3
  4686. subtree,59,0.0010121978417883305,7
  4687. resource_rich_language,59,0.0010121978417883305,22
  4688. unchanged,59,0.0010121978417883305,9
  4689. restoration,59,0.0010121978417883305,11
  4690. cf,59,0.0010121978417883305,2
  4691. east,59,0.0010121978417883305,4
  4692. non_linguistic,59,0.0010121978417883305,14
  4693. urgent,59,0.0010121978417883305,6
  4694. fly,59,0.0010121978417883305,3
  4695. different_degree,59,0.0010121978417883305,16
  4696. official_result,59,0.0010121978417883305,15
  4697. new_insight,59,0.0010121978417883305,11
  4698. discourse_analysis,59,0.0010121978417883305,18
  4699. creativecommons.orglicensesby4.0,59,0.0010121978417883305,32
  4700. sr,59,0.0010121978417883305,2
  4701. proof_of_concept,59,0.0010121978417883305,16
  4702. theorem,59,0.0010121978417883305,7
  4703. icelandic,59,0.0010121978417883305,9
  4704. cross_sentence,59,0.0010121978417883305,14
  4705. grant,59,0.0010121978417883305,5
  4706. machine_translated,59,0.0010121978417883305,18
  4707. state_of_the_art_machine,59,0.0010121978417883305,24
  4708. embodied,59,0.0010121978417883305,8
  4709. slection,59,0.0010121978417883305,8
  4710. nothing,59,0.0010121978417883305,7
  4711. experimental_setup,59,0.0010121978417883305,18
  4712. inability,59,0.0010121978417883305,9
  4713. acyclic_graph,59,0.0010121978417883305,13
  4714. submitted_system,59,0.0010121978417883305,16
  4715. ineffective,59,0.0010121978417883305,11
  4716. inferred,59,0.0010121978417883305,8
  4717. several_task,59,0.0010121978417883305,12
  4718. proprits,59,0.0010121978417883305,8
  4719. elegant,59,0.0010121978417883305,7
  4720. transductive,59,0.0010121978417883305,12
  4721. priority,59,0.0010121978417883305,8
  4722. radiology,59,0.0010121978417883305,9
  4723. topic_based,58,0.0009950419461647996,11
  4724. syntactic_property,58,0.0009950419461647996,18
  4725. novice,58,0.0009950419461647996,6
  4726. unified_model,58,0.0009950419461647996,13
  4727. multi_stage,58,0.0009950419461647996,11
  4728. slang,58,0.0009950419461647996,5
  4729. lexical_level,58,0.0009950419461647996,13
  4730. standard_test,58,0.0009950419461647996,13
  4731. combinaison,58,0.0009950419461647996,11
  4732. disjoint,58,0.0009950419461647996,8
  4733. non_english_language,58,0.0009950419461647996,20
  4734. syntactic_construction,58,0.0009950419461647996,22
  4735. content_word,58,0.0009950419461647996,12
  4736. comprehensive_evaluation,58,0.0009950419461647996,24
  4737. implicit_discourse_relation,58,0.0009950419461647996,27
  4738. gnralement,58,0.0009950419461647996,10
  4739. computational_analysis,58,0.0009950419461647996,22
  4740. past_decade,58,0.0009950419461647996,11
  4741. relative_importance,58,0.0009950419461647996,19
  4742. outstanding,58,0.0009950419461647996,11
  4743. monte,58,0.0009950419461647996,5
  4744. top_performing,58,0.0009950419461647996,14
  4745. understand,58,0.0009950419461647996,10
  4746. nous_comparons,58,0.0009950419461647996,14
  4747. linear_chain,58,0.0009950419461647996,12
  4748. key_feature,58,0.0009950419461647996,11
  4749. japanese_to_english,58,0.0009950419461647996,19
  4750. several_way,58,0.0009950419461647996,11
  4751. topology,58,0.0009950419461647996,8
  4752. taiwanese,58,0.0009950419461647996,9
  4753. scalar,58,0.0009950419461647996,6
  4754. neural_translation,58,0.0009950419461647996,18
  4755. ici,58,0.0009950419461647996,3
  4756. le_traitement,58,0.0009950419461647996,13
  4757. subwords,58,0.0009950419461647996,8
  4758. mr,58,0.0009950419461647996,2
  4759. human_assessment,58,0.0009950419461647996,16
  4760. linguistically_motivated,58,0.0009950419461647996,24
  4761. human_intervention,58,0.0009950419461647996,18
  4762. politician,58,0.0009950419461647996,10
  4763. authoring,58,0.0009950419461647996,9
  4764. constructed,58,0.0009950419461647996,11
  4765. click,58,0.0009950419461647996,5
  4766. rewrite,58,0.0009950419461647996,7
  4767. hyperparameter,58,0.0009950419461647996,14
  4768. generated_summary,58,0.0009950419461647996,17
  4769. aspect_level,58,0.0009950419461647996,12
  4770. different_set,58,0.0009950419461647996,13
  4771. unsupervised_fashion,58,0.0009950419461647996,20
  4772. cible,58,0.0009950419461647996,5
  4773. text_similarity,58,0.0009950419461647996,15
  4774. terme,58,0.0009950419461647996,5
  4775. long_standing,58,0.0009950419461647996,13
  4776. shallow_parsing,58,0.0009950419461647996,15
  4777. superficial,58,0.0009950419461647996,11
  4778. semantic_task,58,0.0009950419461647996,13
  4779. rseau,58,0.0009950419461647996,5
  4780. different_annotation,58,0.0009950419461647996,20
  4781. small_subset,58,0.0009950419461647996,12
  4782. span_based,58,0.0009950419461647996,10
  4783. aggression,58,0.0009950419461647996,10
  4784. interpersonal,58,0.0009950419461647996,13
  4785. geometry,58,0.0009950419461647996,8
  4786. lie,58,0.0009950419461647996,3
  4787. arabe,58,0.0009950419461647996,5
  4788. wisdom,58,0.0009950419461647996,6
  4789. simple_baseline,58,0.0009950419461647996,15
  4790. babelnet,58,0.0009950419461647996,8
  4791. similar_task,58,0.0009950419461647996,12
  4792. postediting,58,0.0009950419461647996,11
  4793. next_step,58,0.0009950419461647996,9
  4794. speech_to_text,57,0.0009778860505412685,14
  4795. lexicography,57,0.0009778860505412685,12
  4796. sub,57,0.0009778860505412685,3
  4797. human_evaluator,57,0.0009778860505412685,15
  4798. soit,57,0.0009778860505412685,4
  4799. diacritic,57,0.0009778860505412685,9
  4800. macro_f1_score,57,0.0009778860505412685,14
  4801. semeval_2015_task,57,0.0009778860505412685,17
  4802. datadriven,57,0.0009778860505412685,10
  4803. textual_inference,57,0.0009778860505412685,17
  4804. efficient_way,57,0.0009778860505412685,13
  4805. boosting,57,0.0009778860505412685,8
  4806. theoretic,57,0.0009778860505412685,9
  4807. same_entity,57,0.0009778860505412685,11
  4808. utilisant_de,57,0.0009778860505412685,12
  4809. unsupervised_domain_adaptation,57,0.0009778860505412685,30
  4810. unsupervised_domain,57,0.0009778860505412685,19
  4811. stateof_the_art_method,57,0.0009778860505412685,22
  4812. certainty,57,0.0009778860505412685,9
  4813. opinionated,57,0.0009778860505412685,11
  4814. graded,57,0.0009778860505412685,6
  4815. collins,57,0.0009778860505412685,7
  4816. noticeable,57,0.0009778860505412685,10
  4817. several_machine,57,0.0009778860505412685,15
  4818. better_accuracy,57,0.0009778860505412685,15
  4819. annotated_datasets,57,0.0009778860505412685,18
  4820. placement,57,0.0009778860505412685,9
  4821. different_evaluation,57,0.0009778860505412685,20
  4822. limited_training_data,57,0.0009778860505412685,21
  4823. natural_language_query,57,0.0009778860505412685,22
  4824. credibility,57,0.0009778860505412685,11
  4825. long_time,57,0.0009778860505412685,9
  4826. pivot_language,57,0.0009778860505412685,14
  4827. collocational,57,0.0009778860505412685,13
  4828. modlisation,57,0.0009778860505412685,11
  4829. chineseenglish,57,0.0009778860505412685,14
  4830. discours,57,0.0009778860505412685,8
  4831. hidden_layer,57,0.0009778860505412685,12
  4832. authority,57,0.0009778860505412685,9
  4833. modularity,57,0.0009778860505412685,10
  4834. same_word,57,0.0009778860505412685,9
  4835. linkage,57,0.0009778860505412685,7
  4836. highest_accuracy,57,0.0009778860505412685,16
  4837. less_resourced_language,57,0.0009778860505412685,23
  4838. moderation,57,0.0009778860505412685,10
  4839. supervised_classification,57,0.0009778860505412685,25
  4840. cohesive,57,0.0009778860505412685,8
  4841. speculation,57,0.0009778860505412685,11
  4842. fois,57,0.0009778860505412685,4
  4843. semantic_lexicon,57,0.0009778860505412685,16
  4844. higher_precision,57,0.0009778860505412685,16
  4845. ready,57,0.0009778860505412685,5
  4846. l'anglais,57,0.0009778860505412685,9
  4847. class_based,57,0.0009778860505412685,11
  4848. linguistic_unit,57,0.0009778860505412685,15
  4849. esl,57,0.0009778860505412685,3
  4850. naturel,57,0.0009778860505412685,7
  4851. joint_modeling,57,0.0009778860505412685,14
  4852. taux,56,0.0009607301549177375,4
  4853. multiple_level,56,0.0009607301549177375,14
  4854. irish,56,0.0009607301549177375,5
  4855. automated_system,56,0.0009607301549177375,16
  4856. reciprocal,56,0.0009607301549177375,10
  4857. multiparty,56,0.0009607301549177375,10
  4858. closest,56,0.0009607301549177375,7
  4859. positive_impact,56,0.0009607301549177375,15
  4860. grading,56,0.0009607301549177375,7
  4861. importante,56,0.0009607301549177375,10
  4862. technical_term,56,0.0009607301549177375,14
  4863. alignment_model,56,0.0009607301549177375,15
  4864. consuming,56,0.0009607301549177375,9
  4865. clarity,56,0.0009607301549177375,7
  4866. corporate,56,0.0009607301549177375,9
  4867. baseline_model,56,0.0009607301549177375,14
  4868. great_potential,56,0.0009607301549177375,15
  4869. reinforcement_learning,56,0.0009607301549177375,22
  4870. strategic,56,0.0009607301549177375,9
  4871. contour,56,0.0009607301549177375,7
  4872. detected,56,0.0009607301549177375,8
  4873. follow_up,56,0.0009607301549177375,9
  4874. user_query,56,0.0009607301549177375,10
  4875. geolocation,56,0.0009607301549177375,11
  4876. eleven,56,0.0009607301549177375,6
  4877. directional,56,0.0009607301549177375,11
  4878. bilingual_word_embeddings,56,0.0009607301549177375,25
  4879. transitivity,56,0.0009607301549177375,12
  4880. new_sentence,56,0.0009607301549177375,12
  4881. vertex,56,0.0009607301549177375,6
  4882. generated_question,56,0.0009607301549177375,18
  4883. emotional_state,56,0.0009607301549177375,15
  4884. neural_sequence_to_sequence,56,0.0009607301549177375,27
  4885. effective_use,56,0.0009607301549177375,13
  4886. tels,56,0.0009607301549177375,4
  4887. snli,56,0.0009607301549177375,4
  4888. statistical_technique,56,0.0009607301549177375,21
  4889. browsing,56,0.0009607301549177375,8
  4890. interoperable,56,0.0009607301549177375,13
  4891. user_satisfaction,56,0.0009607301549177375,17
  4892. regulation,56,0.0009607301549177375,10
  4893. first_model,56,0.0009607301549177375,11
  4894. available_dataset,56,0.0009607301549177375,17
  4895. continuous_speech,56,0.0009607301549177375,17
  4896. calculus,56,0.0009607301549177375,8
  4897. main_feature,56,0.0009607301549177375,12
  4898. nontrivial,56,0.0009607301549177375,10
  4899. svm_based,56,0.0009607301549177375,9
  4900. german_language,56,0.0009607301549177375,15
  4901. et_al,56,0.0009607301549177375,5
  4902. generated_sentence,56,0.0009607301549177375,18
  4903. formal_semantics,56,0.0009607301549177375,16
  4904. sociolinguistic,56,0.0009607301549177375,15
  4905. human_computer_interaction,56,0.0009607301549177375,26
  4906. original_model,56,0.0009607301549177375,14
  4907. new_training,56,0.0009607301549177375,12
  4908. high_recall,56,0.0009607301549177375,11
  4909. electronic_dictionary,56,0.0009607301549177375,21
  4910. several_study,56,0.0009607301549177375,13
  4911. marathi,56,0.0009607301549177375,7
  4912. kong,56,0.0009607301549177375,4
  4913. longest,56,0.0009607301549177375,7
  4914. parallelism,56,0.0009607301549177375,11
  4915. crf_based,56,0.0009607301549177375,9
  4916. ordinal,56,0.0009607301549177375,7
  4917. este,56,0.0009607301549177375,4
  4918. d'autre,56,0.0009607301549177375,7
  4919. biggest,56,0.0009607301549177375,7
  4920. serbian,56,0.0009607301549177375,7
  4921. word_sense,55,0.0009435742592942064,10
  4922. contributor,55,0.0009435742592942064,11
  4923. high_cost,55,0.0009435742592942064,9
  4924. crowd_sourcing,55,0.0009435742592942064,14
  4925. hit,55,0.0009435742592942064,3
  4926. lingual,55,0.0009435742592942064,7
  4927. sub_sentential,55,0.0009435742592942064,14
  4928. avoir,55,0.0009435742592942064,5
  4929. natural_language_task,55,0.0009435742592942064,21
  4930. asymmetry,55,0.0009435742592942064,9
  4931. certains,55,0.0009435742592942064,8
  4932. advertisement,55,0.0009435742592942064,13
  4933. red,55,0.0009435742592942064,3
  4934. log_likelihood,55,0.0009435742592942064,14
  4935. languageindependent,55,0.0009435742592942064,19
  4936. new_research,55,0.0009435742592942064,12
  4937. adaptability,55,0.0009435742592942064,12
  4938. expressivity,55,0.0009435742592942064,12
  4939. dominance,55,0.0009435742592942064,9
  4940. optimality,55,0.0009435742592942064,10
  4941. hong,55,0.0009435742592942064,4
  4942. rnn_based,55,0.0009435742592942064,9
  4943. hint,55,0.0009435742592942064,4
  4944. van,55,0.0009435742592942064,3
  4945. reach,55,0.0009435742592942064,5
  4946. bilingual_parallel,55,0.0009435742592942064,18
  4947. interference,55,0.0009435742592942064,12
  4948. peculiarity,55,0.0009435742592942064,11
  4949. first_language,55,0.0009435742592942064,14
  4950. compute,55,0.0009435742592942064,7
  4951. linguistic_rule,55,0.0009435742592942064,15
  4952. tat,55,0.0009435742592942064,3
  4953. quantization,55,0.0009435742592942064,12
  4954. papier,55,0.0009435742592942064,6
  4955. indo_european_language,55,0.0009435742592942064,22
  4956. syntactic_constraint,55,0.0009435742592942064,20
  4957. pipelined,55,0.0009435742592942064,9
  4958. query_expansion,55,0.0009435742592942064,15
  4959. moyen,55,0.0009435742592942064,5
  4960. non_projective_dependency,55,0.0009435742592942064,25
  4961. general_approach,55,0.0009435742592942064,16
  4962. open_source_toolkit,55,0.0009435742592942064,19
  4963. drawn,55,0.0009435742592942064,5
  4964. continuum,55,0.0009435742592942064,9
  4965. random_walk,55,0.0009435742592942064,11
  4966. mlm,55,0.0009435742592942064,3
  4967. favorable,55,0.0009435742592942064,9
  4968. graph_based_approach,55,0.0009435742592942064,20
  4969. overall_system,55,0.0009435742592942064,14
  4970. recent_effort,55,0.0009435742592942064,13
  4971. hardware,55,0.0009435742592942064,8
  4972. earlier_work,55,0.0009435742592942064,12
  4973. neuron,55,0.0009435742592942064,6
  4974. applique,55,0.0009435742592942064,8
  4975. different_category,55,0.0009435742592942064,18
  4976. single_system,55,0.0009435742592942064,13
  4977. short_paper,55,0.0009435742592942064,11
  4978. genetic_algorithm,55,0.0009435742592942064,17
  4979. laptop,55,0.0009435742592942064,6
  4980. empirical_comparison,55,0.0009435742592942064,20
  4981. whole_sentence,55,0.0009435742592942064,14
  4982. kernel_based,55,0.0009435742592942064,12
  4983. subgraph,55,0.0009435742592942064,8
  4984. viz,55,0.0009435742592942064,3
  4985. relevant_sentence,55,0.0009435742592942064,17
  4986. inferior,55,0.0009435742592942064,8
  4987. reinflection,55,0.0009435742592942064,12
  4988. user_experience,55,0.0009435742592942064,15
  4989. multilabel,55,0.0009435742592942064,10
  4990. evident,55,0.0009435742592942064,7
  4991. web_document,55,0.0009435742592942064,12
  4992. menes,55,0.0009435742592942064,5
  4993. grammatical_function,55,0.0009435742592942064,20
  4994. driver,55,0.0009435742592942064,6
  4995. negligible,55,0.0009435742592942064,10
  4996. state_of_the_art_parser,55,0.0009435742592942064,23
  4997. extraire,55,0.0009435742592942064,8
  4998. dictionary_definition,55,0.0009435742592942064,21
  4999. first_method,55,0.0009435742592942064,12
  5000. free_form,54,0.0009264183636706754,9
  5001. philosophy,54,0.0009264183636706754,10
  5002. morphological_complexity,54,0.0009264183636706754,24
  5003. original_document,54,0.0009264183636706754,17
  5004. btec,54,0.0009264183636706754,4
  5005. darpa,54,0.0009264183636706754,5
  5006. dst,54,0.0009264183636706754,3
  5007. evolutionary,54,0.0009264183636706754,12
  5008. well_suited,54,0.0009264183636706754,11
  5009. polysemous_word,54,0.0009264183636706754,15
  5010. economy,54,0.0009264183636706754,7
  5011. persuasion,54,0.0009264183636706754,10
  5012. vector_based,54,0.0009264183636706754,12
  5013. angle,54,0.0009264183636706754,5
  5014. employ,54,0.0009264183636706754,6
  5015. d'autre_part,54,0.0009264183636706754,12
  5016. back,54,0.0009264183636706754,4
  5017. slower,54,0.0009264183636706754,6
  5018. essence,54,0.0009264183636706754,7
  5019. pe,54,0.0009264183636706754,2
  5020. spatial_relation,54,0.0009264183636706754,16
  5021. tutoring,54,0.0009264183636706754,8
  5022. automatic_processing,54,0.0009264183636706754,20
  5023. western,54,0.0009264183636706754,7
  5024. proper_noun,54,0.0009264183636706754,11
  5025. several_benchmark,54,0.0009264183636706754,17
  5026. phylogenetic,54,0.0009264183636706754,12
  5027. moins,54,0.0009264183636706754,5
  5028. unsegmented,54,0.0009264183636706754,11
  5029. uma,54,0.0009264183636706754,3
  5030. fine_grained_sentiment,54,0.0009264183636706754,22
  5031. preferable,54,0.0009264183636706754,10
  5032. semantic_evaluation,54,0.0009264183636706754,19
  5033. various_application,54,0.0009264183636706754,19
  5034. disparity,54,0.0009264183636706754,9
  5035. gradient_based,54,0.0009264183636706754,14
  5036. wordnet_based,54,0.0009264183636706754,13
  5037. manning,54,0.0009264183636706754,7
  5038. rescoring,54,0.0009264183636706754,9
  5039. unbiased,54,0.0009264183636706754,8
  5040. defense,54,0.0009264183636706754,7
  5041. tous,54,0.0009264183636706754,4
  5042. vu,54,0.0009264183636706754,2
  5043. analogical,54,0.0009264183636706754,10
  5044. such_text,54,0.0009264183636706754,9
  5045. connectivity,54,0.0009264183636706754,12
  5046. such_case,54,0.0009264183636706754,9
  5047. lexical_ambiguity,54,0.0009264183636706754,17
  5048. *_*,54,0.0009264183636706754,3
  5049. social_medium_user,54,0.0009264183636706754,18
  5050. final_output,54,0.0009264183636706754,12
  5051. domain_specific_corpus,54,0.0009264183636706754,22
  5052. chen,54,0.0009264183636706754,4
  5053. manual_analysis,54,0.0009264183636706754,15
  5054. significant_increase,54,0.0009264183636706754,20
  5055. tend,54,0.0009264183636706754,4
  5056. important_word,54,0.0009264183636706754,14
  5057. raw_corpus,54,0.0009264183636706754,10
  5058. different_perspective,54,0.0009264183636706754,21
  5059. affinity,54,0.0009264183636706754,8
  5060. conceptnet,54,0.0009264183636706754,10
  5061. rsolution,54,0.0009264183636706754,9
  5062. deep_model,54,0.0009264183636706754,10
  5063. large_training,54,0.0009264183636706754,14
  5064. pertinent,53,0.0009092624680471444,9
  5065. intra_sentential,53,0.0009092624680471444,16
  5066. nonlinear,53,0.0009092624680471444,9
  5067. labor_intensive,53,0.0009092624680471444,15
  5068. situational,53,0.0009092624680471444,11
  5069. unbounded,53,0.0009092624680471444,9
  5070. translational,53,0.0009092624680471444,13
  5071. efficace,53,0.0009092624680471444,8
  5072. bipartite,53,0.0009092624680471444,9
  5073. unsatisfactory,53,0.0009092624680471444,14
  5074. patron,53,0.0009092624680471444,6
  5075. key_factor,53,0.0009092624680471444,10
  5076. numeric,53,0.0009092624680471444,7
  5077. ralisation,53,0.0009092624680471444,10
  5078. autres,53,0.0009092624680471444,6
  5079. hierarchical_clustering,53,0.0009092624680471444,23
  5080. autre,53,0.0009092624680471444,5
  5081. wide_web,53,0.0009092624680471444,8
  5082. logistic_regression_model,53,0.0009092624680471444,25
  5083. structuring,53,0.0009092624680471444,11
  5084. german_text,53,0.0009092624680471444,11
  5085. alexa,53,0.0009092624680471444,5
  5086. telles,53,0.0009092624680471444,6
  5087. learned_model,53,0.0009092624680471444,13
  5088. international_license,53,0.0009092624680471444,21
  5089. syntactic_parse,53,0.0009092624680471444,15
  5090. prose,53,0.0009092624680471444,5
  5091. draft,53,0.0009092624680471444,5
  5092. happy,53,0.0009092624680471444,5
  5093. yelp,53,0.0009092624680471444,4
  5094. sign_language,53,0.0009092624680471444,13
  5095. selfattention,53,0.0009092624680471444,13
  5096. glossary,53,0.0009092624680471444,8
  5097. new_set,53,0.0009092624680471444,7
  5098. s'appuie,53,0.0009092624680471444,8
  5099. traiter,53,0.0009092624680471444,7
  5100. elaborate,53,0.0009092624680471444,9
  5101. plm,53,0.0009092624680471444,3
  5102. preliminary_analysis,53,0.0009092624680471444,20
  5103. apple,53,0.0009092624680471444,5
  5104. weather,53,0.0009092624680471444,7
  5105. brand,53,0.0009092624680471444,5
  5106. single_document_summarization,53,0.0009092624680471444,29
  5107. cross_lingual_information_retrieval,53,0.0009092624680471444,35
  5108. multiple_model,53,0.0009092624680471444,14
  5109. sl,53,0.0009092624680471444,2
  5110. download,53,0.0009092624680471444,8
  5111. summary_sentence,53,0.0009092624680471444,16
  5112. gcn,53,0.0009092624680471444,3
  5113. arabic_tweet,53,0.0009092624680471444,12
  5114. d'abord,53,0.0009092624680471444,7
  5115. monotonic,53,0.0009092624680471444,9
  5116. extensibility,53,0.0009092624680471444,13
  5117. susceptible,53,0.0009092624680471444,11
  5118. first_system,53,0.0009092624680471444,12
  5119. big_data,53,0.0009092624680471444,8
  5120. special_attention,53,0.0009092624680471444,17
  5121. mrr,53,0.0009092624680471444,3
  5122. cours,53,0.0009092624680471444,5
  5123. averaged,53,0.0009092624680471444,8
  5124. l'ensemble,53,0.0009092624680471444,10
  5125. common_word,53,0.0009092624680471444,11
  5126. unannotated_corpus,53,0.0009092624680471444,18
  5127. outlier,53,0.0009092624680471444,7
  5128. publisher,53,0.0009092624680471444,9
  5129. lee,53,0.0009092624680471444,3
  5130. positive_effect,53,0.0009092624680471444,15
  5131. computer_aided,53,0.0009092624680471444,14
  5132. advantageous,53,0.0009092624680471444,12
  5133. useful_feature,53,0.0009092624680471444,14
  5134. high_order,53,0.0009092624680471444,10
  5135. afterwards,53,0.0009092624680471444,10
  5136. similarit,53,0.0009092624680471444,9
  5137. high_quality_translation,53,0.0009092624680471444,24
  5138. bayesian_network,53,0.0009092624680471444,16
  5139. simulator,53,0.0009092624680471444,9
  5140. dfinition,53,0.0009092624680471444,9
  5141. complex_model,53,0.0009092624680471444,13
  5142. comprehensive_analysis,53,0.0009092624680471444,22
  5143. ordered,52,0.0008921065724236133,7
  5144. open_ie,52,0.0008921065724236133,7
  5145. chunker,52,0.0008921065724236133,7
  5146. unsupervised_algorithm,52,0.0008921065724236133,22
  5147. empirical_investigation,52,0.0008921065724236133,23
  5148. ddi,52,0.0008921065724236133,3
  5149. wmt21,52,0.0008921065724236133,5
  5150. first_phase,52,0.0008921065724236133,11
  5151. graphbased,52,0.0008921065724236133,10
  5152. hmm_based,52,0.0008921065724236133,9
  5153. same_sentence,52,0.0008921065724236133,13
  5154. pcfgs,52,0.0008921065724236133,5
  5155. better_generalization,52,0.0008921065724236133,21
  5156. zero_shot_transfer,52,0.0008921065724236133,18
  5157. fewshot,52,0.0008921065724236133,7
  5158. citizen,52,0.0008921065724236133,7
  5159. major_problem,52,0.0008921065724236133,13
  5160. summary_generation,52,0.0008921065724236133,18
  5161. emnlp,52,0.0008921065724236133,5
  5162. different_form,52,0.0008921065724236133,14
  5163. specific_word,52,0.0008921065724236133,13
  5164. lexical_overlap,52,0.0008921065724236133,15
  5165. new_measure,52,0.0008921065724236133,11
  5166. sector,52,0.0008921065724236133,6
  5167. robust_model,52,0.0008921065724236133,12
  5168. rc,52,0.0008921065724236133,2
  5169. important_resource,52,0.0008921065724236133,18
  5170. vae,52,0.0008921065724236133,3
  5171. up_to_date,52,0.0008921065724236133,10
  5172. billion,52,0.0008921065724236133,7
  5173. episode,52,0.0008921065724236133,7
  5174. deep_reinforcement,52,0.0008921065724236133,18
  5175. highest_score,52,0.0008921065724236133,13
  5176. k_best,52,0.0008921065724236133,6
  5177. cultural_heritage,52,0.0008921065724236133,17
  5178. automatic_question,52,0.0008921065724236133,18
  5179. vaswani,52,0.0008921065724236133,7
  5180. trouble,52,0.0008921065724236133,7
  5181. predictability,52,0.0008921065724236133,14
  5182. synchronous_grammar,52,0.0008921065724236133,19
  5183. ensemble_approach,52,0.0008921065724236133,17
  5184. literacy,52,0.0008921065724236133,8
  5185. sixth,52,0.0008921065724236133,5
  5186. sizable,52,0.0008921065724236133,7
  5187. heterogeneity,52,0.0008921065724236133,13
  5188. small_size,52,0.0008921065724236133,10
  5189. post_editing_effort,52,0.0008921065724236133,19
  5190. dp,52,0.0008921065724236133,2
  5191. multiword_expression,52,0.0008921065724236133,20
  5192. external_data,52,0.0008921065724236133,13
  5193. cumulative,52,0.0008921065724236133,10
  5194. winner,52,0.0008921065724236133,6
  5195. timing,52,0.0008921065724236133,6
  5196. dictionary_entry,52,0.0008921065724236133,16
  5197. personalization,52,0.0008921065724236133,15
  5198. restrictive,52,0.0008921065724236133,11
  5199. different_size,52,0.0008921065724236133,14
  5200. posterior_probability,52,0.0008921065724236133,21
  5201. two_fold,52,0.0008921065724236133,8
  5202. many_to_many,52,0.0008921065724236133,12
  5203. alignment_error,52,0.0008921065724236133,15
  5204. com,52,0.0008921065724236133,3
  5205. celles,52,0.0008921065724236133,6
  5206. customizable,52,0.0008921065724236133,12
  5207. small_data,52,0.0008921065724236133,10
  5208. creativity,52,0.0008921065724236133,10
  5209. laborious,52,0.0008921065724236133,9
  5210. wellknown,52,0.0008921065724236133,9
  5211. new_translation,52,0.0008921065724236133,15
  5212. heuristic_rule,52,0.0008921065724236133,14
  5213. reproduction,52,0.0008921065724236133,12
  5214. auto_encoder,52,0.0008921065724236133,12
  5215. new_york_time,52,0.0008921065724236133,13
  5216. montr,52,0.0008921065724236133,5
  5217. negative_sentiment,52,0.0008921065724236133,18
  5218. aspectual,52,0.0008921065724236133,9
  5219. france,52,0.0008921065724236133,6
  5220. checkpoint,52,0.0008921065724236133,10
  5221. legal_document,52,0.0008921065724236133,14
  5222. understudied,52,0.0008921065724236133,12
  5223. different_classifier,52,0.0008921065724236133,20
  5224. inferential,52,0.0008921065724236133,11
  5225. lower_level,51,0.0008749506768000823,11
  5226. saliency,51,0.0008749506768000823,8
  5227. effective_strategy,51,0.0008749506768000823,18
  5228. many_researcher,51,0.0008749506768000823,15
  5229. grammatical_framework,51,0.0008749506768000823,21
  5230. surveillance,51,0.0008749506768000823,12
  5231. open_domain_question_answering,51,0.0008749506768000823,30
  5232. parallel_training_data,51,0.0008749506768000823,22
  5233. un_analyseur,51,0.0008749506768000823,12
  5234. analyst,51,0.0008749506768000823,7
  5235. low_resource_language_pair,51,0.0008749506768000823,26
  5236. informal_text,51,0.0008749506768000823,13
  5237. top_ranked,51,0.0008749506768000823,10
  5238. different_class,51,0.0008749506768000823,15
  5239. standard_language,51,0.0008749506768000823,17
  5240. predictive_performance,51,0.0008749506768000823,22
  5241. large_data_set,51,0.0008749506768000823,14
  5242. font,51,0.0008749506768000823,4
  5243. baseline_method,51,0.0008749506768000823,15
  5244. death,51,0.0008749506768000823,5
  5245. transformer_architecture,51,0.0008749506768000823,24
  5246. slavic_language,51,0.0008749506768000823,15
  5247. unlabelled_data,51,0.0008749506768000823,15
  5248. covid_19_pandemic,51,0.0008749506768000823,17
  5249. available_training_data,51,0.0008749506768000823,23
  5250. baseline_system,51,0.0008749506768000823,15
  5251. finitestate,51,0.0008749506768000823,11
  5252. er,51,0.0008749506768000823,2
  5253. debiasing,51,0.0008749506768000823,9
  5254. grapheme,51,0.0008749506768000823,8
  5255. same_way,51,0.0008749506768000823,8
  5256. worst,51,0.0008749506768000823,5
  5257. unlexicalized,51,0.0008749506768000823,13
  5258. multilingual_machine,51,0.0008749506768000823,20
  5259. searching,51,0.0008749506768000823,9
  5260. further_investigation,51,0.0008749506768000823,21
  5261. same_corpus,51,0.0008749506768000823,11
  5262. molecular,51,0.0008749506768000823,9
  5263. first_task,51,0.0008749506768000823,10
  5264. key_issue,51,0.0008749506768000823,9
  5265. catgories,51,0.0008749506768000823,9
  5266. subclass,51,0.0008749506768000823,8
  5267. additional_resource,51,0.0008749506768000823,19
  5268. front,51,0.0008749506768000823,5
  5269. flaw,51,0.0008749506768000823,4
  5270. parametric,51,0.0008749506768000823,10
  5271. non_compositional,51,0.0008749506768000823,17
  5272. english_verb,51,0.0008749506768000823,12
  5273. marked,51,0.0008749506768000823,6
  5274. emojis,51,0.0008749506768000823,6
  5275. slt,51,0.0008749506768000823,3
  5276. hand_annotated,51,0.0008749506768000823,14
  5277. tongue,51,0.0008749506768000823,6
  5278. adjectival,51,0.0008749506768000823,10
  5279. comparables,51,0.0008749506768000823,11
  5280. natural_language_application,51,0.0008749506768000823,28
  5281. visant,51,0.0008749506768000823,6
  5282. vidence,51,0.0008749506768000823,7
  5283. bilstm_crf,51,0.0008749506768000823,10
  5284. prosodic_feature,51,0.0008749506768000823,16
  5285. fake_news_detection,51,0.0008749506768000823,19
  5286. principe,51,0.0008749506768000823,8
  5287. similar_sentence,51,0.0008749506768000823,16
  5288. blind_test,51,0.0008749506768000823,10
  5289. medical_language,51,0.0008749506768000823,16
  5290. cantonese,51,0.0008749506768000823,9
  5291. contiguous,51,0.0008749506768000823,10
  5292. complex_word_identification,51,0.0008749506768000823,27
  5293. computer_assisted_translation,51,0.0008749506768000823,29
  5294. top_k,51,0.0008749506768000823,5
  5295. coarse_to_fine,51,0.0008749506768000823,14
  5296. open_access,51,0.0008749506768000823,11
  5297. under_explored,51,0.0008749506768000823,14
  5298. film,51,0.0008749506768000823,4
  5299. stateof_the_art_model,51,0.0008749506768000823,21
  5300. segmental,51,0.0008749506768000823,9
  5301. assist,51,0.0008749506768000823,6
  5302. intellectual,51,0.0008749506768000823,12
  5303. original_sentence,51,0.0008749506768000823,17
  5304. frequent_word,51,0.0008749506768000823,13
  5305. parse_tree,51,0.0008749506768000823,10
  5306. break,51,0.0008749506768000823,5
  5307. dev,50,0.0008577947811765513,3
  5308. phrase_based_mt,50,0.0008577947811765513,15
  5309. novel_data,50,0.0008577947811765513,10
  5310. utilize,50,0.0008577947811765513,7
  5311. mature,50,0.0008577947811765513,6
  5312. english_to_chinese,50,0.0008577947811765513,18
  5313. sentence_aligned,50,0.0008577947811765513,16
  5314. bottom,50,0.0008577947811765513,6
  5315. _which,50,0.0008577947811765513,6
  5316. massive_amount,50,0.0008577947811765513,14
  5317. parts_of_speech,50,0.0008577947811765513,15
  5318. safe,50,0.0008577947811765513,4
  5319. editorial,50,0.0008577947811765513,9
  5320. tutor,50,0.0008577947811765513,5
  5321. une_tude,50,0.0008577947811765513,8
  5322. screen,50,0.0008577947811765513,6
  5323. column,50,0.0008577947811765513,6
  5324. finer_grained,50,0.0008577947811765513,13
  5325. ralise,50,0.0008577947811765513,6
  5326. elementary_tree,50,0.0008577947811765513,15
  5327. objectif,50,0.0008577947811765513,8
  5328. dot,50,0.0008577947811765513,3
  5329. ranked_list,50,0.0008577947811765513,11
  5330. incoherent,50,0.0008577947811765513,10
  5331. lesser,50,0.0008577947811765513,6
  5332. microsoft_research,50,0.0008577947811765513,18
  5333. indigenous_language,50,0.0008577947811765513,19
  5334. statistical_mt_system,50,0.0008577947811765513,21
  5335. soft_constraint,50,0.0008577947811765513,15
  5336. bow,50,0.0008577947811765513,3
  5337. auc,50,0.0008577947811765513,3
  5338. bitexts,50,0.0008577947811765513,7
  5339. standardization,50,0.0008577947811765513,15
  5340. imdb,50,0.0008577947811765513,4
  5341. new_text,50,0.0008577947811765513,8
  5342. statistical_measure,50,0.0008577947811765513,19
  5343. chinese_language_processing,50,0.0008577947811765513,27
  5344. second_part,50,0.0008577947811765513,11
  5345. crosslingual_transfer,50,0.0008577947811765513,21
  5346. dog,50,0.0008577947811765513,3
  5347. routine,50,0.0008577947811765513,7
  5348. ample,50,0.0008577947811765513,5
  5349. anyone,50,0.0008577947811765513,6
  5350. lower_bound,50,0.0008577947811765513,11
  5351. therefore,50,0.0008577947811765513,9
  5352. simplest,50,0.0008577947811765513,8
  5353. post_hoc,50,0.0008577947811765513,8
  5354. other_resource,50,0.0008577947811765513,14
  5355. automated_evaluation,50,0.0008577947811765513,20
  5356. hybrid_method,50,0.0008577947811765513,13
  5357. two_phase,50,0.0008577947811765513,9
  5358. sensible,50,0.0008577947811765513,8
  5359. non_verbal,50,0.0008577947811765513,10
  5360. substantial_gain,50,0.0008577947811765513,16
  5361. supervise,50,0.0008577947811765513,9
  5362. copying,50,0.0008577947811765513,7
  5363. prise,50,0.0008577947811765513,5
  5364. ldc,50,0.0008577947811765513,3
  5365. obtains,50,0.0008577947811765513,7
  5366. first_version,50,0.0008577947811765513,13
  5367. final_translation,50,0.0008577947811765513,17
  5368. key_aspect,50,0.0008577947811765513,10
  5369. hedge,50,0.0008577947811765513,5
  5370. s'agit,50,0.0008577947811765513,6
  5371. historical_linguistics,50,0.0008577947811765513,22
  5372. textuelles,50,0.0008577947811765513,10
  5373. child_directed,50,0.0008577947811765513,14
  5374. zhang,50,0.0008577947811765513,5
  5375. bleu_point,50,0.0008577947811765513,10
  5376. english_to_german,50,0.0008577947811765513,17
  5377. seq2seq_model,50,0.0008577947811765513,13
  5378. manifold,50,0.0008577947811765513,8
  5379. reflection,50,0.0008577947811765513,10
  5380. trade,50,0.0008577947811765513,5
  5381. different_layer,50,0.0008577947811765513,15
  5382. depuis,50,0.0008577947811765513,6
  5383. second_language_acquisition,49,0.0008406388855530203,27
  5384. denotation,49,0.0008406388855530203,10
  5385. social_interaction,49,0.0008406388855530203,18
  5386. finer,49,0.0008406388855530203,5
  5387. qa_datasets,49,0.0008406388855530203,11
  5388. data_driven_method,49,0.0008406388855530203,18
  5389. une_reprsentation,49,0.0008406388855530203,17
  5390. semantic_role_label,49,0.0008406388855530203,19
  5391. bilingual_text,49,0.0008406388855530203,14
  5392. small_datasets,49,0.0008406388855530203,14
  5393. semantic_concept,49,0.0008406388855530203,16
  5394. satisfactory_result,49,0.0008406388855530203,19
  5395. littrature,49,0.0008406388855530203,10
  5396. app,49,0.0008406388855530203,3
  5397. edited,49,0.0008406388855530203,6
  5398. new_paradigm,49,0.0008406388855530203,12
  5399. new_tool,49,0.0008406388855530203,8
  5400. large_document,49,0.0008406388855530203,14
  5401. open_source_tool,49,0.0008406388855530203,16
  5402. md,49,0.0008406388855530203,2
  5403. sure,49,0.0008406388855530203,4
  5404. significant_performance_gain,49,0.0008406388855530203,28
  5405. comprises,49,0.0008406388855530203,9
  5406. portuguese_language,49,0.0008406388855530203,19
  5407. conventional_approach,49,0.0008406388855530203,21
  5408. clark,49,0.0008406388855530203,5
  5409. convex,49,0.0008406388855530203,6
  5410. whilst,49,0.0008406388855530203,6
  5411. distractors,49,0.0008406388855530203,11
  5412. agenda,49,0.0008406388855530203,6
  5413. more_detail,49,0.0008406388855530203,11
  5414. smooth,49,0.0008406388855530203,6
  5415. morphological_tagging,49,0.0008406388855530203,21
  5416. injection,49,0.0008406388855530203,9
  5417. offensive_content,49,0.0008406388855530203,17
  5418. next_word,49,0.0008406388855530203,9
  5419. k_nearest,49,0.0008406388855530203,9
  5420. translationese,49,0.0008406388855530203,14
  5421. essential_component,49,0.0008406388855530203,19
  5422. apis,49,0.0008406388855530203,4
  5423. essential_task,49,0.0008406388855530203,14
  5424. nomm'ees,49,0.0008406388855530203,8
  5425. annotated_sentence,49,0.0008406388855530203,18
  5426. vary,49,0.0008406388855530203,4
  5427. intern,49,0.0008406388855530203,6
  5428. mlp,49,0.0008406388855530203,3
  5429. fundamental_problem,49,0.0008406388855530203,19
  5430. english_russian,49,0.0008406388855530203,15
  5431. same_model,49,0.0008406388855530203,10
  5432. social_bias,49,0.0008406388855530203,11
  5433. segmented,49,0.0008406388855530203,9
  5434. misogyny,49,0.0008406388855530203,8
  5435. grammatical_error_detection,49,0.0008406388855530203,27
  5436. average_improvement,49,0.0008406388855530203,19
  5437. monolingual_word,49,0.0008406388855530203,16
  5438. upcoming,49,0.0008406388855530203,8
  5439. overfitting,49,0.0008406388855530203,11
  5440. main_finding,49,0.0008406388855530203,12
  5441. real_valued,49,0.0008406388855530203,11
  5442. hyponym,49,0.0008406388855530203,7
  5443. dmonstration,49,0.0008406388855530203,12
  5444. complementary_information,49,0.0008406388855530203,25
  5445. finite_state_automaton,49,0.0008406388855530203,22
  5446. further_experiment,49,0.0008406388855530203,18
  5447. labeled_example,49,0.0008406388855530203,15
  5448. primary_submission,49,0.0008406388855530203,18
  5449. charge,49,0.0008406388855530203,6
  5450. handle,49,0.0008406388855530203,6
  5451. bilingual_terminology,49,0.0008406388855530203,21
  5452. alignment_quality,49,0.0008406388855530203,17
  5453. parliamentary,49,0.0008406388855530203,13
  5454. global_feature,49,0.0008406388855530203,14
  5455. semcor,49,0.0008406388855530203,6
  5456. kit,49,0.0008406388855530203,3
  5457. language_dependent,49,0.0008406388855530203,18
  5458. bracketing,49,0.0008406388855530203,10
  5459. powerful_tool,49,0.0008406388855530203,13
  5460. contradictory,49,0.0008406388855530203,13
  5461. face_to_face,49,0.0008406388855530203,12
  5462. formalisme,49,0.0008406388855530203,10
  5463. first_part,49,0.0008406388855530203,10
  5464. cration,49,0.0008406388855530203,7
  5465. timeml,49,0.0008406388855530203,6
  5466. simple_feature,49,0.0008406388855530203,14
  5467. considerable_attention,49,0.0008406388855530203,22
  5468. linguistic_processing,49,0.0008406388855530203,21
  5469. door,49,0.0008406388855530203,4
  5470. tonal,48,0.0008234829899294892,5
  5471. encoded,48,0.0008234829899294892,7
  5472. noisy_channel_model,48,0.0008234829899294892,19
  5473. principled_way,48,0.0008234829899294892,14
  5474. linguistic_characteristic,48,0.0008234829899294892,25
  5475. agglomerative,48,0.0008234829899294892,13
  5476. large_vocabulary,48,0.0008234829899294892,16
  5477. back_off,48,0.0008234829899294892,8
  5478. social_medium_content,48,0.0008234829899294892,21
  5479. contest,48,0.0008234829899294892,7
  5480. phrase_structure,48,0.0008234829899294892,16
  5481. different_sens,48,0.0008234829899294892,14
  5482. axiom,48,0.0008234829899294892,5
  5483. wmt17,48,0.0008234829899294892,5
  5484. verb_noun,48,0.0008234829899294892,9
  5485. spcifique,48,0.0008234829899294892,9
  5486. transformation_based,48,0.0008234829899294892,20
  5487. hotpotqa,48,0.0008234829899294892,8
  5488. comparability,48,0.0008234829899294892,13
  5489. test_set,48,0.0008234829899294892,8
  5490. timely,48,0.0008234829899294892,6
  5491. limited_resource,48,0.0008234829899294892,16
  5492. _an,48,0.0008234829899294892,3
  5493. herein,48,0.0008234829899294892,6
  5494. rumor,48,0.0008234829899294892,5
  5495. holder,48,0.0008234829899294892,6
  5496. nlp_method,48,0.0008234829899294892,10
  5497. rich_resource,48,0.0008234829899294892,13
  5498. tagsets,48,0.0008234829899294892,7
  5499. unprecedented,48,0.0008234829899294892,13
  5500. nommes,48,0.0008234829899294892,6
  5501. curated,48,0.0008234829899294892,7
  5502. unsupervised_machine_translation,48,0.0008234829899294892,32
  5503. cost_effective,48,0.0008234829899294892,14
  5504. critical_role,48,0.0008234829899294892,13
  5505. many_downstream,48,0.0008234829899294892,15
  5506. negated,48,0.0008234829899294892,7
  5507. syntagmatic,48,0.0008234829899294892,11
  5508. proportional,48,0.0008234829899294892,12
  5509. syntactic_context,48,0.0008234829899294892,17
  5510. individual_sentence,48,0.0008234829899294892,19
  5511. visual_scene,48,0.0008234829899294892,12
  5512. user_review,48,0.0008234829899294892,11
  5513. systematic_comparison,48,0.0008234829899294892,21
  5514. incorporate,48,0.0008234829899294892,11
  5515. lexical_meaning,48,0.0008234829899294892,15
  5516. confident,48,0.0008234829899294892,9
  5517. prior_research,48,0.0008234829899294892,14
  5518. hashtag,48,0.0008234829899294892,7
  5519. money,48,0.0008234829899294892,5
  5520. rwth,48,0.0008234829899294892,4
  5521. significant_impact,48,0.0008234829899294892,18
  5522. asset,48,0.0008234829899294892,5
  5523. hand_written,48,0.0008234829899294892,12
  5524. lexicaux,48,0.0008234829899294892,8
  5525. bilingual_lexicon_extraction,48,0.0008234829899294892,28
  5526. final_prediction,48,0.0008234829899294892,16
  5527. post_editors,48,0.0008234829899294892,12
  5528. open_track,48,0.0008234829899294892,10
  5529. several_feature,48,0.0008234829899294892,15
  5530. tl,48,0.0008234829899294892,2
  5531. generated_response,48,0.0008234829899294892,18
  5532. compressed,48,0.0008234829899294892,10
  5533. actionable,48,0.0008234829899294892,10
  5534. many_domain,48,0.0008234829899294892,11
  5535. max,48,0.0008234829899294892,3
  5536. wmt18,48,0.0008234829899294892,5
  5537. bnc,48,0.0008234829899294892,3
  5538. multi_class_classification,48,0.0008234829899294892,26
  5539. useful_resource,48,0.0008234829899294892,15
  5540. negotiation,48,0.0008234829899294892,11
  5541. error_prone,48,0.0008234829899294892,11
  5542. linguistic_representation,48,0.0008234829899294892,25
  5543. shot,48,0.0008234829899294892,4
  5544. council,48,0.0008234829899294892,7
  5545. ultimate_goal,48,0.0008234829899294892,13
  5546. interactive_system,48,0.0008234829899294892,18
  5547. becomes,48,0.0008234829899294892,7
  5548. second_method,48,0.0008234829899294892,13
  5549. learning_based_approach,48,0.0008234829899294892,23
  5550. couverture,48,0.0008234829899294892,10
  5551. endeavor,48,0.0008234829899294892,8
  5552. factual_knowledge,48,0.0008234829899294892,17
  5553. promising_direction,47,0.0008063270943059582,19
  5554. locuteurs,47,0.0008063270943059582,9
  5555. cmu,47,0.0008063270943059582,3
  5556. semantic_equivalence,47,0.0008063270943059582,20
  5557. pretrained_transformer,47,0.0008063270943059582,22
  5558. semi_automated,47,0.0008063270943059582,14
  5559. biaffine,47,0.0008063270943059582,8
  5560. parmi,47,0.0008063270943059582,5
  5561. avant,47,0.0008063270943059582,5
  5562. individual_model,47,0.0008063270943059582,16
  5563. l'adaptation,47,0.0008063270943059582,12
  5564. different_target,47,0.0008063270943059582,16
  5565. different_user,47,0.0008063270943059582,14
  5566. syntax_based_machine_translation,47,0.0008063270943059582,32
  5567. visual_context,47,0.0008063270943059582,14
  5568. single_domain,47,0.0008063270943059582,13
  5569. continuous_vector,47,0.0008063270943059582,17
  5570. excerpt,47,0.0008063270943059582,7
  5571. executable,47,0.0008063270943059582,10
  5572. domain_specific_knowledge,47,0.0008063270943059582,25
  5573. different_sentence,47,0.0008063270943059582,18
  5574. syntax_based_machine,47,0.0008063270943059582,20
  5575. future_study,47,0.0008063270943059582,12
  5576. different_architecture,47,0.0008063270943059582,22
  5577. co_occurring,47,0.0008063270943059582,12
  5578. contraintes,47,0.0008063270943059582,11
  5579. gaussian_mixture_model,47,0.0008063270943059582,22
  5580. ideology,47,0.0008063270943059582,8
  5581. heterogeneous_graph,47,0.0008063270943059582,19
  5582. other_application,47,0.0008063270943059582,17
  5583. linearization,47,0.0008063270943059582,13
  5584. wide_margin,47,0.0008063270943059582,11
  5585. various_source,47,0.0008063270943059582,14
  5586. s'emantiques,47,0.0008063270943059582,12
  5587. workbench,47,0.0008063270943059582,9
  5588. further_development,47,0.0008063270943059582,19
  5589. public_opinion,47,0.0008063270943059582,14
  5590. one_to_many,47,0.0008063270943059582,11
  5591. morphological_analyser,47,0.0008063270943059582,22
  5592. aspect_category,47,0.0008063270943059582,15
  5593. linguistic_variation,47,0.0008063270943059582,20
  5594. e2e,47,0.0008063270943059582,3
  5595. severity,47,0.0008063270943059582,8
  5596. lieu,47,0.0008063270943059582,4
  5597. main_component,47,0.0008063270943059582,14
  5598. minimalist,47,0.0008063270943059582,10
  5599. detailed_error,47,0.0008063270943059582,14
  5600. nn,47,0.0008063270943059582,2
  5601. kannada,47,0.0008063270943059582,7
  5602. celui,47,0.0008063270943059582,5
  5603. rhetorical_relation,47,0.0008063270943059582,19
  5604. credit,47,0.0008063270943059582,6
  5605. progression,47,0.0008063270943059582,11
  5606. different_topic,47,0.0008063270943059582,15
  5607. second_phase,47,0.0008063270943059582,12
  5608. marketing,47,0.0008063270943059582,9
  5609. qg,47,0.0008063270943059582,2
  5610. planner,47,0.0008063270943059582,7
  5611. web_application,47,0.0008063270943059582,15
  5612. bridging,47,0.0008063270943059582,8
  5613. simple_sentence,47,0.0008063270943059582,15
  5614. provide,47,0.0008063270943059582,7
  5615. finite_state_machine,47,0.0008063270943059582,20
  5616. human_robot_interaction,47,0.0008063270943059582,23
  5617. syntactic_level,47,0.0008063270943059582,15
  5618. answer_selection,47,0.0008063270943059582,16
  5619. lexical_category,47,0.0008063270943059582,16
  5620. self,47,0.0008063270943059582,4
  5621. designer,47,0.0008063270943059582,8
  5622. delay,47,0.0008063270943059582,5
  5623. autonomous,47,0.0008063270943059582,10
  5624. best_score,47,0.0008063270943059582,10
  5625. phrase_based_translation_system,47,0.0008063270943059582,31
  5626. multilingual_resource,47,0.0008063270943059582,21
  5627. singular_value,47,0.0008063270943059582,14
  5628. regularizer,47,0.0008063270943059582,11
  5629. lexical_representation,47,0.0008063270943059582,22
  5630. pyramid,47,0.0008063270943059582,7
  5631. new_version,47,0.0008063270943059582,11
  5632. multilingual_data,47,0.0008063270943059582,17
  5633. commission,47,0.0008063270943059582,10
  5634. qu'une,47,0.0008063270943059582,6
  5635. subsystem,47,0.0008063270943059582,9
  5636. infinite,47,0.0008063270943059582,8
  5637. mit,47,0.0008063270943059582,3
  5638. long_sequence,47,0.0008063270943059582,13
  5639. exprience,47,0.0008063270943059582,9
  5640. profit,47,0.0008063270943059582,6
  5641. fouille,47,0.0008063270943059582,7
  5642. tale,47,0.0008063270943059582,4
  5643. median,47,0.0008063270943059582,6
  5644. berkeley,47,0.0008063270943059582,8
  5645. main_result,47,0.0008063270943059582,11
  5646. lorsque,46,0.0007891711986824273,7
  5647. alignment_based,46,0.0007891711986824273,15
  5648. possible_translation,46,0.0007891711986824273,20
  5649. nouvelles,46,0.0007891711986824273,9
  5650. vulnerability,46,0.0007891711986824273,13
  5651. violence,46,0.0007891711986824273,8
  5652. shallow_discourse,46,0.0007891711986824273,17
  5653. end_to_end_speech,46,0.0007891711986824273,17
  5654. several_datasets,46,0.0007891711986824273,16
  5655. word_by_word,46,0.0007891711986824273,12
  5656. high_correlation,46,0.0007891711986824273,16
  5657. stand_alone,46,0.0007891711986824273,11
  5658. naive_bayes_classifier,46,0.0007891711986824273,22
  5659. similar_context,46,0.0007891711986824273,15
  5660. byte,46,0.0007891711986824273,4
  5661. identifiable,46,0.0007891711986824273,12
  5662. previous_year,46,0.0007891711986824273,13
  5663. user_interaction,46,0.0007891711986824273,16
  5664. multiple_word,46,0.0007891711986824273,13
  5665. polar,46,0.0007891711986824273,5
  5666. negative_sample,46,0.0007891711986824273,15
  5667. general_language,46,0.0007891711986824273,16
  5668. japanese_sentence,46,0.0007891711986824273,17
  5669. context_vector,46,0.0007891711986824273,14
  5670. rich_information,46,0.0007891711986824273,16
  5671. entire_document,46,0.0007891711986824273,15
  5672. neural_net,46,0.0007891711986824273,10
  5673. ongoing_project,46,0.0007891711986824273,15
  5674. codemixed,46,0.0007891711986824273,9
  5675. tokenizer,46,0.0007891711986824273,9
  5676. abstractive_summarization_model,46,0.0007891711986824273,31
  5677. rsultat,46,0.0007891711986824273,7
  5678. in_domain_training,46,0.0007891711986824273,18
  5679. main_advantage,46,0.0007891711986824273,14
  5680. leaf,46,0.0007891711986824273,4
  5681. one_to_one,46,0.0007891711986824273,10
  5682. tested,46,0.0007891711986824273,6
  5683. visible,46,0.0007891711986824273,7
  5684. modified_version,46,0.0007891711986824273,16
  5685. medical_concept,46,0.0007891711986824273,15
  5686. sinica,46,0.0007891711986824273,6
  5687. document_classification,46,0.0007891711986824273,23
  5688. same_text,46,0.0007891711986824273,9
  5689. short_term_memory_network,46,0.0007891711986824273,25
  5690. ironic,46,0.0007891711986824273,6
  5691. unification_based,46,0.0007891711986824273,17
  5692. give,46,0.0007891711986824273,4
  5693. polysynthetic,46,0.0007891711986824273,13
  5694. equality,46,0.0007891711986824273,8
  5695. human_being,46,0.0007891711986824273,11
  5696. implicit_relation,46,0.0007891711986824273,17
  5697. hub,46,0.0007891711986824273,3
  5698. english_to_japanese,46,0.0007891711986824273,19
  5699. corpus_based_study,46,0.0007891711986824273,18
  5700. latvian,46,0.0007891711986824273,7
  5701. variable_length,46,0.0007891711986824273,15
  5702. graphical_user,46,0.0007891711986824273,14
  5703. nation,46,0.0007891711986824273,6
  5704. catastrophic_forgetting,46,0.0007891711986824273,23
  5705. ax,46,0.0007891711986824273,2
  5706. house,46,0.0007891711986824273,5
  5707. natural_language_instruction,46,0.0007891711986824273,28
  5708. past_year,46,0.0007891711986824273,9
  5709. pre_processing_step,46,0.0007891711986824273,19
  5710. commitment,46,0.0007891711986824273,10
  5711. new_application,46,0.0007891711986824273,15
  5712. mots_cls,46,0.0007891711986824273,8
  5713. explicit_discourse,46,0.0007891711986824273,18
  5714. diagram,46,0.0007891711986824273,7
  5715. standard_word,46,0.0007891711986824273,13
  5716. bilingue,46,0.0007891711986824273,8
  5717. porte,46,0.0007891711986824273,5
  5718. detailed_error_analysis,46,0.0007891711986824273,23
  5719. pronounced,46,0.0007891711986824273,10
  5720. probabilistic_approach,46,0.0007891711986824273,22
  5721. code_mixed_data,46,0.0007891711986824273,15
  5722. deaf,46,0.0007891711986824273,4
  5723. ensembling,46,0.0007891711986824273,10
  5724. tempeval,46,0.0007891711986824273,8
  5725. online_community,46,0.0007891711986824273,16
  5726. source_target,46,0.0007891711986824273,13
  5727. on_the_fly,46,0.0007891711986824273,10
  5728. multilingual_nmt,46,0.0007891711986824273,16
  5729. wizard_of_oz,46,0.0007891711986824273,12
  5730. vaswani_et,46,0.0007891711986824273,10
  5731. false_positive,46,0.0007891711986824273,14
  5732. 1_best,46,0.0007891711986824273,6
  5733. impression,46,0.0007891711986824273,10
  5734. observe,46,0.0007891711986824273,7
  5735. propos,46,0.0007891711986824273,6
  5736. elles,46,0.0007891711986824273,5
  5737. better_quality,46,0.0007891711986824273,14
  5738. different_data_set,46,0.0007891711986824273,18
  5739. backoff,46,0.0007891711986824273,7
  5740. discriminant,46,0.0007891711986824273,12
  5741. few_example,46,0.0007891711986824273,11
  5742. euclidean,46,0.0007891711986824273,9
  5743. graphical_user_interface,46,0.0007891711986824273,24
  5744. discursive,46,0.0007891711986824273,10
  5745. bird,46,0.0007891711986824273,4
  5746. assistive,46,0.0007891711986824273,9
  5747. bilingual_sentence,46,0.0007891711986824273,18
  5748. labeled_data,46,0.0007891711986824273,12
  5749. fail,46,0.0007891711986824273,4
  5750. indo_aryan,46,0.0007891711986824273,10
  5751. cohen,46,0.0007891711986824273,5
  5752. duplicate,46,0.0007891711986824273,9
  5753. visual_representation,45,0.0007720153030588961,21
  5754. english_datasets,45,0.0007720153030588961,16
  5755. first_author,45,0.0007720153030588961,12
  5756. cky,45,0.0007720153030588961,3
  5757. annotated_resource,45,0.0007720153030588961,18
  5758. gpt,45,0.0007720153030588961,3
  5759. twofold,45,0.0007720153030588961,7
  5760. neighboring,45,0.0007720153030588961,11
  5761. multilingual_parsing,45,0.0007720153030588961,20
  5762. question_answering_system,45,0.0007720153030588961,25
  5763. dfi,45,0.0007720153030588961,3
  5764. multimodal_machine,45,0.0007720153030588961,18
  5765. switch,45,0.0007720153030588961,6
  5766. uima,45,0.0007720153030588961,4
  5767. hinders,45,0.0007720153030588961,7
  5768. replication,45,0.0007720153030588961,11
  5769. minimum_error,45,0.0007720153030588961,13
  5770. un_modle,45,0.0007720153030588961,8
  5771. negative_sampling,45,0.0007720153030588961,17
  5772. hybrid_machine,45,0.0007720153030588961,14
  5773. english_dataset,45,0.0007720153030588961,15
  5774. state_of_theart_method,45,0.0007720153030588961,22
  5775. critres,45,0.0007720153030588961,7
  5776. negative_effect,45,0.0007720153030588961,15
  5777. pdf,45,0.0007720153030588961,3
  5778. little_research,45,0.0007720153030588961,15
  5779. morphological_reinflection,45,0.0007720153030588961,26
  5780. twelve,45,0.0007720153030588961,6
  5781. popular_approach,45,0.0007720153030588961,16
  5782. syntax_aware,45,0.0007720153030588961,12
  5783. oov_word,45,0.0007720153030588961,8
  5784. non_neural,45,0.0007720153030588961,10
  5785. next_generation,45,0.0007720153030588961,15
  5786. entropy_based,45,0.0007720153030588961,13
  5787. transform,45,0.0007720153030588961,9
  5788. centroid,45,0.0007720153030588961,8
  5789. pre_trained_bert_model,45,0.0007720153030588961,22
  5790. articulatory,45,0.0007720153030588961,12
  5791. vaswani_et_al.,45,0.0007720153030588961,14
  5792. non_experts,45,0.0007720153030588961,11
  5793. central_role,45,0.0007720153030588961,12
  5794. built_in,45,0.0007720153030588961,8
  5795. several_language_pair,45,0.0007720153030588961,21
  5796. current_paper,45,0.0007720153030588961,13
  5797. centrality,45,0.0007720153030588961,10
  5798. low_rank,45,0.0007720153030588961,8
  5799. na,45,0.0007720153030588961,2
  5800. presidential,45,0.0007720153030588961,12
  5801. corpus_level,45,0.0007720153030588961,12
  5802. argue,45,0.0007720153030588961,5
  5803. binding,45,0.0007720153030588961,7
  5804. confirmation,45,0.0007720153030588961,12
  5805. island,45,0.0007720153030588961,6
  5806. statistical_information,45,0.0007720153030588961,23
  5807. theoretical_framework,45,0.0007720153030588961,21
  5808. adaption,45,0.0007720153030588961,8
  5809. lengthy,45,0.0007720153030588961,7
  5810. expert_annotation,45,0.0007720153030588961,17
  5811. many_people,45,0.0007720153030588961,11
  5812. similar_meaning,45,0.0007720153030588961,15
  5813. semeval_2014_task,45,0.0007720153030588961,17
  5814. natural_way,45,0.0007720153030588961,11
  5815. clpsych,45,0.0007720153030588961,7
  5816. tourism,45,0.0007720153030588961,7
  5817. future_improvement,45,0.0007720153030588961,18
  5818. surrogate,45,0.0007720153030588961,9
  5819. other_researcher,45,0.0007720153030588961,16
  5820. crucial_step,45,0.0007720153030588961,12
  5821. irrespective,45,0.0007720153030588961,12
  5822. singular_value_decomposition,45,0.0007720153030588961,28
  5823. unaligned,45,0.0007720153030588961,9
  5824. free_grammar,45,0.0007720153030588961,12
  5825. word_to_word,45,0.0007720153030588961,12
  5826. experimental_data,45,0.0007720153030588961,17
  5827. multilingual_system,45,0.0007720153030588961,19
  5828. annots,45,0.0007720153030588961,6
  5829. intonation,45,0.0007720153030588961,10
  5830. segmenters,45,0.0007720153030588961,10
  5831. gated_recurrent,45,0.0007720153030588961,15
  5832. stemmer,45,0.0007720153030588961,7
  5833. null,45,0.0007720153030588961,4
  5834. undergraduate,45,0.0007720153030588961,13
  5835. phonetic_transcription,45,0.0007720153030588961,22
  5836. subject_verb,45,0.0007720153030588961,12
  5837. tiny,45,0.0007720153030588961,4
  5838. statistical_word,45,0.0007720153030588961,16
  5839. multitude,45,0.0007720153030588961,9
  5840. lexical_acquisition,45,0.0007720153030588961,19
  5841. politeness,45,0.0007720153030588961,10
  5842. conversational_context,45,0.0007720153030588961,22
  5843. unsupervised_setting,45,0.0007720153030588961,20
  5844. selector,45,0.0007720153030588961,8
  5845. recorded,45,0.0007720153030588961,8
  5846. arabic_to_english,45,0.0007720153030588961,17
  5847. cambridge,45,0.0007720153030588961,9
  5848. linear_combination,45,0.0007720153030588961,18
  5849. stacking,44,0.0007548594074353652,8
  5850. advertising,44,0.0007548594074353652,11
  5851. semantic_search,44,0.0007548594074353652,15
  5852. telle,44,0.0007548594074353652,5
  5853. dag,44,0.0007548594074353652,3
  5854. unsupervised_way,44,0.0007548594074353652,16
  5855. ct,44,0.0007548594074353652,2
  5856. proposes,44,0.0007548594074353652,8
  5857. cooccurrences,44,0.0007548594074353652,13
  5858. missing,44,0.0007548594074353652,7
  5859. robotic,44,0.0007548594074353652,7
  5860. new_data_set,44,0.0007548594074353652,12
  5861. better_representation,44,0.0007548594074353652,21
  5862. conclude,44,0.0007548594074353652,8
  5863. deeper_understanding,44,0.0007548594074353652,20
  5864. traductions,44,0.0007548594074353652,11
  5865. pmi,44,0.0007548594074353652,3
  5866. open_challenge,44,0.0007548594074353652,14
  5867. unseen_test,44,0.0007548594074353652,11
  5868. notre_approche,44,0.0007548594074353652,14
  5869. linguistic_context,44,0.0007548594074353652,18
  5870. african_language,44,0.0007548594074353652,16
  5871. linguistic_description,44,0.0007548594074353652,22
  5872. negative_impact,44,0.0007548594074353652,15
  5873. multilingual_machine_translation,44,0.0007548594074353652,32
  5874. alternative_method,44,0.0007548594074353652,18
  5875. stratgies,44,0.0007548594074353652,9
  5876. structured_representation,44,0.0007548594074353652,25
  5877. textual_representation,44,0.0007548594074353652,22
  5878. contextualization,44,0.0007548594074353652,17
  5879. disentanglement,44,0.0007548594074353652,15
  5880. light_verb_construction,44,0.0007548594074353652,23
  5881. pathway,44,0.0007548594074353652,7
  5882. novel_word,44,0.0007548594074353652,10
  5883. resolvers,44,0.0007548594074353652,9
  5884. see,44,0.0007548594074353652,3
  5885. rponse,44,0.0007548594074353652,6
  5886. frequency_based,44,0.0007548594074353652,15
  5887. bilingual_parallel_corpus,44,0.0007548594074353652,25
  5888. principal_component,44,0.0007548594074353652,19
  5889. salient_information,44,0.0007548594074353652,19
  5890. n_ary,44,0.0007548594074353652,5
  5891. tel,44,0.0007548594074353652,3
  5892. stochastic_gradient,44,0.0007548594074353652,19
  5893. narrative_text,44,0.0007548594074353652,14
  5894. pr,44,0.0007548594074353652,2
  5895. asian_translation,44,0.0007548594074353652,17
  5896. ethic,44,0.0007548594074353652,5
  5897. graduate,44,0.0007548594074353652,8
  5898. stakeholder,44,0.0007548594074353652,11
  5899. abusive_language_detection,44,0.0007548594074353652,26
  5900. rigid,44,0.0007548594074353652,5
  5901. owl,44,0.0007548594074353652,3
  5902. concordance,44,0.0007548594074353652,11
  5903. binary_classification_problem,44,0.0007548594074353652,29
  5904. mt_quality,44,0.0007548594074353652,10
  5905. main_objective,44,0.0007548594074353652,14
  5906. thmatique,44,0.0007548594074353652,9
  5907. donn,44,0.0007548594074353652,4
  5908. few_study,44,0.0007548594074353652,9
  5909. emergency,44,0.0007548594074353652,9
  5910. multilinguality,44,0.0007548594074353652,15
  5911. keystroke,44,0.0007548594074353652,9
  5912. serial,44,0.0007548594074353652,6
  5913. animation,44,0.0007548594074353652,9
  5914. clausal,44,0.0007548594074353652,7
  5915. graph_based_method,44,0.0007548594074353652,18
  5916. itg,44,0.0007548594074353652,3
  5917. connotation,44,0.0007548594074353652,11
  5918. excellent_performance,44,0.0007548594074353652,21
  5919. epoch,44,0.0007548594074353652,5
  5920. real_world_data,44,0.0007548594074353652,15
  5921. diffrences,44,0.0007548594074353652,10
  5922. cross_lingual_setting,44,0.0007548594074353652,21
  5923. knowledge_base,44,0.0007548594074353652,14
  5924. distinguish,44,0.0007548594074353652,11
  5925. neural_generation,44,0.0007548594074353652,17
  5926. occupation,44,0.0007548594074353652,10
  5927. random_baseline,44,0.0007548594074353652,15
  5928. pos_tagging,44,0.0007548594074353652,11
  5929. set_up,44,0.0007548594074353652,6
  5930. relative_position,44,0.0007548594074353652,17
  5931. overall_result,44,0.0007548594074353652,14
  5932. ideological,44,0.0007548594074353652,11
  5933. capsule,44,0.0007548594074353652,7
  5934. muc,44,0.0007548594074353652,3
  5935. worldwide,44,0.0007548594074353652,9
  5936. le_systme,44,0.0007548594074353652,9
  5937. such_question,44,0.0007548594074353652,13
  5938. plagiarism,44,0.0007548594074353652,10
  5939. committee,44,0.0007548594074353652,9
  5940. verse,44,0.0007548594074353652,5
  5941. manifest,44,0.0007548594074353652,8
  5942. transport,44,0.0007548594074353652,9
  5943. chinese_english_translation_task,44,0.0007548594074353652,32
  5944. produit,44,0.0007548594074353652,7
  5945. interdependency,44,0.0007548594074353652,15
  5946. algebra,44,0.0007548594074353652,7
  5947. large_scale_knowledge,44,0.0007548594074353652,21
  5948. legal_domain,44,0.0007548594074353652,12
  5949. encoder_decoder_architecture,44,0.0007548594074353652,28
  5950. automatic_machine,44,0.0007548594074353652,17
  5951. speech_synthesis,44,0.0007548594074353652,16
  5952. inclusive,44,0.0007548594074353652,9
  5953. semantic_distance,44,0.0007548594074353652,17
  5954. such_representation,44,0.0007548594074353652,19
  5955. systran,44,0.0007548594074353652,7
  5956. significant_reduction,44,0.0007548594074353652,21
  5957. saving,44,0.0007548594074353652,6
  5958. ensemble_learning,44,0.0007548594074353652,17
  5959. distributional_word,44,0.0007548594074353652,19
  5960. pearson_correlation,44,0.0007548594074353652,19
  5961. packed,44,0.0007548594074353652,6
  5962. ehrs,44,0.0007548594074353652,4
  5963. unsupervised_technique,44,0.0007548594074353652,22
  5964. specific_aspect,44,0.0007548594074353652,15
  5965. linguistic_complexity,44,0.0007548594074353652,21
  5966. larger_corpus,44,0.0007548594074353652,13
  5967. different_component,44,0.0007548594074353652,19