ngram,count,df,len semantic,8385,0.14385218480330766,8 problem,8348,0.14321741666523702,7 neural,8024,0.13765890648321297,6 set,7899,0.13551441953027157,3 training,7844,0.13457084527097737,8 learning,7580,0.1300416888263652,8 natural,7436,0.1275712398565767,7 representation,7396,0.12688500403163547,14 study,7346,0.12602720925045893,5 novel,6844,0.11741494964744635,5 english,6795,0.11657431076189333,7 natural_language,6704,0.115013124260152,16 baseline,6675,0.1145156032870696,8 large,6555,0.11245689581224588,5 knowledge,6474,0.11106726826673986,9 automatic,6388,0.10959186124311619,9 research,6362,0.10914580795690439,8 classification,6217,0.10665820309149239,14 human,6184,0.10609205853591587,5 state_of_the_art,6157,0.10562884935408053,16 dataset,6090,0.10447940434730395,7 accuracy,5992,0.10279812657619791,8 network,5892,0.10108253701384481,7 domain,5880,0.10087666626636244,6 datasets,5833,0.10007033917205647,8 context,5812,0.09971006536396232,7 improvement,5797,0.09945272692960937,11 available,5789,0.09931547976462111,9 structure,5781,0.09917823259963286,9 technique,5724,0.0982003465490916,9 type,5617,0.09636466571737377,4 framework,5608,0.096210262656762,9 several,5539,0.09502650585873836,7 use,5497,0.09430595824255006,3 application,5483,0.09406577570382062,11 algorithm,5379,0.09228156255897339,9 annotation,5360,0.0919556005421263,10 linguistic,5313,0.09114927344782034,10 first,5312,0.09113211755219681,5 source,5261,0.09025716687539673,6 resource,5234,0.0897939576935614,8 relation,5097,0.08744359999313764,8 many,5092,0.08735782051501999,4 processing,5081,0.08716910566316115,10 previous,5044,0.0865343375250905,8 quality,5027,0.08624268729949047,7 experimental,4812,0.0825541697404313,12 document,4773,0.08188508981111359,8 lexical,4722,0.08101013913431351,7 score,4660,0.07994647360565459,5 extraction,4655,0.07986069412753692,10 user,4595,0.07883134039012507,4 best,4585,0.07865978143388976,4 time,4563,0.07828235173017208,4 order,4519,0.0775274923227367,5 nlp,4515,0.07745886874024259,3 pair,4511,0.07739024515774846,4 various,4456,0.07644667089845425,7 question,4451,0.0763608914203366,8 important,4412,0.07569181149101889,9 generation,4373,0.07502273156170118,10 statistical,4361,0.0748168608142188,11 process,4344,0.07452521058861877,7 syntactic,4322,0.0741477808849011,9 term,4310,0.07394191013741873,4 multiple,4305,0.07385613065930106,8 entity,4291,0.07361594812057164,6 number,4287,0.07354732453807751,6 better,4260,0.07308411535624217,6 simple,4250,0.07291255640000686,6 standard,4206,0.07215769699257149,8 input,4090,0.0701676131002419,5 detection,4024,0.06903532398908885,9 recent,3982,0.06831477637290055,6 challenge,3963,0.06798881435605346,9 experimental_result,3960,0.06793734666918287,19 case,3956,0.06786872308668875,4 way,3953,0.06781725539981814,3 test,3952,0.06780009950419462,4 target,3915,0.06716533136612397,6 dependency,3884,0.0666334986017945,10 level,3870,0.06639331606306507,5 error,3783,0.06490075314381788,5 speech,3722,0.06385424351078248,6 prediction,3648,0.06258470723464118,10 recognition,3647,0.06256755133901766,11 significant,3620,0.062104342157182316,11 tool,3616,0.06203571857468819,4 effective,3569,0.061229391480382235,9 neural_network,3520,0.06038875259482921,14 article,3431,0.05886187788433495,7 similarity,3407,0.05845013638937021,10 architecture,3302,0.05664876734889945,12 output,3288,0.05640858481017001,6 example,3281,0.0562884935408053,7 classifier,3270,0.05609977868894646,10 embeddings,3260,0.05592821973271114,10 content,3245,0.055670881298358184,7 current,3227,0.05536207517713462,7 natural_language_processing,3190,0.05472730703906398,27 high,3160,0.054212630170358045,4 part,3118,0.05349208255416974,4 issue,3107,0.0533033677023109,5 second,3096,0.05311465285045206,6 specific,3094,0.053080341059205,8 development,3081,0.052857314416099095,11 chinese,3041,0.052171078591157855,7 particular,3006,0.051570622244334265,10 parsing,2946,0.05054126850692241,7 et,2929,0.05024961828132238,2 attention,2920,0.050095215220710594,9 form,2913,0.04997512395134588,4 present,2903,0.04980356499511057,7 metric,2888,0.049546226560757606,6 unsupervised,2883,0.04946044708263995,12 multilingual,2882,0.04944329118701642,12 benchmark,2870,0.049237420439534045,9 deep,2850,0.04889430252706343,4 le,2837,0.048671275883957525,2 phrase,2819,0.048362469762733964,6 vector,2787,0.04781348110278097,6 strategy,2778,0.04765907804216919,8 sequence,2764,0.04741889550343976,8 due,2753,0.04723018065158092,3 similar,2746,0.0471100893822162,7 possible,2741,0.047024309904098546,8 parser,2710,0.04649247713976908,6 addition,2695,0.046235138705416116,8 parallel,2691,0.04616651512292199,8 social,2684,0.046046423853557276,6 general,2639,0.04527440855049838,7 grammar,2627,0.04506853780301601,7 space,2627,0.04506853780301601,5 combination,2623,0.04499991422052188,11 complex,2612,0.04481119936866304,7 identification,2611,0.04479404347303951,14 topic,2608,0.044742575786168914,5 state,2605,0.04469110809929833,5 role,2604,0.044673952203674795,4 dialogue,2587,0.044382301978074766,8 tree,2587,0.044382301978074766,4 sentiment,2573,0.04414211943934533,9 component,2568,0.044056339961227674,9 effectiveness,2547,0.043696066153133525,13 small,2537,0.04352450719689822,5 step,2534,0.04347303951002762,4 setting,2500,0.042889739058827564,7 computational,2492,0.04275249189383932,13 common,2491,0.04273533599821579,6 single,2480,0.04254662114635695,6 able,2477,0.04249515345948635,4 graph,2467,0.042323594503251044,5 useful,2440,0.041860385321415707,6 rule,2416,0.04144864382645096,4 amount,2403,0.041225617183345054,6 point,2353,0.040367822402168504,5 inference,2310,0.03963011889035667,9 textual,2302,0.039492871725368424,7 pattern,2302,0.039492871725368424,7 web,2286,0.039218377395391926,3 label,2274,0.039012506647909555,5 strong,2257,0.038720856422309526,6 expression,2246,0.038532141570450686,10 effect,2237,0.03837773850983891,6 search,2222,0.03812040007548594,6 main,2218,0.038051776492991816,4 additional,2215,0.03800030880612122,10 understanding,2213,0.03796599701487416,13 alignment,2212,0.03794884111925063,9 online,2210,0.03791452932800357,6 aspect,2200,0.037742970371768256,6 meaning,2196,0.03767434678927414,7 measure,2195,0.037657190893650605,7 bleu,2174,0.03729691708555645,4 news,2162,0.03709104633807408,4 mt,2159,0.037039578651203484,2 medium,2154,0.03695379917308583,6 class,2150,0.03688517559059171,5 event,2149,0.036868019694968175,5 function,2143,0.03676508432122699,8 field,2135,0.03662783715623874,5 efficient,2117,0.03631903103501518,9 goal,2116,0.036301875139391655,4 show,2108,0.0361646279744034,4 large_scale,2099,0.036010224913791626,11 description,2081,0.035701418792568065,11 relevant,2074,0.03558132752320335,8 comparison,2058,0.035306833193226854,10 lexicon,2050,0.0351695860282386,7 semantics,2039,0.03498087117637976,9 base,2032,0.03486077990701505,4 mechanism,2031,0.034843624011391516,9 selection,2012,0.034517661994544424,9 effort,2001,0.034328947142685584,6 pre_trained,1993,0.03419169997769734,11 difference,1991,0.034157388186450276,10 year,1986,0.03407160870833262,4 future,1975,0.03388289385647378,6 collection,1968,0.03376280258710906,10 concept,1967,0.033745646691485526,7 interaction,1967,0.033745646691485526,11 good,1961,0.033642711317744343,4 difficult,1960,0.03362555542212081,9 potential,1948,0.03341968467463844,9 variety,1944,0.033351061092144314,7 statistical_machine,1936,0.03321381392715607,19 construction,1930,0.03311087855341488,12 code,1928,0.03307656676216782,4 bert,1921,0.0329564754928031,4 distribution,1915,0.032853540119061914,12 statistical_machine_translation,1899,0.032579045789085416,31 traditional,1894,0.032493266310967765,11 property,1886,0.03235601914597951,8 need,1882,0.032287395563485394,4 retrieval,1880,0.03225308377223833,9 discourse,1879,0.0322359278766148,9 solution,1878,0.03221877198099127,8 key,1872,0.03211583660725008,3 individual,1869,0.03206436892037949,10 overall,1868,0.03204721302475596,7 empirical,1866,0.032012901233508896,9 transformer,1865,0.031995745337885365,11 category,1853,0.03178987459040299,8 al.,1851,0.03175556279915593,3 sense,1825,0.031309509512944124,5 de,1813,0.031103638765461752,2 supervised,1808,0.031017859287344095,10 comparable,1784,0.030606117792379352,10 ability,1781,0.030554650105508757,7 modeling,1773,0.03041740294052051,8 original,1765,0.030280155775532263,8 relationship,1759,0.030177220401791077,12 range,1746,0.02995419375868517,5 parameter,1744,0.02991988196743811,9 rich,1738,0.029816946593696925,4 community,1733,0.029731167115579268,9 candidate,1733,0.029731167115579268,9 competitive,1732,0.029714011219955736,11 french,1731,0.029696855324332208,6 morphological,1727,0.029628231741838082,13 social_medium,1723,0.02955960815934396,13 project,1722,0.029542452263720428,7 summarization,1720,0.029508140472473365,13 bilingual,1716,0.029439516889979242,9 technology,1707,0.02928511382936746,10 contribution,1696,0.02909639897750862,12 precision,1695,0.02907924308188509,9 extensive,1692,0.029027775395014496,9 dictionary,1690,0.028993463603767436,10 higher,1688,0.028959151812520373,6 manual,1681,0.028839060543155656,6 la,1669,0.028633189795673284,2 size,1667,0.02859887800442622,4 constraint,1660,0.028478786735061504,10 verb,1660,0.028478786735061504,4 open,1651,0.028324383674449723,4 answer,1649,0.028290071883202664,6 robust,1645,0.028221448300708538,6 impact,1644,0.028204292405085006,6 e.g.,1639,0.028118512926967352,4 segmentation,1635,0.02804988934447323,12 towards,1629,0.027946953970732043,7 query,1620,0.027792550910120263,5 instance,1616,0.02772392732762614,8 support,1602,0.027483744788896706,7 average,1594,0.027346497623908457,7 advantage,1587,0.02722640635454374,9 scheme,1585,0.027192094563296677,6 disambiguation,1582,0.027140626876426086,14 german,1582,0.027140626876426086,6 contextual,1579,0.02708915918955549,10 transfer,1577,0.027054847398308428,8 neural_machine,1569,0.02691760023332018,14 neural_machine_translation,1559,0.02674604127708487,26 fact,1556,0.026694573590214276,4 previous_work,1554,0.026660261798967216,13 utterance,1544,0.026488702842731904,9 scenario,1541,0.026437235155861313,8 adaptation,1535,0.026334299782120124,10 une,1532,0.026282832095249533,3 un,1524,0.026145584930261284,2 nous,1515,0.025991181869649504,4 submission,1510,0.02590540239153185,10 one,1506,0.025836778809037727,3 phenomenon,1500,0.02573384343529654,10 character,1499,0.02571668753967301,9 reference,1497,0.025682375748425947,9 monolingual,1495,0.025648063957178883,11 evidence,1494,0.025630908061555352,8 dans,1494,0.025630908061555352,4 joint,1490,0.02556228447906123,5 argument,1484,0.025459349105320044,8 version,1481,0.02540788141844945,7 speaker,1477,0.025339257835955326,7 token,1475,0.025304946044708263,5 value,1472,0.025253478357837672,5 annotated,1468,0.025184854775343546,9 rate,1464,0.025116231192849423,4 team,1460,0.025047607610355297,4 objective,1459,0.02503045171473177,9 limited,1455,0.024961828132237643,7 people,1449,0.024858892758496457,6 unit,1445,0.024790269176002334,4 spoken,1442,0.02473880148913174,6 prior,1438,0.024670177906637617,5 group,1437,0.024653022011014086,5 purpose,1434,0.02460155432414349,7 par,1432,0.02456724253289643,3 finding,1423,0.02441283947228465,7 tweet,1423,0.02441283947228465,5 conversation,1420,0.024361371785414056,12 correlation,1418,0.024327059994166997,11 cross_lingual,1415,0.024275592307296402,13 accurate,1407,0.024138345142308153,8 hierarchical,1404,0.024086877455437562,12 related,1397,0.023966786186072845,7 random,1396,0.023949630290449313,6 complexity,1382,0.02370944775171988,10 alternative,1373,0.0235550446911081,11 decision,1372,0.023537888795484567,8 lack,1368,0.023469265212990444,4 kind,1367,0.023452109317366913,4 popular,1365,0.02341779752611985,7 short,1358,0.023297706256755132,5 design,1355,0.02324623856988454,6 summary,1354,0.02322908267426101,7 gain,1351,0.023177614987390415,4 characteristic,1349,0.023143303196143356,14 response,1343,0.02304036782240217,8 literature,1342,0.023023211926778638,10 diverse,1340,0.022988900135531575,7 twitter,1329,0.022800185283672735,7 major,1327,0.022765873492425672,5 treebank,1324,0.022714405805555078,8 grammatical,1323,0.02269724990993155,11 sample,1317,0.02259431453619036,6 module,1317,0.02259431453619036,6 significant_improvement,1314,0.02254284684931977,23 local,1314,0.02254284684931977,5 relative,1314,0.02254284684931977,8 low,1313,0.022525690953696238,3 f1,1313,0.022525690953696238,2 tag,1311,0.022491379162449174,3 direction,1309,0.022457067371202115,9 art,1306,0.02240559968433152,3 factor,1299,0.022285508414966803,6 researcher,1299,0.022285508414966803,10 area,1295,0.02221688483247268,4 interest,1292,0.022165417145602086,8 implementation,1291,0.022148261249978554,14 latent,1286,0.0220624817718609,6 final,1286,0.0220624817718609,5 probability,1282,0.021993858189366777,11 noun,1282,0.021993858189366777,4 layer,1278,0.02192523460687265,5 aim,1275,0.02187376692000206,3 world,1269,0.021770831546260874,5 importance,1266,0.02171936385939028,10 low_resource,1261,0.021633584381272625,12 theory,1257,0.0215649607987785,6 long,1257,0.0215649607987785,4 much,1253,0.021496337216284377,4 tagging,1250,0.021444869529413782,7 procedure,1250,0.021444869529413782,9 japanese,1245,0.021359090051296128,8 database,1237,0.02122184288630788,8 real,1234,0.021170375199437288,4 idea,1233,0.021153219303813756,4 variation,1230,0.02110175161694316,9 memory,1228,0.021067439825696102,6 correct,1223,0.020981660347578444,7 resolution,1222,0.020964504451954913,10 hypothesis,1215,0.020844413182590196,10 methodology,1210,0.02075863370447254,11 mean,1206,0.02069001012197842,4 arabic,1205,0.020672854226354887,6 focus,1201,0.020604230643860764,5 list,1201,0.020604230643860764,4 real_world,1195,0.020501295270119575,10 change,1194,0.020484139374496047,6 global,1192,0.020449827583248984,6 account,1191,0.020432671687625453,7 certain,1188,0.020381204000754858,7 sur,1187,0.02036404810513133,3 participant,1187,0.02036404810513133,11 full,1185,0.020329736313884267,4 linear,1185,0.020329736313884267,6 pour,1184,0.020312580418260735,4 coverage,1183,0.020295424522637204,8 image,1183,0.020295424522637204,5 challenging,1181,0.02026111273139014,11 wordnet,1179,0.02022680094014308,7 wide,1175,0.020158177357648955,4 basic,1152,0.019763591758307743,5 crucial,1144,0.019626344593319495,7 smt,1138,0.01952340921957831,3 interface,1133,0.01943762974146065,9 end,1131,0.01940331795021359,3 ensemble,1130,0.01938616205459006,8 cost,1129,0.01936900615896653,4 bias,1127,0.019334694367719465,4 distributional,1125,0.019300382576472406,14 probabilistic,1124,0.019283226680848874,13 dynamic,1123,0.019266070785225343,7 success,1122,0.01924891488960181,7 benefit,1122,0.01924891488960181,7 platform,1121,0.01923175899397828,8 difficulty,1120,0.019214603098354748,10 wikipedia,1118,0.01918029130710769,9 insight,1117,0.019163135411484157,7 nature,1116,0.019145979515860626,6 vocabulary,1114,0.019111667724613562,10 recurrent,1114,0.019111667724613562,9 respect,1113,0.01909451182899003,7 perspective,1106,0.018974420559625314,11 frequency,1103,0.018922952872754722,9 recall,1101,0.01888864108150766,6 end_to_end,1101,0.01888864108150766,10 high_quality,1100,0.018871485185884128,12 positive,1100,0.018871485185884128,8 promising,1099,0.018854329290260596,9 downstream,1093,0.01875139391651941,10 opinion,1092,0.018734238020895883,7 practical,1090,0.01869992622964882,9 fine_grained,1089,0.018682770334025288,12 visual,1088,0.018665614438401756,6 appropriate,1086,0.018631302647154693,11 preliminary,1085,0.018614146751531165,11 du,1084,0.018596990855907634,2 choice,1078,0.018494055482166448,6 scale,1078,0.018494055482166448,5 name,1078,0.018494055482166448,4 public,1074,0.018425431899672322,6 pipeline,1074,0.018425431899672322,8 negative,1069,0.018339652421554668,8 behavior,1067,0.018305340630307605,8 gap,1066,0.018288184734684073,3 syntax,1064,0.018253872943437013,6 external,1061,0.01820240525656642,8 consistent,1058,0.018150937569695828,10 answering,1056,0.018116625778448765,9 initial,1050,0.01801369040470758,7 learner,1047,0.017962222717836984,7 phrase_based,1046,0.017945066822213453,12 review,1044,0.017910755030966393,6 deep_learning,1038,0.017807819657225204,13 po,1037,0.017790663761601676,2 loss,1033,0.01772204017910755,4 conditional,1031,0.017687728387860487,11 generative,1031,0.017687728387860487,10 e.g,1027,0.017619104805366364,3 conversational,1026,0.017601948909742832,14 author,1025,0.0175847930141193,6 usage,1022,0.01753332532724871,5 little,1021,0.017516169431625178,6 environment,1021,0.017516169431625178,11 mining,1020,0.017499013536001647,6 ce,1020,0.017499013536001647,2 linguistics,1013,0.01737892226663693,11 communication,1009,0.017310298684142807,13 supervision,1009,0.017310298684142807,11 variant,1009,0.017310298684142807,7 explicit,1008,0.017293142788519275,8 expert,1007,0.017275986892895744,6 limitation,1007,0.017275986892895744,10 length,1006,0.017258830997272212,6 basis,1005,0.01724167510164868,5 part_of_speech,1004,0.01722451920602515,14 parallel_corpus,997,0.01710442793666043,15 noisy,994,0.01705296024978984,5 generalization,994,0.01705296024978984,14 ranking,988,0.016950024876048655,7 necessary,988,0.016950024876048655,9 labeling,987,0.016932868980425123,8 distance,986,0.01691571308480159,8 top,986,0.01691571308480159,3 access,986,0.01691571308480159,6 hybrid,986,0.01691571308480159,6 contrast,986,0.01691571308480159,8 mention,984,0.01688140129355453,7 extension,981,0.016829933606683938,9 ii,976,0.016744154128566283,2 interpretation,976,0.016744154128566283,14 acquisition,974,0.01670984233731922,11 nmt,972,0.016675530546072157,3 agreement,970,0.016641218754825094,9 temporal,966,0.01657259517233097,8 rule_based,966,0.01657259517233097,10 estimation,965,0.01655543927670744,10 structural,965,0.01655543927670744,10 report,963,0.016521127485460377,6 annotator,961,0.016486815694213317,9 gold,960,0.016469659798589786,4 est,959,0.016452503902966254,3 essential,958,0.016435348007342723,9 degree,954,0.0163667244248486,6 reduction,953,0.01634956852922507,9 service,949,0.016280944946730946,7 larger,948,0.016263789051107414,6 different_language,948,0.016263789051107414,18 position,947,0.016246633155483883,8 spanish,945,0.01621232136423682,7 i.e,941,0.016143697781742697,3 condition,931,0.015972138825507385,9 abstract,929,0.015937827034260322,8 neural_model,922,0.015817735764895608,12 universal,920,0.015783423973648545,9 capability,917,0.01573195628677795,10 emotion,917,0.01573195628677795,7 weight,915,0.01569764449553089,6 style,911,0.015629020913036765,5 human_evaluation,910,0.015611865017413235,16 decoder,907,0.01556039733054264,7 structured,905,0.015526085539295579,10 efficiency,903,0.015491773748048518,10 scientific,903,0.015491773748048518,10 subject,902,0.015474617852424986,7 independent,901,0.015457461956801455,11 engine,897,0.01538883837430733,6 view,892,0.015303058896189676,4 progress,891,0.015285903000566144,8 detail,889,0.015251591209319083,6 manner,887,0.01521727941807202,6 medical,886,0.01520012352244849,7 stage,886,0.01520012352244849,5 coreference,882,0.015131499939954366,11 detailed,881,0.015114344044330834,8 corresponding,879,0.015080032253083773,13 building,876,0.01502856456621318,8 practice,876,0.01502856456621318,8 suitable,876,0.01502856456621318,8 object,875,0.015011408670589648,6 encoder,873,0.014977096879342585,7 open_source,873,0.014977096879342585,11 creation,870,0.014925629192471992,8 fine_tuning,868,0.014891317401224931,11 semeval,867,0.0148741615056014,7 student,867,0.0148741615056014,7 que,866,0.014857005609977868,3 embedding,865,0.014839849714354338,9 definition,864,0.014822693818730807,10 automated,863,0.014805537923107275,9 paradigm,862,0.014788382027483745,8 correction,862,0.014788382027483745,10 multimodal,861,0.014771226131860214,10 segment,861,0.014771226131860214,7 increase,860,0.014754070236236682,8 discussion,860,0.014754070236236682,10 attempt,854,0.014651134862495497,7 dialog,853,0.014633978966871965,6 substantial,853,0.014633978966871965,11 reason,851,0.014599667175624904,6 modern,851,0.014599667175624904,6 assessment,845,0.014496731801883718,10 great,844,0.014479575906260186,5 nlp_task,841,0.014428108219389594,8 biomedical,840,0.014410952323766062,10 comprehension,840,0.014410952323766062,13 regression,839,0.01439379642814253,10 unlabeled,836,0.014342328741271938,9 binary,836,0.014342328741271938,6 variable,836,0.014342328741271938,8 convolutional,835,0.014325172845648408,13 interactive,834,0.014308016950024876,11 cluster,828,0.01420508157628369,7 discriminative,828,0.01420508157628369,14 hand,827,0.014187925680660159,4 maximum,822,0.014102146202542503,7 mapping,820,0.014067834411295442,7 critical,820,0.014067834411295442,8 al,815,0.013982054933177786,2 reading,814,0.013964899037554256,7 comprehensive,814,0.013964899037554256,13 generated,813,0.013947743141930724,9 university,812,0.013930587246307193,10 agent,811,0.013913431350683663,5 conventional,810,0.013896275455060132,12 subset,809,0.0138791195594366,6 computer,809,0.0138791195594366,8 cet,806,0.013827651872566007,3 parse,805,0.013810495976942476,5 n_gram,805,0.013810495976942476,6 judgment,802,0.013759028290071883,8 signal,800,0.013724716498824821,6 heuristic,799,0.01370756060320129,9 formal,799,0.01370756060320129,6 assumption,796,0.013656092916330697,10 reasoning,793,0.013604625229460104,9 augmentation,790,0.013553157542589511,12 action,789,0.01353600164696598,6 series,787,0.013501689855718918,6 clustering,787,0.013501689855718918,10 others,787,0.013501689855718918,6 ambiguity,786,0.013484533960095387,9 place,785,0.013467378064471855,5 extensive_experiment,783,0.013433066273224794,20 product,783,0.013433066273224794,7 polarity,782,0.013415910377601262,8 unified,781,0.01339875448197773,7 subtask,781,0.01339875448197773,7 unseen,778,0.013347286795107138,6 qa,777,0.013330130899483608,2 message,777,0.013330130899483608,7 integration,776,0.013312975003860077,11 ontology,776,0.013312975003860077,8 core,774,0.013278663212613015,4 robustness,774,0.013278663212613015,10 yield,773,0.013261507316989484,5 software,769,0.01319288373449536,8 element,769,0.01319288373449536,7 induction,768,0.013175727838871828,9 generic,768,0.013175727838871828,7 state_of_the_art_performance,763,0.013089948360754174,28 semantic_role,761,0.01305563656950711,13 lstm,758,0.013004168882636518,4 attribute,757,0.012987012987012988,9 item,757,0.012987012987012988,4 performs,756,0.012969857091389456,8 pretrained,755,0.012952701195765925,10 f1_score,755,0.012952701195765925,8 experience,754,0.012935545300142393,10 strong_baseline,754,0.012935545300142393,15 post,749,0.012849765822024739,4 capable,742,0.012729674552660022,7 clinical,742,0.012729674552660022,8 morphology,742,0.012729674552660022,10 format,742,0.012729674552660022,6 improved,740,0.01269536276141296,8 participation,739,0.012678206865789429,13 novel_approach,738,0.012661050970165897,14 last,736,0.012626739178918836,4 implicit,736,0.012626739178918836,8 situation,735,0.012609583283295304,9 domain_specific,734,0.012592427387671773,15 surface,733,0.012575271492048243,7 span,732,0.012558115596424712,4 statistic,732,0.012558115596424712,9 past,729,0.012506647909554119,4 investigation,727,0.012472336118307056,13 likely,726,0.012455180222683526,6 recent_year,725,0.012438024327059994,11 ner,725,0.012438024327059994,3 paraphrase,723,0.012403712535812931,10 easy,723,0.012403712535812931,4 science,722,0.012386556640189401,7 large_amount,722,0.012386556640189401,12 hard,720,0.012352244848942338,4 workshop,719,0.012335088953318809,8 sens,718,0.012317933057695277,4 unique,718,0.012317933057695277,6 multi_task,717,0.012300777162071745,10 tagger,710,0.012180685892707028,6 relevance,709,0.012163529997083498,9 link,707,0.012129218205836435,4 recent_work,707,0.012129218205836435,11 direct,707,0.012129218205836435,6 expensive,707,0.012129218205836435,9 comment,703,0.012060594623342311,7 flexible,702,0.012043438727718781,8 successful,701,0.01202628283209525,10 influence,700,0.012009126936471718,9 reliable,698,0.011974815145224657,8 boundary,694,0.011906191562730532,8 quantitative,694,0.011906191562730532,12 optimization,694,0.011906191562730532,12 next,692,0.011871879771483471,4 sentence_level,692,0.011871879771483471,14 association,691,0.01185472387585994,11 track,690,0.011837567980236408,5 decoding,690,0.011837567980236408,8 semi_supervised,690,0.011837567980236408,15 production,689,0.011820412084612876,10 entry,688,0.011803256188989347,5 special,687,0.011786100293365815,7 dimension,686,0.011768944397742283,9 optimal,684,0.011734632606495222,7 hidden,683,0.01171747671087169,6 operation,681,0.01168316491962463,9 constituent,681,0.01168316491962463,11 adversarial,675,0.011580229545883444,11 noise,673,0.01154591775463638,5 d'un,673,0.01154591775463638,4 pre_trained_language,672,0.011528761859012849,20 health,672,0.011528761859012849,6 automatique,672,0.011528761859012849,11 lower,667,0.011442982380895195,5 cognitive,666,0.011425826485271663,9 diversity,666,0.011425826485271663,9 advance,665,0.011408670589648133,7 free,665,0.011408670589648133,4 continuous,664,0.011391514694024602,10 bidirectional,663,0.01137435879840107,13 observation,662,0.011357202902777539,11 different_type,661,0.011340047007154009,14 third,661,0.011340047007154009,5 overview,661,0.011340047007154009,8 frame,661,0.011340047007154009,5 f_score,659,0.011305735215906946,7 fundamental,657,0.011271423424659885,11 systematic,657,0.011271423424659885,10 criterion,656,0.011254267529036353,9 genre,653,0.01120279984216576,5 state_of_the_art_result,652,0.011185643946542229,23 requirement,650,0.011151332155295167,11 pre_trained_language_model,650,0.011151332155295167,26 semantic_similarity,650,0.011151332155295167,19 feedback,649,0.011134176259671636,8 subtasks,649,0.011134176259671636,8 notion,649,0.011134176259671636,6 raw,648,0.011117020364048106,3 complete,647,0.011099864468424574,8 other_language,644,0.011048396781553982,14 cette,644,0.011048396781553982,5 matching,643,0.01103124088593045,8 svm,643,0.01103124088593045,3 large_corpus,641,0.010996929094683389,12 share,641,0.010996929094683389,5 informative,640,0.010979773199059857,11 power,640,0.010979773199059857,5 shallow,639,0.010962617303436326,7 stateof_the_art,636,0.010911149616565733,15 minimal,636,0.010911149616565733,7 text_classification,636,0.010911149616565733,19 whole,634,0.010876837825318671,5 comparative,631,0.010825370138448078,11 native,630,0.010808214242824547,6 entailment,630,0.010808214242824547,10 distinct,629,0.010791058347201015,8 theoretical,628,0.010773902451577484,11 predicate,627,0.010756746555953954,9 interesting,626,0.010739590660330423,11 transformation,623,0.01068812297345983,14 total,620,0.010636655286589237,5 extent,620,0.010636655286589237,6 transformer_based,618,0.010602343495342174,17 sequential,616,0.010568031704095112,10 utility,615,0.01055087580847158,7 qualitative,612,0.010499408121600988,11 node,611,0.010482252225977456,4 pre_training,611,0.010482252225977456,12 ambiguous,609,0.010447940434730395,9 synthetic,607,0.010413628643483334,9 history,606,0.010396472747859802,7 wmt,606,0.010396472747859802,3 smaller,605,0.01037931685223627,7 latter,605,0.01037931685223627,6 cue,603,0.01034500506098921,3 preference,602,0.010327849165365678,10 zero_shot,602,0.010327849165365678,9 material,601,0.010310693269742146,8 transcription,600,0.010293537374118616,13 phase,600,0.010293537374118616,5 principle,599,0.010276381478495085,9 entropy,599,0.010276381478495085,7 qui,599,0.010276381478495085,3 string,599,0.010276381478495085,6 reader,598,0.010259225582871553,6 wide_range,596,0.010224913791624492,10 valuable,595,0.01020775789600096,8 official,595,0.01020775789600096,8 claim,595,0.01020775789600096,5 in_domain,595,0.01020775789600096,9 state_ofthe_art,594,0.010190602000377429,15 translator,594,0.010190602000377429,10 graph_based,592,0.010156290209130368,11 conditional_random,591,0.010139134313506836,18 underlying,589,0.010104822522259775,10 margin,588,0.010087666626636243,6 guideline,587,0.010070510731012712,9 absolute,587,0.010070510731012712,8 story,585,0.01003619893976565,5 writing,585,0.01003619893976565,7 semantic_relation,585,0.01003619893976565,17 formalism,584,0.010019043044142119,9 gold_standard,584,0.010019043044142119,13 conditional_random_field,583,0.010001887148518589,24 weighted,583,0.010001887148518589,8 technical,581,0.009967575357271526,9 superior,581,0.009967575357271526,8 explanation,579,0.009933263566024465,11 powerful,578,0.009916107670400933,8 table,578,0.009916107670400933,5 family,576,0.009881795879153872,6 state_of_theart,576,0.009881795879153872,15 spoken_language,575,0.00986463998353034,15 person,575,0.00986463998353034,6 speed,574,0.009847484087906809,5 large_number,572,0.009813172296659747,12 compositional,572,0.009813172296659747,13 outperforms,572,0.009813172296659747,11 en,572,0.009813172296659747,2 coherence,571,0.009796016401036216,9 gender,571,0.009796016401036216,6 consistency,569,0.009761704609789154,11 help,568,0.009744548714165623,4 data_driven,566,0.009710236922918562,11 computation,566,0.009710236922918562,11 entire,564,0.009675925131671499,6 setup,564,0.009675925131671499,5 control,564,0.009675925131671499,7 open_domain,562,0.009641613340424437,11 least,562,0.009641613340424437,5 program,561,0.009624457444800906,7 strength,561,0.009624457444800906,8 linguistic_feature,558,0.009572989757930313,18 separate,558,0.009572989757930313,8 modality,557,0.009555833862306781,8 typical,555,0.00952152207105972,7 logical,554,0.009504366175436188,7 modification,554,0.009504366175436188,12 unknown,554,0.009504366175436188,7 natural_language_generation,552,0.009470054384189127,27 clear,552,0.009470054384189127,5 proper,549,0.009418586697318534,6 possibility,549,0.009418586697318534,11 low_resource_language,549,0.009418586697318534,21 background,548,0.009401430801695003,10 labeled,546,0.009367119010447941,7 highest,545,0.00934996311482441,7 automatic_speech,545,0.00934996311482441,16 semantic_representation,544,0.009332807219200878,23 prsentons,544,0.009332807219200878,9 best_result,544,0.009332807219200878,11 incremental,542,0.009298495427953817,11 fast,541,0.009281339532330285,4 semantic_information,539,0.009247027741083224,20 nous_prsentons,538,0.009229871845459692,14 light,538,0.009229871845459692,5 engineering,538,0.009229871845459692,11 internet,537,0.009212715949836161,8 head,537,0.009212715949836161,4 location,535,0.0091784041585891,8 majority,535,0.0091784041585891,8 asr,534,0.009161248262965568,3 sufficient,534,0.009161248262965568,10 predictive,533,0.009144092367342036,10 word_level,531,0.009109780576094975,10 automatic_evaluation,531,0.009109780576094975,20 au,529,0.009075468784847914,2 composition,528,0.009058312889224382,11 management,527,0.00904115699360085,10 d'une,527,0.00904115699360085,5 sequence_to_sequence,527,0.00904115699360085,20 lexical_resource,526,0.00902400109797732,16 forum,525,0.00900684520235379,5 narrative,524,0.008989689306730258,9 activity,523,0.008972533411106726,8 active,522,0.008955377515483197,6 turn,522,0.008955377515483197,4 equivalent,519,0.008903909828612602,10 sont,519,0.008903909828612602,4 date,517,0.00886959803736554,4 trained,515,0.00883528624611848,7 usefulness,513,0.008800974454871416,10 meaningful,512,0.008783818559247886,10 page,512,0.008783818559247886,4 historical,511,0.008766662663624355,10 patient,510,0.008749506768000823,7 scope,510,0.008749506768000823,5 better_performance,509,0.008732350872377292,18 learned,506,0.008680883185506699,7 penn,506,0.008680883185506699,4 availability,505,0.008663727289883169,12 coherent,504,0.008646571394259638,8 computational_linguistics,504,0.008646571394259638,25 act,503,0.008629415498636106,3 reinforcement,502,0.008612259603012574,13 prior_work,502,0.008612259603012574,10 automatic_speech_recognition,501,0.008595103707389045,28 partial,500,0.008577947811765513,7 primary,495,0.008492168333647859,7 matrix,494,0.008475012438024327,6 bayesian,494,0.008475012438024327,8 treebanks,492,0.008440700646777264,9 presence,492,0.008440700646777264,8 markov,492,0.008440700646777264,6 terminology,491,0.008423544751153735,11 line,491,0.008423544751153735,4 demonstrate,491,0.008423544751153735,11 syntactic_structure,491,0.008423544751153735,19 sparse,491,0.008423544751153735,6 achieves,491,0.008423544751153735,8 path,489,0.008389232959906671,4 artificial,489,0.008389232959906671,10 complementary,488,0.008372077064283142,13 dialect,488,0.008372077064283142,7 survey,488,0.008372077064283142,6 first_step,487,0.00835492116865961,10 exploration,487,0.00835492116865961,11 connection,487,0.00835492116865961,10 side,487,0.00835492116865961,4 policy,486,0.008337765273036079,6 frequent,486,0.008337765273036079,8 verbal,485,0.008320609377412547,6 crf,485,0.008320609377412547,3 rating,485,0.008320609377412547,6 auxiliary,484,0.008303453481789017,9 novel_method,483,0.008286297586165486,12 considerable,483,0.008286297586165486,12 video,482,0.008269141690541954,5 normalization,479,0.008217674003671361,13 applicable,479,0.008217674003671361,10 semantic_parsing,478,0.008200518108047831,16 corpus_based,476,0.008166206316800768,12 n_grams,475,0.008149050421177237,7 discovery,475,0.008149050421177237,9 early,474,0.008131894525553707,5 compound,474,0.008131894525553707,8 interpretable,473,0.008114738629930176,13 proposal,472,0.008097582734306644,8 relational,471,0.008080426838683114,10 state_of_the_art_method,468,0.00802895915181252,23 new_method,468,0.00802895915181252,10 programming,468,0.00802895915181252,11 distant,467,0.00801180325618899,7 sensitive,465,0.007977491464941927,9 hierarchy,465,0.007977491464941927,9 extractive,464,0.007960335569318397,10 beneficial,463,0.007943179673694865,10 poor,462,0.007926023778071334,4 prototype,462,0.007926023778071334,9 central,461,0.007908867882447804,7 acoustic,460,0.007891711986824273,8 conceptual,460,0.007891711986824273,10 generator,459,0.007874556091200741,9 russian,459,0.007874556091200741,7 confidence,458,0.00785740019557721,10 helpful,456,0.007823088404330148,7 recommendation,456,0.007823088404330148,14 portuguese,456,0.007823088404330148,10 personal,455,0.007805932508706617,8 other_hand,455,0.007805932508706617,10 broad,454,0.007788776613083086,5 record,453,0.007771620717459555,6 schema,453,0.007771620717459555,6 hindi,451,0.007737308926212493,5 validation,450,0.0077201530305889615,10 co_occurrence,450,0.0077201530305889615,13 extracted,450,0.0077201530305889615,9 exact,448,0.0076858412393419,5 international,448,0.0076858412393419,13 conversion,448,0.0076858412393419,10 script,448,0.0076858412393419,6 lot,447,0.007668685343718369,3 neural_network_model,447,0.007668685343718369,20 same_time,446,0.007651529448094838,9 professional,445,0.007634373552471306,12 european,445,0.007634373552471306,8 occurrence,444,0.007617217656847776,10 state_of_the_art_model,444,0.007617217656847776,22 true,443,0.007600061761224245,4 contextual_information,443,0.007600061761224245,22 annotated_corpus,440,0.007548594074353651,16 seed,440,0.007548594074353651,4 finite_state,439,0.007531438178730121,12 clause,439,0.007531438178730121,6 rsultats,439,0.007531438178730121,8 document_level,438,0.00751428228310659,14 template,438,0.00751428228310659,8 different_domain,437,0.0074971263874830585,16 digital,437,0.0074971263874830585,7 systme,437,0.0074971263874830585,6 competition,436,0.007479970491859528,11 f_measure,435,0.007462814596235996,9 rank,433,0.007428502804988934,4 human_judgment,432,0.007411346909365403,14 encoder_decoder,432,0.007411346909365403,15 cnn,432,0.007411346909365403,3 pronoun,432,0.007411346909365403,7 equal,431,0.007394191013741873,5 new_approach,431,0.007394191013741873,12 representative,431,0.007394191013741873,14 match,430,0.007377035118118341,5 passage,430,0.007377035118118341,7 iterative,430,0.007377035118118341,9 statement,429,0.0073598792224948105,9 organization,429,0.0073598792224948105,12 treatment,428,0.007342723326871279,9 right,427,0.007325567431247748,5 italian,426,0.007308411535624218,7 consideration,426,0.007308411535624218,13 toolkit,425,0.007291255640000686,7 child,425,0.007291255640000686,5 configuration,425,0.007291255640000686,13 promising_result,425,0.007291255640000686,16 universal_dependency,424,0.007274099744377155,20 empirical_result,424,0.007274099744377155,16 intent,424,0.007274099744377155,6 section,424,0.007274099744377155,7 new_dataset,423,0.007256943848753624,11 proposons,423,0.007256943848753624,9 implication,422,0.007239787953130093,11 likelihood,421,0.0072226320575065625,10 abstractive,421,0.0072226320575065625,11 arbitrary,417,0.007154008475012438,9 out_of_domain,417,0.007154008475012438,13 audio,417,0.007154008475012438,5 huge,416,0.007136852579388907,4 campaign,414,0.007102540788141845,8 outcome,413,0.007085384892518314,7 heterogeneous,413,0.007085384892518314,13 kernel,413,0.007085384892518314,6 pre_trained_model,413,0.007085384892518314,17 multiple_language,413,0.007085384892518314,17 expansion,412,0.007068228996894783,9 fine_tuned,412,0.007068228996894783,10 actual,412,0.007068228996894783,6 contrastive,412,0.007068228996894783,11 wsd,411,0.0070510731012712515,3 nous_proposons,411,0.0070510731012712515,14 unstructured,410,0.007033917205647721,12 chinese_english,410,0.007033917205647721,15 well_known,409,0.00701676131002419,10 formulation,409,0.00701676131002419,11 adaptive,406,0.0069652936231535964,8 transliteration,406,0.0069652936231535964,15 previous_study,405,0.006948137727530066,14 capture,405,0.006948137727530066,7 franais,405,0.006948137727530066,7 categorization,404,0.006930981831906535,14 encoding,404,0.006930981831906535,8 chinese_word,403,0.0069138259362830036,12 largest,402,0.006896670040659473,7 internal,402,0.006896670040659473,8 counterpart,402,0.006896670040659473,11 real_time,402,0.006896670040659473,9 post_editing,401,0.006879514145035941,12 index,401,0.006879514145035941,5 nlg,401,0.006879514145035941,3 game,401,0.006879514145035941,4 logic,400,0.006862358249412411,5 previous_approach,400,0.006862358249412411,17 iii,399,0.006845202353788879,3 high_level,399,0.006845202353788879,10 sparsity,399,0.006845202353788879,8 talk,398,0.0068280464581653485,4 conclusion,396,0.006793734666918286,10 visualization,394,0.006759422875671224,13 projection,394,0.006759422875671224,10 iwslt,394,0.006759422875671224,5 intermediate,393,0.006742266980047693,12 following,393,0.006742266980047693,9 task_specific,392,0.006725111084424163,13 avec,391,0.006707955188800631,4 intrinsic,391,0.006707955188800631,9 scoring,389,0.006673643397553569,7 emotional,389,0.006673643397553569,9 taxonomy,388,0.006656487501930038,8 ne,388,0.006656487501930038,2 natural_language_understanding,388,0.006656487501930038,30 relies,387,0.006639331606306508,6 empirical_study,387,0.006639331606306508,15 mutual,386,0.006622175710682976,6 scalable,386,0.006622175710682976,8 political,386,0.006622175710682976,9 relatedness,386,0.006622175710682976,11 concern,385,0.0066050198150594455,7 cet_article,385,0.0066050198150594455,11 generative_model,385,0.0066050198150594455,16 fashion,385,0.0066050198150594455,7 il,384,0.006587863919435914,2 trend,383,0.006570708023812383,5 commonsense,383,0.006570708023812383,11 distinction,382,0.006553552128188852,11 web_based,382,0.006553552128188852,9 map,382,0.006553552128188852,3 subjective,381,0.006536396232565321,10 synonym,380,0.00651924033694179,7 multiword,380,0.00651924033694179,9 life,379,0.006502084441318259,4 propagation,378,0.006484928545694728,11 google,376,0.006450616754447666,6 future_research,376,0.006450616754447666,15 inherent,375,0.006433460858824135,8 phonetic,375,0.006433460858824135,8 korean,375,0.006433460858824135,6 regular,375,0.006433460858824135,7 important_role,374,0.006416304963200604,14 classical,374,0.006416304963200604,9 transcript,373,0.006399149067577073,10 simplification,372,0.0063819931719535416,14 derivation,372,0.0063819931719535416,10 reasonable,370,0.00634768138070648,10 high_accuracy,370,0.00634768138070648,13 edge,369,0.006330525485082949,4 task_oriented,368,0.006313369589459418,13 natural_language_inference,368,0.006313369589459418,26 chain,367,0.0062962136938358865,5 shift,367,0.0062962136938358865,5 fluency,367,0.0062962136938358865,7 rnn,366,0.006279057798212356,3 collaborative,366,0.006279057798212356,13 device,366,0.006279057798212356,6 context_free,365,0.006261901902588824,12 realistic,364,0.006244746006965294,9 book,364,0.006244746006965294,4 dependent,364,0.006244746006965294,9 overlap,364,0.006244746006965294,7 website,364,0.006244746006965294,7 vision,363,0.006227590111341763,6 sophisticated,363,0.006227590111341763,13 run,363,0.006227590111341763,3 opportunity,363,0.006227590111341763,11 gradient,363,0.006227590111341763,8 pragmatic,362,0.006210434215718231,9 capacity,362,0.006210434215718231,8 short_term,361,0.006193278320094701,10 linguistic_knowledge,361,0.006193278320094701,20 introduction,360,0.006176122424471169,12 perplexity,359,0.0061589665288476385,10 pilot,359,0.0061589665288476385,5 linguist,359,0.0061589665288476385,8 offensive,359,0.0061589665288476385,9 granularity,358,0.006141810633224108,11 rapid,358,0.006141810633224108,5 future_work,358,0.006141810633224108,11 functional,357,0.006124654737600576,10 course,357,0.006124654737600576,6 neural_language,357,0.006124654737600576,15 weak,355,0.006090342946353514,4 slot,355,0.006090342946353514,4 few_shot,355,0.006090342946353514,8 electronic,354,0.0060731870507299834,10 perception,353,0.006056031155106452,10 rare,353,0.006056031155106452,4 donne,353,0.006056031155106452,5 textual_entailment,353,0.006056031155106452,18 partir,352,0.006038875259482921,6 advanced,352,0.006038875259482921,8 minimum,351,0.0060217193638593906,7 voice,351,0.0060217193638593906,5 fusion,351,0.0060217193638593906,6 competitive_result,350,0.006004563468235859,18 ai,350,0.006004563468235859,2 substitution,348,0.005970251676988797,12 combine,348,0.005970251676988797,7 intelligent,348,0.005970251676988797,11 fragment,348,0.005970251676988797,8 lm,348,0.005970251676988797,2 parallel_data,347,0.005953095781365266,13 mixture,347,0.005953095781365266,7 salient,346,0.0059359398857417355,7 correspondence,346,0.0059359398857417355,14 indicator,345,0.005918783990118204,9 new_task,345,0.005918783990118204,8 unlabeled_data,344,0.005901628094494673,14 cause,344,0.005901628094494673,5 regularization,344,0.005901628094494673,14 uncertainty,344,0.005901628094494673,11 adjective,344,0.005901628094494673,9 reordering,344,0.005901628094494673,10 prsente,344,0.005901628094494673,7 publication,343,0.005884472198871142,11 fewer,343,0.005884472198871142,5 semantic_role_labeling,342,0.005867316303247611,22 keywords,342,0.005867316303247611,8 metadata,342,0.005867316303247611,8 filtering,340,0.005833004512000549,9 suggestion,340,0.005833004512000549,10 costly,339,0.005815848616377018,6 massive,339,0.005815848616377018,7 transition,339,0.005815848616377018,10 modelling,339,0.005815848616377018,9 maximum_entropy,339,0.005815848616377018,15 ten,339,0.005815848616377018,3 simpler,339,0.005815848616377018,7 risk,339,0.005815848616377018,4 applicability,339,0.005815848616377018,13 mixed,338,0.005798692720753487,5 analyzer,337,0.005781536825129956,8 collocation,337,0.005781536825129956,11 bayes,337,0.005781536825129956,5 best_performance,337,0.005781536825129956,16 paragraph,337,0.005781536825129956,9 conll,337,0.005781536825129956,5 period,337,0.005781536825129956,6 cross_domain,336,0.0057643809295064245,12 part_of_speech_tagging,336,0.0057643809295064245,22 syntactic_information,336,0.0057643809295064245,21 encoders,336,0.0057643809295064245,8 instruction,335,0.005747225033882894,11 ground,335,0.005747225033882894,6 named_entity,335,0.005747225033882894,12 national,335,0.005747225033882894,8 quantity,334,0.005730069138259363,8 short_term_memory,332,0.005695757347012301,17 note,332,0.005695757347012301,4 transducer,331,0.005678601451388769,10 reliability,331,0.005678601451388769,11 library,330,0.005661445555765239,7 negation,329,0.005644289660141708,8 newspaper,329,0.005644289660141708,9 conference,329,0.005644289660141708,10 lemma,328,0.0056271337645181765,5 company,328,0.0056271337645181765,7 shared,328,0.0056271337645181765,6 best_performing,328,0.0056271337645181765,15 readability,328,0.0056271337645181765,11 measurement,328,0.0056271337645181765,11 easier,328,0.0056271337645181765,6 challenging_task,327,0.005609977868894646,16 greater,327,0.005609977868894646,7 contextualized,327,0.005609977868894646,14 manual_annotation,327,0.005609977868894646,17 aux,326,0.005592821973271114,3 completion,325,0.005575666077647584,10 behaviour,325,0.005575666077647584,9 feasibility,325,0.005575666077647584,11 numerous,325,0.005575666077647584,8 spoken_dialogue,324,0.005558510182024053,15 piece,324,0.005558510182024053,5 inter_annotator,324,0.005558510182024053,15 grammatical_error,323,0.005541354286400521,17 customer,323,0.005541354286400521,8 population,323,0.005541354286400521,10 discrete,323,0.005541354286400521,8 judgement,323,0.005541354286400521,9 second_language,323,0.005541354286400521,15 region,323,0.005541354286400521,6 preprocessing,323,0.005541354286400521,13 i.e.,322,0.005524198390776991,4 clue,322,0.005524198390776991,4 linguistic_resource,322,0.005524198390776991,19 linguistic_information,322,0.005524198390776991,22 propose,322,0.005524198390776991,7 self_attention,321,0.005507042495153459,14 thousand,321,0.005507042495153459,8 decade,320,0.0054898865995299286,6 pretraining,320,0.0054898865995299286,11 compression,319,0.005472730703906397,11 today,319,0.005472730703906397,5 czech,319,0.005472730703906397,5 accessible,319,0.005472730703906397,10 interpretability,319,0.005472730703906397,16 bert_based,318,0.005455574808282866,10 teacher,318,0.005455574808282866,7 dutch,318,0.005455574808282866,5 skill,318,0.005455574808282866,5 pairwise,317,0.005438418912659336,8 commercial,317,0.005438418912659336,10 graphical,317,0.005438418912659336,9 better_result,317,0.005438418912659336,13 count,316,0.005421263017035804,5 mandarin,316,0.005421263017035804,8 assignment,316,0.005421263017035804,10 marker,316,0.005421263017035804,6 specialized,316,0.005421263017035804,11 mthode,316,0.005421263017035804,6 efficacy,315,0.0054041071214122735,8 valid,315,0.0054041071214122735,5 approche,315,0.0054041071214122735,8 title,314,0.005386951225788742,5 us,314,0.005386951225788742,2 notre,314,0.005386951225788742,5 pa,313,0.005369795330165211,2 semantic_feature,313,0.005369795330165211,16 roberta,313,0.005369795330165211,7 crosslingual,312,0.005352639434541681,12 motivation,312,0.005352639434541681,10 former,311,0.005335483538918149,6 avon,311,0.005335483538918149,4 country,311,0.005335483538918149,7 volume,310,0.005318327643294618,6 stochastic,310,0.005318327643294618,10 previous_method,309,0.005301171747671087,15 nous_avon,309,0.005301171747671087,9 workflow,309,0.005301171747671087,8 english_language,309,0.005301171747671087,16 semantic_analysis,308,0.005284015852047556,17 expressive,308,0.005284015852047556,10 extra,308,0.005284015852047556,5 incorrect,307,0.0052668599564240255,9 textes,306,0.005249704060800494,6 realization,306,0.005249704060800494,11 best_model,306,0.005249704060800494,10 small_amount,305,0.005232548165176963,12 neural_architecture,305,0.005232548165176963,19 statistical_model,305,0.005232548165176963,17 synthesis,305,0.005232548165176963,9 reveals,305,0.005232548165176963,7 neural_language_model,305,0.005232548165176963,21 intelligence,305,0.005232548165176963,12 ongoing,305,0.005232548165176963,7 morphological_analysis,304,0.005215392269553432,22 deux,304,0.005215392269553432,4 foreign,304,0.005215392269553432,7 rouge,303,0.005198236373929901,5 multi_task_learning,303,0.005198236373929901,19 regard,303,0.005198236373929901,6 dense,302,0.00518108047830637,5 competitive_performance,302,0.00518108047830637,23 language_specific,302,0.00518108047830637,17 industry,301,0.005163924582682839,8 semeval_2020,301,0.005163924582682839,12 deep_learning_model,301,0.005163924582682839,19 comparable_corpus,301,0.005163924582682839,17 finite,301,0.005163924582682839,6 nlp_application,301,0.005163924582682839,15 estimate,299,0.005129612791435777,8 semeval_2020_task,299,0.005129612791435777,17 multi_document,299,0.005129612791435777,14 expectation,299,0.005129612791435777,11 decomposition,299,0.005129612791435777,13 pretrained_language,299,0.005129612791435777,19 distributed,299,0.005129612791435777,11 syntactic_feature,299,0.005129612791435777,17 suite,298,0.005112456895812246,5 longer,297,0.0050953010001887145,6 essay,297,0.0050953010001887145,5 http,297,0.0050953010001887145,4 recent_advance,297,0.0050953010001887145,14 disease,297,0.0050953010001887145,7 mode,296,0.005078145104565184,4 cross,296,0.005078145104565184,5 mental,296,0.005078145104565184,6 close,296,0.005078145104565184,5 age,296,0.005078145104565184,3 extended,296,0.005078145104565184,8 earlier,295,0.005060989208941653,7 flexibility,295,0.005060989208941653,11 static,295,0.005060989208941653,6 ou,294,0.005043833313318122,2 nominal,294,0.005043833313318122,7 approximation,294,0.005043833313318122,13 specification,294,0.005043833313318122,13 character_level,294,0.005043833313318122,15 assistant,292,0.005009521522071059,9 fixed,292,0.005009521522071059,5 chinese_word_segmentation,292,0.005009521522071059,25 performing,291,0.004992365626447529,10 cadre,290,0.004975209730823998,5 morpheme,290,0.004975209730823998,8 textual_similarity,290,0.004975209730823998,18 spatial,290,0.004975209730823998,7 virtual,290,0.004975209730823998,7 adequate,289,0.0049580538352004665,8 subsequent,289,0.0049580538352004665,10 sampling,289,0.0049580538352004665,8 edit,289,0.0049580538352004665,4 verification,288,0.004940897939576936,12 integrated,287,0.004923742043953404,10 functionality,287,0.004923742043953404,13 pretrained_language_model,286,0.004906586148329874,25 chunk,286,0.004906586148329874,5 site,286,0.004906586148329874,4 repository,286,0.004906586148329874,10 variational,286,0.004906586148329874,11 probabilistic_model,286,0.004906586148329874,19 hence,286,0.004906586148329874,5 ratio,286,0.004906586148329874,5 consisting,286,0.004906586148329874,10 seq2seq,286,0.004906586148329874,7 intuitive,286,0.004906586148329874,9 belief,285,0.004889430252706342,6 movie,285,0.004889430252706342,5 demand,285,0.004889430252706342,6 such_model,285,0.004889430252706342,10 new_domain,285,0.004889430252706342,10 filter,284,0.0048722743570828115,6 nli,284,0.0048722743570828115,3 thesaurus,284,0.0048722743570828115,9 drop,284,0.0048722743570828115,4 ablation,283,0.004855118461459281,8 amazon,283,0.004855118461459281,6 caption,283,0.004855118461459281,7 traitement,283,0.004855118461459281,10 noun_phrase,283,0.004855118461459281,11 academic,282,0.004837962565835749,8 feasible,282,0.004837962565835749,8 bottleneck,282,0.004837962565835749,10 business,282,0.004837962565835749,8 status,282,0.004837962565835749,6 interested,282,0.004837962565835749,10 nist,281,0.004820806670212219,4 many_language,281,0.004820806670212219,13 informal,281,0.004820806670212219,8 active_learning,281,0.004820806670212219,15 swedish,281,0.004820806670212219,7 deeper,281,0.004820806670212219,6 weakness,280,0.004803650774588687,8 presentation,280,0.004803650774588687,12 text_generation,280,0.004803650774588687,15 large_margin,280,0.004803650774588687,12 computational_model,280,0.004803650774588687,19 cross_language,279,0.004786494878965156,14 financial,279,0.004786494878965156,9 precise,278,0.004769338983341626,7 option,278,0.004769338983341626,6 predictor,278,0.004769338983341626,9 intuition,278,0.004769338983341626,9 portion,278,0.004769338983341626,7 naive,278,0.004769338983341626,5 linguistic_phenomenon,277,0.004752183087718094,21 compact,277,0.004752183087718094,7 body,277,0.004752183087718094,4 attention_based,277,0.004752183087718094,15 rhetorical,276,0.0047350271920945635,10 sound,276,0.0047350271920945635,5 different_approach,276,0.0047350271920945635,18 human_language,276,0.0047350271920945635,14 developer,275,0.004717871296471032,9 sign,275,0.004717871296471032,4 causal,275,0.004717871296471032,6 in_depth,275,0.004717871296471032,8 stance,275,0.004717871296471032,6 distillation,274,0.004700715400847501,12 combined,274,0.004700715400847501,8 unsupervised_method,273,0.004683559505223971,19 soft,273,0.004683559505223971,4 high_precision,273,0.004683559505223971,14 hour,272,0.004666403609600439,4 scarce,272,0.004666403609600439,6 phonological,272,0.004666403609600439,12 documentation,272,0.004666403609600439,13 different_level,272,0.004666403609600439,15 triple,271,0.004649247713976908,6 million,271,0.004649247713976908,7 distant_supervision,271,0.004649247713976908,19 time_consuming,271,0.004649247713976908,14 multi_word,270,0.004632091818353377,10 ainsi,270,0.004632091818353377,5 validity,270,0.004632091818353377,8 anaphora,270,0.004632091818353377,8 experiment_result,270,0.004632091818353377,17 logistic,270,0.004632091818353377,8 external_knowledge,269,0.004614935922729846,18 constituency,269,0.004614935922729846,12 fluent,269,0.004614935922729846,6 orthographic,269,0.004614935922729846,12 restriction,268,0.004597780027106315,11 improves,268,0.004597780027106315,8 preliminary_result,268,0.004597780027106315,18 consequence,268,0.004597780027106315,11 important_task,268,0.004597780027106315,14 false,268,0.004597780027106315,5 em,268,0.004597780027106315,2 tche,268,0.004597780027106315,4 analyse,268,0.004597780027106315,7 tre,268,0.004597780027106315,3 modular,268,0.004597780027106315,7 hand_crafted,267,0.004580624131482784,12 stream,267,0.004580624131482784,6 absence,267,0.004580624131482784,7 first_time,266,0.004563468235859253,10 simulation,266,0.004563468235859253,10 metaphor,265,0.004546312340235722,8 log,265,0.004546312340235722,3 langue,265,0.004546312340235722,6 big,265,0.004546312340235722,3 straightforward,265,0.004546312340235722,15 attribution,265,0.004546312340235722,11 inventory,264,0.004529156444612191,9 daily,264,0.004529156444612191,5 spontaneous,264,0.004529156444612191,11 preposition,264,0.004529156444612191,11 plausible,264,0.004529156444612191,9 vast,263,0.00451200054898866,4 supervised_learning,263,0.00451200054898866,19 synset,263,0.00451200054898866,6 lead,263,0.00451200054898866,4 extract,263,0.00451200054898866,7 hate,262,0.004494844653365129,4 transition_based,262,0.004494844653365129,16 ir,262,0.004494844653365129,2 indian,262,0.004494844653365129,6 popularity,261,0.004477688757741598,10 inclusion,261,0.004477688757741598,9 impressive,261,0.004477688757741598,10 multi_label,261,0.004477688757741598,11 raw_text,261,0.004477688757741598,8 enhancement,261,0.004477688757741598,11 movement,261,0.004477688757741598,8 high_performance,260,0.004460532862118067,16 mot,260,0.004460532862118067,3 syntactic_dependency,260,0.004460532862118067,20 magnitude,260,0.004460532862118067,9 update,260,0.004460532862118067,6 user_generated,259,0.004443376966494536,14 morphosyntactic,259,0.004443376966494536,15 debate,259,0.004443376966494536,6 conjunction,258,0.0044262210708710045,11 best_system,258,0.0044262210708710045,11 file,258,0.0044262210708710045,4 good_performance,258,0.0044262210708710045,16 pronunciation,258,0.0044262210708710045,13 nlp_system,258,0.0044262210708710045,10 entre,258,0.0044262210708710045,5 factual,257,0.004409065175247474,7 forest,257,0.004409065175247474,6 block,256,0.004391909279623943,5 n_best,256,0.004391909279623943,6 respective,256,0.004391909279623943,10 neutral,255,0.004374753384000412,7 matter,255,0.004374753384000412,6 un_corpus,255,0.004374753384000412,9 problematic,255,0.004374753384000412,11 equal_contribution,255,0.004374753384000412,18 state_of_the_art_system,255,0.004374753384000412,23 affect,254,0.004357597488376881,6 multi_modal,254,0.004357597488376881,11 shortcoming,254,0.004357597488376881,11 new_model,253,0.0043404415927533494,9 logistic_regression,253,0.0043404415927533494,19 character_based,253,0.0043404415927533494,15 language_independent,253,0.0043404415927533494,20 legal,253,0.0043404415927533494,5 controlled,252,0.004323285697129819,10 reward,252,0.004323285697129819,6 topical,252,0.004323285697129819,7 new_language,252,0.004323285697129819,12 non_native,251,0.004306129801506287,10 scarcity,251,0.004306129801506287,8 demonstration,251,0.004306129801506287,13 comme,251,0.004306129801506287,5 word2vec,251,0.004306129801506287,8 profile,250,0.004288973905882757,7 day,250,0.004288973905882757,3 human_annotation,250,0.004288973905882757,16 text_based,250,0.004288973905882757,10 extrinsic,250,0.004288973905882757,9 substantial_improvement,250,0.004288973905882757,23 bound,249,0.004271818010259226,5 trigger,249,0.004271818010259226,7 previous_research,249,0.004271818010259226,17 symbolic,249,0.004271818010259226,8 beam,249,0.004271818010259226,4 generalized,249,0.004271818010259226,11 richer,249,0.004271818010259226,6 binary_classification,248,0.004254662114635694,21 limit,248,0.004254662114635694,5 audience,248,0.004254662114635694,8 english_german,248,0.004254662114635694,14 non,248,0.004254662114635694,3 syntax_based,247,0.004237506219012164,12 synchronous,247,0.004237506219012164,11 incomplete,247,0.004237506219012164,10 divergence,246,0.004220350323388632,10 scene,246,0.004220350323388632,5 domaine,246,0.004220350323388632,7 discourse_relation,245,0.0042031944277651015,18 inflection,245,0.0042031944277651015,10 simultaneous,245,0.0042031944277651015,12 small_number,245,0.0042031944277651015,12 wide_variety,245,0.0042031944277651015,12 automatic_metric,245,0.0042031944277651015,16 phrasal,245,0.0042031944277651015,7 sub_tasks,245,0.0042031944277651015,9 attachment,245,0.0042031944277651015,10 journal,244,0.004186038532141571,7 growth,244,0.004186038532141571,6 resulting,244,0.004186038532141571,9 evolution,244,0.004186038532141571,9 writer,244,0.004186038532141571,6 modle,244,0.004186038532141571,5 education,244,0.004186038532141571,9 two_stage,244,0.004186038532141571,9 macro,243,0.004168882636518039,5 rich_language,243,0.004168882636518039,13 smantique,243,0.004168882636518039,9 recording,243,0.004168882636518039,9 linguistic_analysis,243,0.004168882636518039,19 unsupervised_approach,243,0.004168882636518039,21 proposition,243,0.004168882636518039,11 enhanced,242,0.004151726740894509,8 aggregation,242,0.004151726740894509,11 framenet,242,0.004151726740894509,8 scratch,241,0.004134570845270977,7 flow,241,0.004134570845270977,4 httpsgithub.com,241,0.004134570845270977,15 argumentation,241,0.004134570845270977,13 general_purpose,241,0.004134570845270977,15 compositionality,241,0.004134570845270977,16 truth,240,0.004117414949647446,5 educational,240,0.004117414949647446,11 neural_network_architecture,239,0.004100259054023916,27 question_answering,239,0.004100259054023916,18 crowdsourcing,239,0.004100259054023916,13 recent_study,239,0.004100259054023916,12 montrons,238,0.004083103158400384,8 rise,238,0.004083103158400384,4 aware,238,0.004083103158400384,5 semantic_parser,238,0.004083103158400384,15 small_set,238,0.004083103158400384,9 pre_processing,237,0.0040659472627768535,14 ie,237,0.0040659472627768535,2 correctness,237,0.0040659472627768535,11 simplicity,236,0.004048791367153322,10 attack,236,0.004048791367153322,6 collaboration,236,0.004048791367153322,13 insufficient,236,0.004048791367153322,12 extractor,235,0.004031635471529791,9 masked,235,0.004031635471529791,6 trade_off,235,0.004031635471529791,9 automatic_detection,235,0.004031635471529791,19 short_text,235,0.004031635471529791,10 se,235,0.004031635471529791,2 license,234,0.00401447957590626,7 ud,234,0.00401447957590626,2 typology,234,0.00401447957590626,8 deal,234,0.00401447957590626,4 testing,234,0.00401447957590626,7 context_free_grammar,234,0.00401447957590626,20 distributional_semantics,234,0.00401447957590626,24 monolingual_data,234,0.00401447957590626,16 member,233,0.003997323680282729,6 variability,233,0.003997323680282729,11 bilingual_dictionary,233,0.003997323680282729,20 shared_task,233,0.003997323680282729,11 bag_of_words,232,0.0039801677846591985,12 out_of_vocabulary,232,0.0039801677846591985,17 trait,232,0.0039801677846591985,5 diagnosis,232,0.0039801677846591985,9 faster,232,0.0039801677846591985,6 further_research,231,0.003963011889035667,16 desired,231,0.003963011889035667,7 protocol,231,0.003963011889035667,8 window,231,0.003963011889035667,6 andor,231,0.003963011889035667,5 creative,231,0.003963011889035667,8 approximate,231,0.003963011889035667,11 unknown_word,231,0.003963011889035667,12 dirichlet,231,0.003963011889035667,9 different_model,230,0.003945855993412136,15 brief,230,0.003945855993412136,5 remarkable,230,0.003945855993412136,10 unclear,230,0.003945855993412136,7 semeval_2019,230,0.003945855993412136,12 human_annotator,230,0.003945855993412136,15 multi_document_summarization,230,0.003945855993412136,28 aid,230,0.003945855993412136,3 mutual_information,229,0.003928700097788605,18 bootstrapping,229,0.003928700097788605,13 social_network,229,0.003928700097788605,14 paraphrasing,229,0.003928700097788605,12 prosodic,229,0.003928700097788605,8 literary,228,0.003911544202165074,8 semeval_2022,228,0.003911544202165074,12 descriptive,227,0.003894388306541543,11 abstractive_summarization,227,0.003894388306541543,25 semeval_2019_task,227,0.003894388306541543,17 weakly,227,0.003894388306541543,6 significance,227,0.003894388306541543,12 associated,226,0.003877232410918012,10 existence,226,0.003877232410918012,9 ordering,226,0.003877232410918012,8 thanks,226,0.003877232410918012,6 kb,226,0.003877232410918012,2 foundation,226,0.003877232410918012,10 deployment,226,0.003877232410918012,10 hmm,226,0.003877232410918012,3 intention,226,0.003877232410918012,9 semeval_2022_task,225,0.0038600765152944807,17 room,225,0.0038600765152944807,4 wider,224,0.00384292061967095,5 _a,224,0.00384292061967095,2 mobile,224,0.00384292061967095,6 inter_annotator_agreement,223,0.003825764724047419,25 word_based,223,0.003825764724047419,10 superiority,223,0.003825764724047419,11 semantic_annotation,223,0.003825764724047419,19 worse,222,0.003808608828423888,5 tuning,221,0.0037914529328003568,6 natural_language_text,221,0.0037914529328003568,21 blog,221,0.0037914529328003568,4 planning,221,0.0037914529328003568,8 turkish,221,0.0037914529328003568,7 neighbor,221,0.0037914529328003568,8 infrastructure,221,0.0037914529328003568,14 predicted,220,0.0037742970371768257,9 spoken_dialogue_system,220,0.0037742970371768257,22 semantic_model,220,0.0037742970371768257,14 ressources,220,0.0037742970371768257,10 learning_based,220,0.0037742970371768257,14 semeval_2016,220,0.0037742970371768257,12 call,219,0.003757141141553295,4 sub_task,219,0.003757141141553295,8 parallel_text,219,0.003757141141553295,13 predicate_argument,219,0.003757141141553295,18 elementary,219,0.003757141141553295,10 monolingual_corpus,219,0.003757141141553295,18 srl,219,0.003757141141553295,3 hybrid_approach,219,0.003757141141553295,15 cross_lingual_transfer,218,0.003739985245929764,22 semi_supervised_learning,218,0.003739985245929764,24 multi_domain,218,0.003739985245929764,12 moses,218,0.003739985245929764,5 coefficient,217,0.003722829350306233,11 convolution,217,0.003722829350306233,11 uniform,216,0.0037056734546827017,7 perceptron,216,0.0037056734546827017,10 refinement,216,0.0037056734546827017,10 acl,216,0.0037056734546827017,3 analogy,216,0.0037056734546827017,7 multitask,216,0.0037056734546827017,9 long_distance,216,0.0037056734546827017,13 stable,215,0.0036885175590591706,6 qualitative_analysis,215,0.0036885175590591706,20 knowledge_based,215,0.0036885175590591706,15 tracking,215,0.0036885175590591706,8 cultural,215,0.0036885175590591706,8 broader,214,0.0036713616634356395,7 bilingual_corpus,214,0.0036713616634356395,16 nmt_model,214,0.0036713616634356395,9 nous_montrons,214,0.0036713616634356395,13 contemporary,214,0.0036713616634356395,12 offensive_language,214,0.0036713616634356395,18 vital,214,0.0036713616634356395,5 lexical_feature,214,0.0036713616634356395,15 intervention,213,0.003654205767812109,12 inconsistency,213,0.003654205767812109,13 log_linear,212,0.0036370498721885777,10 prominent,212,0.0036370498721885777,9 construct,212,0.0036370498721885777,9 promise,212,0.0036370498721885777,7 tude,211,0.0036198939765650466,4 joint_model,211,0.0036198939765650466,11 travail,211,0.0036198939765650466,7 desirable,211,0.0036198939765650466,9 serious,211,0.0036198939765650466,7 enough,211,0.0036198939765650466,6 semi_automatic,211,0.0036198939765650466,14 native_speaker,210,0.0036027380809415155,14 connective,210,0.0036027380809415155,10 lattice,210,0.0036027380809415155,7 state_of_the_art_approach,210,0.0036027380809415155,25 xml,210,0.0036027380809415155,3 deterministic,210,0.0036027380809415155,13 oracle,210,0.0036027380809415155,6 manual_evaluation,209,0.0035855821853179844,17 post_processing,209,0.0035855821853179844,15 stronger,209,0.0035855821853179844,8 back_translation,209,0.0035855821853179844,16 semeval_2016_task,209,0.0035855821853179844,17 various_type,209,0.0035855821853179844,12 tokenization,209,0.0035855821853179844,12 observed,209,0.0035855821853179844,8 plan,209,0.0035855821853179844,4 bilingual_lexicon,209,0.0035855821853179844,17 release,208,0.0035684262896944533,7 citation,208,0.0035684262896944533,8 foreign_language,208,0.0035684262896944533,16 posterior,208,0.0035684262896944533,9 different_way,208,0.0035684262896944533,13 encouraging,208,0.0035684262896944533,11 context_aware,208,0.0035684262896944533,13 editor,208,0.0035684262896944533,6 keyword,208,0.0035684262896944533,7 th,208,0.0035684262896944533,2 multilingual_model,208,0.0035684262896944533,18 high_resource,207,0.0035512703940709226,13 morphological_analyzer,207,0.0035512703940709226,22 named,207,0.0035512703940709226,5 constrained,207,0.0035512703940709226,11 root,207,0.0035512703940709226,4 concrete,206,0.0035341144984473915,8 new_feature,206,0.0035341144984473915,11 confusion,206,0.0035341144984473915,9 threshold,206,0.0035341144984473915,9 adequacy,206,0.0035341144984473915,8 good_result,206,0.0035341144984473915,11 new_corpus,205,0.0035169586028238604,10 hundred,205,0.0035169586028238604,7 feature_based,205,0.0035169586028238604,13 tendency,205,0.0035169586028238604,8 subword,205,0.0035169586028238604,7 translated,204,0.0034998027072003293,10 ccg,204,0.0034998027072003293,3 argumentative,204,0.0034998027072003293,13 bigram,204,0.0034998027072003293,6 mismatch,204,0.0034998027072003293,8 symbol,204,0.0034998027072003293,6 off_the_shelf,204,0.0034998027072003293,13 bank,204,0.0034998027072003293,4 emphasis,203,0.0034826468115767982,8 center,203,0.0034826468115767982,6 multi_lingual,203,0.0034826468115767982,13 school,203,0.0034826468115767982,6 different_task,203,0.0034826468115767982,14 perform,203,0.0034826468115767982,7 lightweight,203,0.0034826468115767982,11 american,203,0.0034826468115767982,8 pivot,203,0.0034826468115767982,5 exercise,203,0.0034826468115767982,8 redundant,202,0.0034654909159532675,9 l'analyse,202,0.0034654909159532675,9 redundancy,202,0.0034654909159532675,10 greedy,202,0.0034654909159532675,6 acceptable,202,0.0034654909159532675,10 sota,202,0.0034654909159532675,4 sarcasm,202,0.0034654909159532675,7 crfs,202,0.0034654909159532675,4 prompt,201,0.0034483350203297364,6 categorial,201,0.0034483350203297364,10 demo,201,0.0034483350203297364,4 patent,201,0.0034483350203297364,6 on_line,201,0.0034483350203297364,7 syllable,201,0.0034483350203297364,8 failure,201,0.0034483350203297364,7 effective_method,201,0.0034483350203297364,16 finnish,201,0.0034483350203297364,7 superior_performance,201,0.0034483350203297364,20 phone,201,0.0034483350203297364,5 recursive,201,0.0034483350203297364,9 society,201,0.0034483350203297364,7 request,201,0.0034483350203297364,7 nlu,201,0.0034483350203297364,3 lstms,201,0.0034483350203297364,5 np,201,0.0034483350203297364,2 inflectional,200,0.0034311791247062053,12 token_level,200,0.0034311791247062053,11 reddit,200,0.0034311791247062053,6 detailed_analysis,200,0.0034311791247062053,17 semeval_2018,200,0.0034311791247062053,12 syntactic_parsing,199,0.0034140232290826742,17 clean,199,0.0034140232290826742,5 punctuation,199,0.0034140232290826742,11 judge,199,0.0034140232290826742,5 polish,199,0.0034140232290826742,6 old,199,0.0034140232290826742,3 literal,198,0.003396867333459143,7 parallel_sentence,198,0.003396867333459143,17 psycholinguistic,198,0.003396867333459143,16 channel,198,0.003396867333459143,7 recent_research,198,0.003396867333459143,15 overall_performance,198,0.003396867333459143,19 largescale,198,0.003396867333459143,10 percentage,198,0.003396867333459143,10 predefined,198,0.003396867333459143,10 covid_19,198,0.003396867333459143,8 cosine,198,0.003396867333459143,6 antecedent,197,0.003379711437835612,10 langues,197,0.003379711437835612,7 identity,197,0.003379711437835612,8 restaurant,197,0.003379711437835612,10 isolation,197,0.003379711437835612,9 da,197,0.003379711437835612,2 proportion,197,0.003379711437835612,10 intensity,197,0.003379711437835612,9 known,196,0.0033625555422120814,5 mwes,196,0.0033625555422120814,4 tamil,196,0.0033625555422120814,5 compatible,196,0.0033625555422120814,10 text_summarization,196,0.0033625555422120814,18 stylistic,196,0.0033625555422120814,9 care,196,0.0033625555422120814,4 robot,196,0.0033625555422120814,5 complement,195,0.0033453996465885503,10 different_method,195,0.0033453996465885503,16 comparable_performance,195,0.0033453996465885503,22 empirical_evaluation,195,0.0033453996465885503,20 sentiment_analysis,195,0.0033453996465885503,18 current_state,195,0.0033453996465885503,13 stanford,195,0.0033453996465885503,8 irrelevant,195,0.0033453996465885503,10 newswire,195,0.0033453996465885503,8 native_language,195,0.0033453996465885503,15 dual,195,0.0033453996465885503,4 indian_language,194,0.003328243750965019,15 amr,194,0.003328243750965019,3 canonical,194,0.003328243750965019,9 closed,194,0.003328243750965019,6 state_of_the_art_baseline,194,0.003328243750965019,25 long_term,194,0.003328243750965019,9 adversarial_training,194,0.003328243750965019,20 unsupervised_learning,194,0.003328243750965019,21 mt_system,194,0.003328243750965019,9 split,193,0.003311087855341488,5 numerical,193,0.003311087855341488,9 inconsistent,193,0.003311087855341488,12 semeval_2018_task,193,0.003311087855341488,17 code_mixed,193,0.003311087855341488,10 fine,192,0.003293931959717957,4 spelling,192,0.003293931959717957,8 picture,192,0.003293931959717957,7 single_word,192,0.003293931959717957,11 thorough,192,0.003293931959717957,8 task_oriented_dialogue,192,0.003293931959717957,22 nlp_model,192,0.003293931959717957,9 lexical_information,191,0.003276776064094426,19 abstraction,191,0.003276776064094426,11 galement,191,0.003276776064094426,8 classic,191,0.003276776064094426,7 diffrents,191,0.003276776064094426,9 many_application,191,0.003276776064094426,16 further_improvement,191,0.003276776064094426,19 widespread,191,0.003276776064094426,10 recognizer,191,0.003276776064094426,10 biomedical_text,191,0.003276776064094426,15 mistake,190,0.003259620168470895,7 real_life,190,0.003259620168470895,9 snippet,190,0.003259620168470895,7 linking,190,0.003259620168470895,7 demographic,189,0.003242464272847364,11 productivity,189,0.003242464272847364,12 discrimination,189,0.003242464272847364,14 leur,189,0.003242464272847364,4 automatic_extraction,188,0.003225308377223833,20 syntactic_analysis,188,0.003225308377223833,18 peut,188,0.003225308377223833,4 proficiency,188,0.003225308377223833,11 mind,187,0.003208152481600302,4 transformer_based_model,187,0.003208152481600302,23 contrary,187,0.003208152481600302,8 suffers,187,0.003208152481600302,7 satisfactory,187,0.003208152481600302,12 modified,187,0.003208152481600302,8 fourth,187,0.003208152481600302,6 reranking,187,0.003208152481600302,9 human_performance,187,0.003208152481600302,17 grammatical_error_correction,186,0.0031909965859767708,28 syntaxique,186,0.0031909965859767708,10 self_supervised,186,0.0031909965859767708,15 train,185,0.00317384069035324,5 inductive,185,0.00317384069035324,9 logical_form,185,0.00317384069035324,12 drawback,185,0.00317384069035324,8 so_called,185,0.00317384069035324,9 depth,185,0.00317384069035324,5 artificial_intelligence,185,0.00317384069035324,23 speech_recognition,185,0.00317384069035324,18 none,184,0.003156684794729709,4 transduction,184,0.003156684794729709,12 upper,184,0.003156684794729709,5 english_text,184,0.003156684794729709,12 semeval_2021,184,0.003156684794729709,12 autoencoder,184,0.003156684794729709,11 bottom_up,184,0.003156684794729709,9 density,184,0.003156684794729709,7 consistent_improvement,184,0.003156684794729709,22 temporal_relation,184,0.003156684794729709,17 lda,183,0.003139528899106178,3 figure,183,0.003139528899106178,6 experimental_evaluation,183,0.003139528899106178,23 tutorial,183,0.003139528899106178,8 contexte,183,0.003139528899106178,8 semeval_2021_task,183,0.003139528899106178,17 unannotated,183,0.003139528899106178,11 diagnostic,183,0.003139528899106178,10 identifier,183,0.003139528899106178,10 lexicalized,183,0.003139528899106178,11 broad_coverage,182,0.003122373003482647,14 dependency_based,182,0.003122373003482647,16 government,182,0.003122373003482647,10 human_judgement,182,0.003122373003482647,15 semantic_structure,182,0.003122373003482647,18 lowresource,182,0.003122373003482647,11 competitive_baseline,182,0.003122373003482647,20 integer,182,0.003122373003482647,7 l2,182,0.003122373003482647,2 variance,182,0.003122373003482647,8 supervised_machine,181,0.0031052171078591157,18 bad,181,0.0031052171078591157,3 biomedical_domain,181,0.0031052171078591157,17 meeting,181,0.0031052171078591157,7 offline,181,0.0031052171078591157,7 german_english,181,0.0031052171078591157,14 ter,181,0.0031052171078591157,3 thing,181,0.0031052171078591157,5 diachronic,181,0.0031052171078591157,10 statistical_method,181,0.0031052171078591157,18 operator,180,0.0030880612122355846,8 reconstruction,180,0.0030880612122355846,14 navigation,180,0.0030880612122355846,10 aligned,180,0.0030880612122355846,7 lexical_item,180,0.0030880612122355846,12 referential,180,0.0030880612122355846,11 iteration,180,0.0030880612122355846,9 institute,180,0.0030880612122355846,9 hidden_markov,180,0.0030880612122355846,13 human_like,180,0.0030880612122355846,10 allocation,180,0.0030880612122355846,10 different_feature,180,0.0030880612122355846,17 wrong,180,0.0030880612122355846,5 drug,180,0.0030880612122355846,4 equivalence,180,0.0030880612122355846,11 present_result,180,0.0030880612122355846,14 pretrained_model,179,0.003070905316612054,16 semeval_2017,179,0.003070905316612054,12 two_step,179,0.003070905316612054,8 grounding,179,0.003070905316612054,9 social_medium_platform,179,0.003070905316612054,22 categorial_grammar,179,0.003070905316612054,18 suffix,179,0.003070905316612054,6 traduction,179,0.003070905316612054,10 coarse_grained,179,0.003070905316612054,14 semantic_space,179,0.003070905316612054,14 differs,179,0.003070905316612054,7 affective,179,0.003070905316612054,9 duration,179,0.003070905316612054,8 subjectivity,179,0.003070905316612054,12 revision,178,0.003053749420988523,8 expertise,178,0.003053749420988523,9 obstacle,178,0.003053749420988523,8 whereas,178,0.003053749420988523,7 low_resource_setting,178,0.003053749420988523,20 synthetic_data,178,0.003053749420988523,14 gaussian,178,0.003053749420988523,8 specificity,178,0.003053749420988523,11 l'utilisation,178,0.003053749420988523,13 usability,177,0.0030365935253649917,9 automatic_identification,177,0.0030365935253649917,24 guidance,177,0.0030365935253649917,8 mechanical,177,0.0030365935253649917,10 exchange,177,0.0030365935253649917,8 organizer,177,0.0030365935253649917,9 chat,177,0.0030365935253649917,4 market,177,0.0030365935253649917,6 perturbation,177,0.0030365935253649917,12 formation,177,0.0030365935253649917,9 extractive_summarization,177,0.0030365935253649917,24 prior_knowledge,176,0.0030194376297414606,15 phoneme,176,0.0030194376297414606,7 specific_domain,176,0.0030194376297414606,15 session,176,0.0030194376297414606,7 single_model,176,0.0030194376297414606,12 ontological,176,0.0030194376297414606,11 different_datasets,176,0.0030194376297414606,18 phrase_based_smt,176,0.0030194376297414606,16 semantic_relatedness,176,0.0030194376297414606,20 calculation,176,0.0030194376297414606,11 discrepancy,175,0.0030022817341179295,11 barrier,175,0.0030022817341179295,7 pruning,175,0.0030022817341179295,7 headline,175,0.0030022817341179295,8 initiative,175,0.0030022817341179295,10 kg,175,0.0030022817341179295,2 asian,175,0.0030022817341179295,5 large_set,175,0.0030022817341179295,9 free_text,175,0.0030022817341179295,9 modifier,174,0.0029851258384943984,8 psychological,174,0.0029851258384943984,13 practitioner,173,0.0029679699428708677,12 excellent,173,0.0029679699428708677,9 utilisant,173,0.0029679699428708677,9 textual_data,173,0.0029679699428708677,12 voting,173,0.0029679699428708677,6 coordination,173,0.0029679699428708677,12 indexing,173,0.0029679699428708677,8 mthodes,173,0.0029679699428708677,7 versus,173,0.0029679699428708677,6 under_resourced,172,0.0029508140472473366,15 semeval_2017_task,172,0.0029508140472473366,17 local_context,172,0.0029508140472473366,13 physical,172,0.0029508140472473366,8 disorder,172,0.0029508140472473366,8 reaction,172,0.0029508140472473366,8 rnns,172,0.0029508140472473366,4 self_training,172,0.0029508140472473366,13 novel_framework,171,0.0029336581516238055,15 api,171,0.0029336581516238055,3 targeted,171,0.0029336581516238055,8 linguistic_annotation,171,0.0029336581516238055,21 dominant,171,0.0029336581516238055,8 latest,171,0.0029336581516238055,6 texte,171,0.0029336581516238055,5 smantiques,171,0.0029336581516238055,10 large_collection,171,0.0029336581516238055,16 communicative,171,0.0029336581516238055,13 different_aspect,170,0.0029165022560002744,16 different_word,170,0.0029165022560002744,14 referent,170,0.0029165022560002744,8 httpsgithub,170,0.0029165022560002744,11 relative_improvement,170,0.0029165022560002744,20 linguistiques,170,0.0029165022560002744,13 regularity,170,0.0029165022560002744,10 such_system,170,0.0029165022560002744,11 replacement,169,0.0028993463603767433,11 induced,169,0.0028993463603767433,7 leaderboard,169,0.0028993463603767433,11 semantic_knowledge,169,0.0028993463603767433,18 exploitation,169,0.0028993463603767433,12 lexical_semantics,169,0.0028993463603767433,17 norm,169,0.0028993463603767433,4 major_challenge,169,0.0028993463603767433,15 perfect,168,0.0028821904647532122,7 spectrum,168,0.0028821904647532122,8 premise,168,0.0028821904647532122,7 principled,168,0.0028821904647532122,10 ideal,168,0.0028821904647532122,5 crowdsourced,168,0.0028821904647532122,12 augmented,167,0.0028650345691296816,9 ace,167,0.0028650345691296816,3 masked_language,167,0.0028650345691296816,15 chinese_to_english,167,0.0028650345691296816,18 vowel,167,0.0028650345691296816,5 viable,167,0.0028650345691296816,6 several_language,167,0.0028650345691296816,16 pearson,166,0.0028478786735061505,7 significant_performance,166,0.0028478786735061505,23 flat,166,0.0028478786735061505,4 novelty,166,0.0028478786735061505,7 trained_model,166,0.0028478786735061505,13 une_approche,166,0.0028478786735061505,12 sensitivity,166,0.0028478786735061505,11 permet,166,0.0028478786735061505,6 personality,166,0.0028478786735061505,11 disagreement,166,0.0028478786735061505,12 adoption,165,0.0028307227778826194,8 labelling,165,0.0028307227778826194,9 turk,165,0.0028307227778826194,4 compte,165,0.0028307227778826194,6 hypernym,165,0.0028307227778826194,8 normal,165,0.0028307227778826194,6 ont,164,0.0028135668822590883,3 mechanical_turk,164,0.0028135668822590883,15 permettant,164,0.0028135668822590883,10 python,164,0.0028135668822590883,6 convolutional_network,164,0.0028135668822590883,21 degradation,164,0.0028135668822590883,11 dialectal,164,0.0028135668822590883,9 question_answer,164,0.0028135668822590883,15 typological,164,0.0028135668822590883,11 preliminary_experiment,164,0.0028135668822590883,22 innovation,164,0.0028135668822590883,10 relevant_information,163,0.002796410986635557,20 statistical_approach,163,0.002796410986635557,20 conversational_agent,163,0.002796410986635557,20 century,163,0.002796410986635557,7 objective_function,163,0.002796410986635557,18 linguistic_structure,163,0.002796410986635557,20 polysemy,163,0.002796410986635557,8 pseudo,163,0.002796410986635557,6 naive_bayes,163,0.002796410986635557,11 multi_hop,163,0.002796410986635557,9 theme,163,0.002796410986635557,5 law,162,0.0027792550910120265,3 simulated,162,0.0027792550910120265,9 weighting,162,0.0027792550910120265,9 latency,162,0.0027792550910120265,7 enable,162,0.0027792550910120265,6 franccais,162,0.0027792550910120265,9 extensible,162,0.0027792550910120265,10 first_attempt,162,0.0027792550910120265,13 mathematical,162,0.0027792550910120265,12 parole,162,0.0027792550910120265,6 difficult_task,162,0.0027792550910120265,14 hidden_markov_model,162,0.0027792550910120265,19 phrase_based_translation,162,0.0027792550910120265,24 sparseness,161,0.0027620991953884954,10 net,161,0.0027620991953884954,3 linguistique,161,0.0027620991953884954,12 ibm,161,0.0027620991953884954,3 innovative,161,0.0027620991953884954,10 multi_class,161,0.0027620991953884954,11 premier,161,0.0027620991953884954,7 glue,161,0.0027620991953884954,4 attractive,161,0.0027620991953884954,10 ranked,161,0.0027620991953884954,6 fake,160,0.0027449432997649643,4 ml,160,0.0027449432997649643,2 contains,160,0.0027449432997649643,8 modern_standard,160,0.0027449432997649643,15 everyday,160,0.0027449432997649643,8 automatiquement,160,0.0027449432997649643,15 finite_state_transducer,160,0.0027449432997649643,23 useful_information,160,0.0027449432997649643,18 edition,160,0.0027449432997649643,7 particle,160,0.0027449432997649643,8 dynamic_programming,160,0.0027449432997649643,19 black_box,159,0.002727787404141433,9 sts,159,0.002727787404141433,3 related_language,159,0.002727787404141433,16 bilstm,159,0.002727787404141433,6 varies,159,0.002727787404141433,6 email,159,0.002727787404141433,5 tf_idf,159,0.002727787404141433,6 consensus,159,0.002727787404141433,9 incorporation,159,0.002727787404141433,13 batch,159,0.002727787404141433,5 hpsg,159,0.002727787404141433,4 finetuning,158,0.002710631508517902,10 automatic_translation,158,0.002710631508517902,21 bi_directional,158,0.002710631508517902,14 latent_dirichlet,158,0.002710631508517902,16 structural_information,158,0.002710631508517902,22 scalability,158,0.002710631508517902,11 wide_coverage,158,0.002710631508517902,13 general_domain,158,0.002710631508517902,14 intensive,158,0.002710631508517902,9 facebook,157,0.002693475612894371,8 recherche,157,0.002693475612894371,9 subtle,157,0.002693475612894371,6 automatic_generation,157,0.002693475612894371,20 scientific_paper,157,0.002693475612894371,16 minority,157,0.002693475612894371,8 pre_trained_word,157,0.002693475612894371,16 letter,157,0.002693475612894371,6 main_contribution,157,0.002693475612894371,17 compare,157,0.002693475612894371,7 e_commerce,157,0.002693475612894371,10 mwe,157,0.002693475612894371,3 decrease,156,0.0026763197172708403,8 characterization,156,0.0026763197172708403,16 plain,156,0.0026763197172708403,5 satisfaction,156,0.0026763197172708403,12 automaton,156,0.0026763197172708403,9 afin,156,0.0026763197172708403,4 external_resource,156,0.0026763197172708403,17 ad,156,0.0026763197172708403,2 simple_method,156,0.0026763197172708403,13 archive,156,0.0026763197172708403,7 experimentation,155,0.002659163821647309,15 preparation,155,0.002659163821647309,11 lemmatization,155,0.002659163821647309,13 exploratory,155,0.002659163821647309,11 n_gram_language,155,0.002659163821647309,15 elmo,155,0.002659163821647309,4 preservation,155,0.002659163821647309,12 look,155,0.002659163821647309,4 bag,155,0.002659163821647309,3 standardized,155,0.002659163821647309,12 linguistic_data,155,0.002659163821647309,15 prevalent,155,0.002659163821647309,9 careful,154,0.002642007926023778,7 thread,154,0.002642007926023778,6 thematic,154,0.002642007926023778,8 re_ranking,154,0.002642007926023778,10 humanity,154,0.002642007926023778,8 new_data,154,0.002642007926023778,8 peuvent,154,0.002642007926023778,7 hierarchical_structure,154,0.002642007926023778,22 trainable,154,0.002642007926023778,9 latent_dirichlet_allocation,154,0.002642007926023778,27 higher_level,154,0.002642007926023778,12 vers,154,0.002642007926023778,4 attitude,153,0.002624852030400247,8 biological,153,0.002624852030400247,10 comparative_study,153,0.002624852030400247,17 exhibit,153,0.002624852030400247,7 english_french,153,0.002624852030400247,14 abundant,153,0.002624852030400247,8 strict,153,0.002624852030400247,6 auxiliary_task,153,0.002624852030400247,14 chunking,153,0.002624852030400247,8 temporal_information,152,0.002607696134776716,20 identical,152,0.002607696134776716,9 effective_approach,152,0.002607696134776716,18 nave,152,0.002607696134776716,4 shorter,152,0.002607696134776716,7 independence,152,0.002607696134776716,12 different_kind,152,0.002607696134776716,14 chinese_character,152,0.002607696134776716,17 closer,152,0.002607696134776716,6 oov,151,0.002590540239153185,3 consumer,151,0.002590540239153185,8 aspect_based,151,0.002590540239153185,12 consists,151,0.002590540239153185,8 cross_linguistic,151,0.002590540239153185,16 d'information,151,0.002590540239153185,13 clinical_text,151,0.002590540239153185,13 simplified,151,0.002590540239153185,10 common_sense,151,0.002590540239153185,12 squad,151,0.002590540239153185,5 montrent,151,0.002590540239153185,8 privacy,151,0.002590540239153185,7 intended,151,0.002590540239153185,8 son,151,0.002590540239153185,3 explainable,151,0.002590540239153185,11 other_domain,151,0.002590540239153185,12 rest,151,0.002590540239153185,4 current_approach,151,0.002590540239153185,16 microsoft,150,0.002573384343529654,9 semantic_class,150,0.002573384343529654,14 sharing,150,0.002573384343529654,7 repetition,150,0.002573384343529654,10 lab,150,0.002573384343529654,3 predicate_argument_structure,150,0.002573384343529654,28 worker,150,0.002573384343529654,6 boost,150,0.002573384343529654,5 correlate,150,0.002573384343529654,9 crowd,150,0.002573384343529654,5 first_order,150,0.002573384343529654,11 insertion,149,0.002556228447906123,9 examination,149,0.002556228447906123,11 detector,149,0.002556228447906123,8 automatic_method,149,0.002556228447906123,16 social_medium_text,149,0.002556228447906123,18 existing,149,0.002556228447906123,8 selectional,149,0.002556228447906123,11 distributional_similarity,149,0.002556228447906123,25 better_understanding,149,0.002556228447906123,20 ubiquitous,149,0.002556228447906123,10 trs,149,0.002556228447906123,3 generate,148,0.002539072552282592,8 non_english,148,0.002539072552282592,11 constant,148,0.002539072552282592,8 woman,148,0.002539072552282592,5 developed,148,0.002539072552282592,9 identifies,148,0.002539072552282592,10 multi_level,148,0.002539072552282592,11 convergence,148,0.002539072552282592,11 slow,148,0.002539072552282592,4 modern_standard_arabic,147,0.002521916656659061,22 advancement,147,0.002521916656659061,11 abbreviation,147,0.002521916656659061,12 reprsentation,147,0.002521916656659061,13 wer,147,0.002521916656659061,3 semantic_dependency,147,0.002521916656659061,19 new_word,147,0.002521916656659061,8 orientation,147,0.002521916656659061,11 non_standard,147,0.002521916656659061,12 cognate,147,0.002521916656659061,7 unable,147,0.002521916656659061,6 abusive,147,0.002521916656659061,7 non_trivial,147,0.002521916656659061,11 factorization,146,0.0025047607610355297,13 chart,146,0.0025047607610355297,5 psychology,146,0.0025047607610355297,10 party,146,0.0025047607610355297,5 erroneous,146,0.0025047607610355297,9 enrichment,146,0.0025047607610355297,10 rationale,146,0.0025047607610355297,9 une_mthode,146,0.0025047607610355297,10 valuation,146,0.0025047607610355297,9 concise,146,0.0025047607610355297,7 diffrentes,146,0.0025047607610355297,10 context_sensitive,146,0.0025047607610355297,17 humor,145,0.002487604865411999,5 phrase_based_machine,145,0.002487604865411999,20 neural_approach,145,0.002487604865411999,15 multiple_choice,145,0.002487604865411999,15 multilingual_bert,145,0.002487604865411999,17 web_search,145,0.002487604865411999,10 human_annotated,145,0.002487604865411999,15 network_based,145,0.002487604865411999,13 indirect,145,0.002487604865411999,8 mais,145,0.002487604865411999,4 human_translation,145,0.002487604865411999,17 unrestricted,145,0.002487604865411999,12 gloss,145,0.002487604865411999,5 top_down,144,0.002470448969788468,8 sentential,144,0.002470448969788468,10 gpt_2,144,0.002470448969788468,5 awareness,144,0.002470448969788468,9 tm,144,0.002470448969788468,2 lecture,144,0.002470448969788468,7 effective_way,144,0.002470448969788468,13 automatic_classification,144,0.002470448969788468,24 long_range,144,0.002470448969788468,10 modles,144,0.002470448969788468,6 half,144,0.002470448969788468,4 nearest,143,0.002453293074164937,7 domainspecific,143,0.002453293074164937,14 latin,143,0.002453293074164937,5 phrase_based_machine_translation,143,0.002453293074164937,32 curriculum,143,0.002453293074164937,10 st,143,0.002453293074164937,2 tal,143,0.002453293074164937,3 manager,143,0.002453293074164937,7 higher_accuracy,143,0.002453293074164937,15 langage,143,0.002453293074164937,7 statistical_mt,143,0.002453293074164937,14 assistance,143,0.002453293074164937,10 adjacent,142,0.0024361371785414057,8 start,142,0.0024361371785414057,5 other_method,142,0.0024361371785414057,12 gesture,142,0.0024361371785414057,7 plusieurs,142,0.0024361371785414057,9 extreme,142,0.0024361371785414057,7 dtection,142,0.0024361371785414057,8 morpho_syntactic,142,0.0024361371785414057,16 code_switching,142,0.0024361371785414057,14 eye,142,0.0024361371785414057,3 text_to_speech,142,0.0024361371785414057,14 formula,141,0.0024189812829178746,7 n_gram_language_model,141,0.0024189812829178746,21 probable,141,0.0024189812829178746,8 idiom,141,0.0024189812829178746,5 present_paper,141,0.0024189812829178746,13 _the,140,0.0024018253872943435,4 si,140,0.0024018253872943435,2 personalized,140,0.0024018253872943435,12 grammaticality,140,0.0024018253872943435,14 partner,140,0.0024018253872943435,7 automatic_text,140,0.0024018253872943435,14 balanced,140,0.0024018253872943435,8 such_data,140,0.0024018253872943435,9 symptom,140,0.0024018253872943435,7 additional_information,140,0.0024018253872943435,22 greek,140,0.0024018253872943435,5 tense,140,0.0024018253872943435,5 automatic_evaluation_metric,140,0.0024018253872943435,27 varied,140,0.0024018253872943435,6 reconnaissance,140,0.0024018253872943435,14 much_attention,140,0.0024018253872943435,14 understood,139,0.002384669491670813,10 english_word,139,0.002384669491670813,12 teaching,139,0.002384669491670813,8 identifying,139,0.002384669491670813,11 rapport,139,0.002384669491670813,7 proof,139,0.002384669491670813,5 perceptual,139,0.002384669491670813,10 healthcare,139,0.002384669491670813,10 computational_cost,139,0.002384669491670813,18 balance,139,0.002384669491670813,7 distributional_model,139,0.002384669491670813,20 inflected,139,0.002384669491670813,9 mental_health,139,0.002384669491670813,13 custom,139,0.002384669491670813,6 systmes,138,0.0023675135960472818,7 trivial,138,0.0023675135960472818,7 prefix,138,0.0023675135960472818,6 fair,138,0.0023675135960472818,4 trec,138,0.0023675135960472818,4 svms,138,0.0023675135960472818,4 usable,138,0.0023675135960472818,6 fit,138,0.0023675135960472818,3 pcfg,138,0.0023675135960472818,4 further_analysis,138,0.0023675135960472818,16 stability,138,0.0023675135960472818,9 rhetorical_structure,138,0.0023675135960472818,20 vanilla,138,0.0023675135960472818,7 stem,138,0.0023675135960472818,4 devlin,138,0.0023675135960472818,6 listener,138,0.0023675135960472818,8 copy,137,0.0023503577004237507,4 unstructured_text,137,0.0023503577004237507,17 fraction,137,0.0023503577004237507,8 utilise,137,0.0023503577004237507,7 romanian,137,0.0023503577004237507,8 medical_domain,137,0.0023503577004237507,14 oral,137,0.0023503577004237507,4 street,137,0.0023503577004237507,6 captioning,137,0.0023503577004237507,10 brazilian,137,0.0023503577004237507,9 city,137,0.0023503577004237507,4 other_word,137,0.0023503577004237507,10 main_challenge,137,0.0023503577004237507,14 distributed_representation,137,0.0023503577004237507,26 rule_based_system,137,0.0023503577004237507,17 chinese_language,137,0.0023503577004237507,16 learn,137,0.0023503577004237507,5 previous_model,136,0.0023332018048002195,14 different_source,136,0.0023332018048002195,16 text_simplification,136,0.0023332018048002195,19 complicated,136,0.0023332018048002195,11 authorship,136,0.0023332018048002195,10 opposite,136,0.0023332018048002195,8 morphological_feature,136,0.0023332018048002195,21 reviewer,136,0.0023332018048002195,8 extrinsic_evaluation,136,0.0023332018048002195,20 spoken_language_translation,136,0.0023332018048002195,27 origin,136,0.0023332018048002195,6 semantic_relationship,136,0.0023332018048002195,21 english_chinese,136,0.0023332018048002195,15 sa,136,0.0023332018048002195,2 chinese_text,136,0.0023332018048002195,12 significant_gain,136,0.0023332018048002195,16 combinatory,135,0.0023160459091766884,11 disfluency,135,0.0023160459091766884,10 nlp_research,135,0.0023160459091766884,12 pure,135,0.0023160459091766884,4 similar_language,135,0.0023160459091766884,16 scientist,135,0.0023160459091766884,9 box,135,0.0023160459091766884,3 alternation,135,0.0023160459091766884,11 prone,135,0.0023160459091766884,5 novel_model,135,0.0023160459091766884,11 severe,135,0.0023160459091766884,6 related_task,134,0.0022988900135531573,12 spurious,134,0.0022988900135531573,8 european_language,134,0.0022988900135531573,17 orthography,134,0.0022988900135531573,11 grounded,134,0.0022988900135531573,8 behavioral,134,0.0022988900135531573,10 ca,134,0.0022988900135531573,2 required,134,0.0022988900135531573,8 strong_performance,134,0.0022988900135531573,18 social_science,134,0.0022988900135531573,14 derivational,134,0.0022988900135531573,12 bitext,134,0.0022988900135531573,6 anaphoric,134,0.0022988900135531573,9 novel_task,134,0.0022988900135531573,10 restricted,134,0.0022988900135531573,10 english_sentence,134,0.0022988900135531573,16 vietnamese,134,0.0022988900135531573,10 polysemous,134,0.0022988900135531573,10 medicine,134,0.0022988900135531573,8 anaphora_resolution,133,0.0022817341179296267,19 responsible,133,0.0022817341179296267,11 initialization,133,0.0022817341179296267,14 several_baseline,133,0.0022817341179296267,16 transcribed,133,0.0022817341179296267,11 checking,133,0.0022817341179296267,8 human_human,133,0.0022817341179296267,11 culture,133,0.0022817341179296267,7 proposed,133,0.0022817341179296267,8 harder,133,0.0022817341179296267,6 tches,133,0.0022817341179296267,5 viewpoint,133,0.0022817341179296267,9 first_stage,133,0.0022817341179296267,11 bengali,132,0.0022645782223060956,7 quantifier,132,0.0022645782223060956,10 human_judge,132,0.0022645782223060956,11 lexicale,132,0.0022645782223060956,8 ensemble_model,132,0.0022645782223060956,14 cohesion,132,0.0022645782223060956,8 interview,132,0.0022645782223060956,9 last_year,132,0.0022645782223060956,9 propbank,132,0.0022645782223060956,8 spontaneous_speech,132,0.0022645782223060956,18 acoustic_model,132,0.0022645782223060956,14 informativeness,132,0.0022645782223060956,15 few_year,131,0.0022474223266825645,8 industrial,131,0.0022474223266825645,10 refers,131,0.0022474223266825645,6 cooccurrence,131,0.0022474223266825645,12 cell,131,0.0022474223266825645,4 keyphrase,131,0.0022474223266825645,9 modest,131,0.0022474223266825645,6 brown,131,0.0022474223266825645,5 d'apprentissage,131,0.0022474223266825645,15 human_translator,131,0.0022474223266825645,16 chance,131,0.0022474223266825645,6 adult,131,0.0022474223266825645,5 tone,131,0.0022474223266825645,4 offer,130,0.0022302664310590334,5 example_based,130,0.0022302664310590334,13 obvious,130,0.0022302664310590334,7 individual_word,130,0.0022302664310590334,15 discriminator,130,0.0022302664310590334,13 absolute_improvement,130,0.0022302664310590334,20 handling,130,0.0022302664310590334,8 wall,130,0.0022302664310590334,4 principal,130,0.0022302664310590334,9 imbalance,130,0.0022302664310590334,9 autoregressive,130,0.0022302664310590334,14 concatenation,130,0.0022302664310590334,13 other_type,130,0.0022302664310590334,10 positional,130,0.0022302664310590334,10 french_english,130,0.0022302664310590334,14 lesson,130,0.0022302664310590334,6 valence,130,0.0022302664310590334,7 cat,129,0.0022131105354355023,3 proxy,129,0.0022131105354355023,5 markup,129,0.0022131105354355023,6 face,129,0.0022131105354355023,4 unified_framework,129,0.0022131105354355023,17 general_framework,129,0.0022131105354355023,17 edits,129,0.0022131105354355023,5 live,129,0.0022131105354355023,4 outperform,129,0.0022131105354355023,10 trigram,129,0.0022131105354355023,7 provider,128,0.0021959546398119716,8 consist,128,0.0021959546398119716,7 private,128,0.0021959546398119716,7 discus,128,0.0021959546398119716,6 latent_variable,128,0.0021959546398119716,15 arabic_english,128,0.0021959546398119716,14 aspect_based_sentiment,128,0.0021959546398119716,22 dcrivons,128,0.0021959546398119716,8 significant_difference,128,0.0021959546398119716,22 fuzzy,128,0.0021959546398119716,5 additional_feature,128,0.0021959546398119716,18 travel,128,0.0021959546398119716,6 dimensionality,128,0.0021959546398119716,14 wsj,128,0.0021959546398119716,3 diverse_set,128,0.0021959546398119716,11 beginning,128,0.0021959546398119716,9 supervised_model,127,0.0021787987441884405,16 pre_defined,127,0.0021787987441884405,11 secondary,127,0.0021787987441884405,9 lexical_unit,127,0.0021787987441884405,12 practical_application,127,0.0021787987441884405,21 adversarial_attack,127,0.0021787987441884405,18 multimedia,127,0.0021787987441884405,10 shape,127,0.0021787987441884405,5 log_linear_model,127,0.0021787987441884405,16 indicative,127,0.0021787987441884405,10 chaque,126,0.0021616428485649094,6 ngram,126,0.0021616428485649094,5 better_translation,126,0.0021616428485649094,18 multi_layer,126,0.0021616428485649094,11 temp,126,0.0021616428485649094,4 basque,126,0.0021616428485649094,6 unrelated,126,0.0021616428485649094,9 various_language,126,0.0021616428485649094,16 semantic_frame,126,0.0021616428485649094,14 multi_word_expression,126,0.0021616428485649094,21 broadcast,126,0.0021616428485649094,9 activation,126,0.0021616428485649094,10 necessity,126,0.0021616428485649094,9 approches,126,0.0021616428485649094,9 hope,126,0.0021616428485649094,4 motivated,126,0.0021616428485649094,9 n_gram_model,126,0.0021616428485649094,12 un_systme,125,0.0021444869529413783,9 little_attention,125,0.0021444869529413783,16 expriences,125,0.0021444869529413783,10 adverse,125,0.0021444869529413783,7 discipline,125,0.0021444869529413783,10 default,125,0.0021444869529413783,7 ambiguous_word,125,0.0021444869529413783,14 devlin_et,125,0.0021444869529413783,9 fait,125,0.0021444869529413783,4 unsupervised_word,125,0.0021444869529413783,17 l'extraction,125,0.0021444869529413783,12 weak_supervision,125,0.0021444869529413783,16 compilation,125,0.0021444869529413783,11 human_effort,125,0.0021444869529413783,12 automation,125,0.0021444869529413783,10 player,125,0.0021444869529413783,6 immediate,125,0.0021444869529413783,9 impossible,124,0.002127331057317847,10 public_datasets,124,0.002127331057317847,15 meteor,124,0.002127331057317847,6 computer_assisted,124,0.002127331057317847,17 dont,124,0.002127331057317847,4 package,124,0.002127331057317847,7 open_domain_question,124,0.002127331057317847,20 bakeoff,124,0.002127331057317847,7 bionlp,124,0.002127331057317847,6 single_sentence,124,0.002127331057317847,15 gene,124,0.002127331057317847,4 manipulation,124,0.002127331057317847,12 scientific_article,124,0.002127331057317847,18 devlin_et_al.,124,0.002127331057317847,13 average_precision,124,0.002127331057317847,17 provided,124,0.002127331057317847,8 mesure,124,0.002127331057317847,6 lexique,123,0.002110175161694316,7 context_dependent,123,0.002110175161694316,17 leverage,123,0.002110175161694316,8 selon,123,0.002110175161694316,5 large_datasets,123,0.002110175161694316,14 tagset,123,0.002110175161694316,6 nowadays,123,0.002110175161694316,8 intersection,123,0.002110175161694316,12 conflict,123,0.002110175161694316,8 middle,123,0.002110175161694316,6 cross_lingual_word,123,0.002110175161694316,18 spread,122,0.0020930192660707854,6 low_level,122,0.0020930192660707854,9 subtitle,122,0.0020930192660707854,8 minute,122,0.0020930192660707854,6 empirical_evidence,122,0.0020930192660707854,18 comparable_result,122,0.0020930192660707854,17 domain_independent,122,0.0020930192660707854,18 danish,122,0.0020930192660707854,6 linguistic_property,122,0.0020930192660707854,19 terminological,122,0.0020930192660707854,14 dependence,122,0.0020930192660707854,10 generalizability,122,0.0020930192660707854,16 etc,122,0.0020930192660707854,3 client,122,0.0020930192660707854,6 intrinsic_evaluation,122,0.0020930192660707854,20 segmenter,122,0.0020930192660707854,9 cascade,122,0.0020930192660707854,7 walk,122,0.0020930192660707854,4 coding,122,0.0020930192660707854,6 social_medium_data,122,0.0020930192660707854,18 such_information,122,0.0020930192660707854,16 full_text,122,0.0020930192660707854,9 exponential,122,0.0020930192660707854,11 lors,122,0.0020930192660707854,4 in_depth_analysis,121,0.0020758633704472543,17 surprising,121,0.0020758633704472543,10 cloze,121,0.0020758633704472543,5 microblog,121,0.0020758633704472543,9 tv,121,0.0020758633704472543,2 nmt_system,121,0.0020758633704472543,10 controllable,121,0.0020758633704472543,12 attentive,121,0.0020758633704472543,9 machine_learning,121,0.0020758633704472543,16 emergence,121,0.0020758633704472543,9 recovery,121,0.0020758633704472543,8 generates,121,0.0020758633704472543,9 backbone,121,0.0020758633704472543,8 unlabelled,121,0.0020758633704472543,10 something,121,0.0020758633704472543,9 computational_approach,121,0.0020758633704472543,22 processus,121,0.0020758633704472543,9 problme,121,0.0020758633704472543,7 bien,120,0.002058707474823723,4 fine_tune,120,0.002058707474823723,9 fasttext,120,0.002058707474823723,8 github,120,0.002058707474823723,6 quantification,120,0.002058707474823723,14 supervised_approach,120,0.002058707474823723,19 ontonotes,120,0.002058707474823723,9 d'analyse,120,0.002058707474823723,9 in_domain_data,120,0.002058707474823723,14 selectional_preference,120,0.002058707474823723,22 exhaustive,119,0.002041551579200192,10 united,119,0.002041551579200192,6 main_goal,119,0.002041551579200192,9 spectral,119,0.002041551579200192,8 institution,119,0.002041551579200192,11 simple_approach,119,0.002041551579200192,15 projet,119,0.002041551579200192,6 higher_quality,119,0.002041551579200192,14 multiple_source,119,0.002041551579200192,15 discriminative_model,119,0.002041551579200192,20 dimensional,119,0.002041551579200192,11 prosody,119,0.002041551579200192,7 arabic_language,119,0.002041551579200192,15 notable,119,0.002041551579200192,7 guide,119,0.002041551579200192,5 increased,119,0.002041551579200192,9 aspect_based_sentiment_analysis,119,0.002041551579200192,31 figurative,118,0.002024395683576661,10 scholar,118,0.002024395683576661,7 brain,118,0.002024395683576661,5 higher_order,118,0.002024395683576661,12 internship,118,0.002024395683576661,10 toxic,118,0.002024395683576661,5 syntaxiques,118,0.002024395683576661,11 diverse_language,118,0.002024395683576661,16 command,118,0.002024395683576661,7 hebrew,118,0.002024395683576661,6 salience,118,0.002024395683576661,8 other_approach,118,0.002024395683576661,14 trial,118,0.002024395683576661,5 labor,118,0.002024395683576661,5 unigram,118,0.002024395683576661,7 algorithmic,118,0.002024395683576661,11 pre_trained_transformer,118,0.002024395683576661,23 nous_dcrivons,117,0.00200723978795313,13 localization,117,0.00200723978795313,12 clinical_note,117,0.00200723978795313,13 suitability,117,0.00200723978795313,11 evaluator,117,0.00200723978795313,9 synonymy,117,0.00200723978795313,8 laboratory,117,0.00200723978795313,10 pas,117,0.00200723978795313,3 empirical_analysis,117,0.00200723978795313,18 bidirectional_encoder,117,0.00200723978795313,21 storage,117,0.00200723978795313,7 sum,117,0.00200723978795313,3 categorical,116,0.0019900838923295992,11 transparent,116,0.0019900838923295992,11 splitting,116,0.0019900838923295992,9 d'valuation,116,0.0019900838923295992,11 minor,116,0.0019900838923295992,5 premire,116,0.0019900838923295992,7 speedup,116,0.0019900838923295992,7 niveau,116,0.0019900838923295992,6 selective,116,0.0019900838923295992,9 agglutinative,116,0.0019900838923295992,13 deletion,116,0.0019900838923295992,8 maintenance,116,0.0019900838923295992,11 mask,116,0.0019900838923295992,4 coarse,116,0.0019900838923295992,6 accessibility,116,0.0019900838923295992,13 analytics,116,0.0019900838923295992,9 pointer,116,0.0019900838923295992,7 lexical_database,116,0.0019900838923295992,16 multilingual_language,116,0.0019900838923295992,21 n_best_list,116,0.0019900838923295992,11 held_out,116,0.0019900838923295992,8 determination,116,0.0019900838923295992,13 multi_turn,115,0.001972927996706068,10 quantitative_analysis,115,0.001972927996706068,21 bidirectional_encoder_representation,115,0.001972927996706068,36 under_resourced_language,115,0.001972927996706068,24 plms,115,0.001972927996706068,4 ba,115,0.001972927996706068,2 different_corpus,115,0.001972927996706068,16 familiar,115,0.001972927996706068,8 engagement,115,0.001972927996706068,10 spanish_english,115,0.001972927996706068,15 fonction,115,0.001972927996706068,8 single_document,115,0.001972927996706068,15 bulgarian,115,0.001972927996706068,9 morphological_segmentation,115,0.001972927996706068,26 highlight,115,0.001972927996706068,9 fake_news,115,0.001972927996706068,9 reality,115,0.001972927996706068,7 qe,115,0.001972927996706068,2 bilingual_word,115,0.001972927996706068,14 board,115,0.001972927996706068,5 holistic,115,0.001972927996706068,8 realworld,114,0.001955772101082537,9 meme,114,0.001955772101082537,4 visual_question,114,0.001955772101082537,15 utilizes,114,0.001955772101082537,8 methodological,114,0.001955772101082537,14 address,114,0.001955772101082537,7 facility,114,0.001955772101082537,8 recipe,114,0.001955772101082537,6 domain_adaptation,114,0.001955772101082537,17 most_case,114,0.001955772101082537,9 text_classification_task,114,0.001955772101082537,24 mainstream,114,0.001955772101082537,10 play,114,0.001955772101082537,4 stress,114,0.001955772101082537,6 distinctive,114,0.001955772101082537,11 mt_evaluation,114,0.001955772101082537,13 part_ofspeech,114,0.001955772101082537,13 encoderdecoder,114,0.001955772101082537,14 automatic_summarization,113,0.001938616205459006,23 part_of_speech_tag,113,0.001938616205459006,18 left,113,0.001938616205459006,4 limited_amount,113,0.001938616205459006,14 lexical_knowledge,113,0.001938616205459006,17 underspecified,113,0.001938616205459006,14 nested,113,0.001938616205459006,6 l'valuation,113,0.001938616205459006,11 typed,113,0.001938616205459006,5 rule_based_approach,113,0.001938616205459006,19 month,113,0.001938616205459006,5 human_computer,113,0.001938616205459006,14 car,113,0.001938616205459006,3 natural_language_question,113,0.001938616205459006,25 check,113,0.001938616205459006,5 available_data,113,0.001938616205459006,14 blind,113,0.001938616205459006,5 integral,113,0.001938616205459006,8 large_dataset,113,0.001938616205459006,13 additional_training,113,0.001938616205459006,19 large_scale_corpus,113,0.001938616205459006,18 normalized,112,0.001921460309835475,10 poetry,112,0.001921460309835475,6 java,112,0.001921460309835475,4 low_dimensional,112,0.001921460309835475,15 non_local,112,0.001921460309835475,9 pre_trained_word_embeddings,112,0.001921460309835475,27 contrastive_learning,112,0.001921460309835475,20 japanese_english,112,0.001921460309835475,16 affix,112,0.001921460309835475,5 summarizer,112,0.001921460309835475,10 linear_programming,112,0.001921460309835475,18 mark,112,0.001921460309835475,4 human_machine,112,0.001921460309835475,13 gazetteer,112,0.001921460309835475,9 maximization,111,0.001904304414211944,12 gec,111,0.001904304414211944,3 highquality,111,0.001904304414211944,11 music,111,0.001904304414211944,5 productive,111,0.001904304414211944,10 prcision,111,0.001904304414211944,8 microblogs,111,0.001904304414211944,10 depression,111,0.001904304414211944,10 msa,111,0.001904304414211944,3 lexical_sample,111,0.001904304414211944,14 broad_range,111,0.001904304414211944,11 textual_information,111,0.001904304414211944,19 visual_information,111,0.001904304414211944,18 job,111,0.001904304414211944,3 chinese_treebank,111,0.001904304414211944,16 rst,110,0.0018871485185884128,3 smart,110,0.0018871485185884128,5 lexicales,110,0.0018871485185884128,9 hybrid_model,110,0.0018871485185884128,12 graphical_model,110,0.0018871485185884128,15 key_idea,110,0.0018871485185884128,8 convention,110,0.0018871485185884128,10 expected,110,0.0018871485185884128,8 penalty,110,0.0018871485185884128,7 discontinuous,110,0.0018871485185884128,13 bidirectional_lstm,110,0.0018871485185884128,18 mme,110,0.0018871485185884128,3 ocr,110,0.0018871485185884128,3 pose,110,0.0018871485185884128,4 implement,110,0.0018871485185884128,9 labelled,110,0.0018871485185884128,8 multi_party,110,0.0018871485185884128,11 lexical_entry,110,0.0018871485185884128,13 triplet,110,0.0018871485185884128,7 merit,110,0.0018871485185884128,5 hungarian,110,0.0018871485185884128,9 interlocutor,110,0.0018871485185884128,12 tree_based,110,0.0018871485185884128,10 used,110,0.0018871485185884128,4 real_world_datasets,110,0.0018871485185884128,19 europarl,109,0.001869992622964882,8 unification,109,0.001869992622964882,11 summarisation,109,0.001869992622964882,13 syntactic_parser,109,0.001869992622964882,16 south,109,0.001869992622964882,5 agnostic,109,0.001869992622964882,8 uncertain,109,0.001869992622964882,9 usual,109,0.001869992622964882,5 build,109,0.001869992622964882,5 portal,109,0.001869992622964882,6 prototypical,109,0.001869992622964882,12 mrc,109,0.001869992622964882,3 key_component,109,0.001869992622964882,13 several_method,109,0.001869992622964882,14 utilization,109,0.001869992622964882,11 collective,109,0.001869992622964882,10 arabic_dialect,109,0.001869992622964882,14 linear_model,109,0.001869992622964882,12 upper_bound,109,0.001869992622964882,11 semantic_network,109,0.001869992622964882,16 overall_accuracy,109,0.001869992622964882,16 contextual_word,109,0.001869992622964882,15 termes,109,0.001869992622964882,6 chatbot,109,0.001869992622964882,7 syntactic_annotation,108,0.0018528367273413508,20 portable,108,0.0018528367273413508,8 masked_language_model,108,0.0018528367273413508,21 original_text,108,0.0018528367273413508,13 spoken_language_understanding,108,0.0018528367273413508,29 genetic,108,0.0018528367273413508,7 obtained,108,0.0018528367273413508,8 source_side,108,0.0018528367273413508,11 urdu,108,0.0018528367273413508,4 move,108,0.0018528367273413508,4 scientific_literature,108,0.0018528367273413508,21 anchor,108,0.0018528367273413508,6 viability,108,0.0018528367273413508,9 pour_le,108,0.0018528367273413508,7 new_framework,108,0.0018528367273413508,13 semantic_property,108,0.0018528367273413508,17 unsupervised_model,108,0.0018528367273413508,18 phrasebased,108,0.0018528367273413508,11 monitoring,108,0.0018528367273413508,10 glove,108,0.0018528367273413508,5 low_frequency,107,0.0018356808317178197,13 d'extraction,107,0.0018356808317178197,12 social_medium_post,107,0.0018356808317178197,18 rich_feature,107,0.0018356808317178197,12 alternative_approach,107,0.0018356808317178197,20 model_based,107,0.0018356808317178197,11 representational,107,0.0018356808317178197,16 reliance,107,0.0018356808317178197,8 making,107,0.0018356808317178197,6 ellipsis,107,0.0018356808317178197,8 specific_task,107,0.0018356808317178197,13 current_research,107,0.0018356808317178197,16 part_of_speech_tagger,107,0.0018356808317178197,21 contextual_feature,107,0.0018356808317178197,18 ordinary,107,0.0018356808317178197,8 represent,107,0.0018356808317178197,9 english_tweet,107,0.0018356808317178197,13 lexica,107,0.0018356808317178197,6 pour_la,107,0.0018356808317178197,7 traditional_approach,107,0.0018356808317178197,20 many_case,106,0.0018185249360942889,9 handcrafted,106,0.0018185249360942889,11 syntactic_tree,106,0.0018185249360942889,14 widely_used,106,0.0018185249360942889,11 editing,106,0.0018185249360942889,7 eu,106,0.0018185249360942889,2 bi_lstm,106,0.0018185249360942889,7 marginal,106,0.0018185249360942889,8 human_expert,106,0.0018185249360942889,12 nlp_tool,106,0.0018185249360942889,8 joint_learning,106,0.0018185249360942889,14 pool,106,0.0018185249360942889,4 other_task,106,0.0018185249360942889,10 wall_street,106,0.0018185249360942889,11 temporal_expression,106,0.0018185249360942889,19 working,106,0.0018185249360942889,7 execution,106,0.0018185249360942889,9 interoperability,106,0.0018185249360942889,16 aussi,106,0.0018185249360942889,5 sou,106,0.0018185249360942889,3 visual_feature,106,0.0018185249360942889,14 tree_structure,106,0.0018185249360942889,14 considers,106,0.0018185249360942889,9 ease,106,0.0018185249360942889,4 runtime,106,0.0018185249360942889,7 multi_head,106,0.0018185249360942889,10 parent,106,0.0018185249360942889,6 stock,106,0.0018185249360942889,5 spite,105,0.0018013690404707578,5 rl,105,0.0018013690404707578,2 phrase_based_system,105,0.0018013690404707578,19 locality,105,0.0018013690404707578,8 annotated_dataset,105,0.0018013690404707578,17 acceptability,105,0.0018013690404707578,13 rigorous,105,0.0018013690404707578,8 non_native_speaker,105,0.0018013690404707578,18 idiomatic,105,0.0018013690404707578,9 testbed,105,0.0018013690404707578,7 proximity,105,0.0018013690404707578,9 data_driven_approach,105,0.0018013690404707578,20 new_state,105,0.0018013690404707578,9 neighborhood,105,0.0018013690404707578,12 related_work,105,0.0018013690404707578,12 non_projective,105,0.0018013690404707578,14 ancient,105,0.0018013690404707578,7 aligner,105,0.0018013690404707578,7 quick,105,0.0018013690404707578,5 filling,105,0.0018013690404707578,7 end_toend,105,0.0018013690404707578,9 large_data,105,0.0018013690404707578,10 cnns,105,0.0018013690404707578,4 key_challenge,105,0.0018013690404707578,13 protein,105,0.0018013690404707578,7 sarcastic,105,0.0018013690404707578,9 chatbots,105,0.0018013690404707578,8 souvent,105,0.0018013690404707578,7 l1,105,0.0018013690404707578,2 first_result,105,0.0018013690404707578,12 display,104,0.0017842131448472266,7 server,104,0.0017842131448472266,6 creative_common,104,0.0017842131448472266,15 discourse_level,104,0.0017842131448472266,15 notamment,104,0.0017842131448472266,9 connaissances,104,0.0017842131448472266,13 timeline,104,0.0017842131448472266,8 first_step_towards,104,0.0017842131448472266,18 available_resource,104,0.0017842131448472266,18 zero,104,0.0017842131448472266,4 organisation,104,0.0017842131448472266,12 compatibility,104,0.0017842131448472266,13 moderate,104,0.0017842131448472266,8 adverb,104,0.0017842131448472266,6 text_to_text,104,0.0017842131448472266,12 english_data,104,0.0017842131448472266,12 generality,104,0.0017842131448472266,10 guarantee,104,0.0017842131448472266,9 similar_word,104,0.0017842131448472266,12 other_system,104,0.0017842131448472266,12 relevant_document,103,0.0017670572492236958,17 imbalanced,103,0.0017670572492236958,10 finegrained,103,0.0017670572492236958,11 plot,103,0.0017670572492236958,4 pandemic,103,0.0017670572492236958,8 motion,103,0.0017670572492236958,6 few_shot_learning,103,0.0017670572492236958,17 avenue,103,0.0017670572492236958,6 hidden_state,103,0.0017670572492236958,12 prepositional,103,0.0017670572492236958,13 multilingual_corpus,103,0.0017670572492236958,19 directed,103,0.0017670572492236958,8 removal,103,0.0017670572492236958,7 different_data,103,0.0017670572492236958,14 cross_modal,103,0.0017670572492236958,11 starting,103,0.0017670572492236958,8 text_representation,103,0.0017670572492236958,19 home,103,0.0017670572492236958,4 tt,103,0.0017670572492236958,2 tradition,103,0.0017670572492236958,9 bayesian_model,103,0.0017670572492236958,14 electronic_health,103,0.0017670572492236958,17 phonology,103,0.0017670572492236958,9 competence,103,0.0017670572492236958,10 contain,102,0.0017499013536001647,7 bridge,102,0.0017499013536001647,6 predict,102,0.0017499013536001647,7 inverse,102,0.0017499013536001647,7 computational_complexity,102,0.0017499013536001647,24 neural_network_language,102,0.0017499013536001647,23 electronic_health_record,102,0.0017499013536001647,24 correspond,102,0.0017499013536001647,10 estimator,102,0.0017499013536001647,9 iv,102,0.0017499013536001647,2 lexicon_based,102,0.0017499013536001647,13 cycle,102,0.0017499013536001647,5 heavy,102,0.0017499013536001647,5 double,102,0.0017499013536001647,6 union,102,0.0017499013536001647,5 moment,102,0.0017499013536001647,6 convenient,102,0.0017499013536001647,10 thesis,102,0.0017499013536001647,6 meta_learning,102,0.0017499013536001647,13 multi_source,102,0.0017499013536001647,12 statistical_language,102,0.0017499013536001647,20 statistical_analysis,102,0.0017499013536001647,20 smoothing,102,0.0017499013536001647,9 lexical_substitution,102,0.0017499013536001647,20 sans,102,0.0017499013536001647,4 syntactic_pattern,102,0.0017499013536001647,17 particulier,102,0.0017499013536001647,11 semisupervised,102,0.0017499013536001647,14 tagged,102,0.0017499013536001647,6 large_language,102,0.0017499013536001647,14 une_tche,101,0.0017327454579766338,8 skip_gram,101,0.0017327454579766338,9 singular,101,0.0017327454579766338,8 readable,101,0.0017327454579766338,8 enormous,101,0.0017327454579766338,8 keyphrases,101,0.0017327454579766338,10 nous_intressons,101,0.0017327454579766338,15 small_corpus,101,0.0017327454579766338,12 translate,101,0.0017327454579766338,9 gate,101,0.0017327454579766338,4 data_to_text,101,0.0017327454579766338,12 new_type,101,0.0017327454579766338,8 artifact,101,0.0017327454579766338,8 backtranslation,101,0.0017327454579766338,15 multi_label_classification,101,0.0017327454579766338,26 new_algorithm,101,0.0017327454579766338,13 interval,101,0.0017327454579766338,8 forme,101,0.0017327454579766338,5 tensor,101,0.0017327454579766338,6 intressons,101,0.0017327454579766338,10 text_categorization,101,0.0017327454579766338,19 reproducibility,101,0.0017327454579766338,15 crucial_role,101,0.0017327454579766338,12 english_corpus,101,0.0017327454579766338,14 female,101,0.0017327454579766338,6 endto_end,101,0.0017327454579766338,9 causality,101,0.0017327454579766338,9 array,101,0.0017327454579766338,5 automatic_annotation,101,0.0017327454579766338,20 gated,101,0.0017327454579766338,5 tree_kernel,101,0.0017327454579766338,11 id,101,0.0017327454579766338,2 fundamental_task,101,0.0017327454579766338,16 various_task,100,0.0017155895623531027,12 best_practice,100,0.0017155895623531027,13 curve,100,0.0017155895623531027,5 complex_task,100,0.0017155895623531027,12 open_information,100,0.0017155895623531027,16 correct_answer,100,0.0017155895623531027,14 well_formed,100,0.0017155895623531027,11 enables,100,0.0017155895623531027,7 contextual_embeddings,100,0.0017155895623531027,21 peu,100,0.0017155895623531027,3 ensemble_method,100,0.0017155895623531027,15 extensive_evaluation,100,0.0017155895623531027,20 task_oriented_dialogue_system,100,0.0017155895623531027,29 unreliable,100,0.0017155895623531027,10 open_data,100,0.0017155895623531027,9 princeton,100,0.0017155895623531027,9 reverse,100,0.0017155895623531027,7 tant,100,0.0017155895623531027,4 sentencelevel,100,0.0017155895623531027,13 exists,100,0.0017155895623531027,6 other_model,100,0.0017155895623531027,11 traditional_method,100,0.0017155895623531027,18 mass,100,0.0017155895623531027,4 register,100,0.0017155895623531027,8 bert_model,99,0.0016984336667295716,10 factoid,99,0.0016984336667295716,7 centre,99,0.0016984336667295716,6 semantic_change,99,0.0016984336667295716,15 important_step,99,0.0016984336667295716,14 textual_feature,99,0.0016984336667295716,15 store,99,0.0016984336667295716,5 annotated_training,99,0.0016984336667295716,18 applied,99,0.0016984336667295716,7 exploit,99,0.0016984336667295716,7 smt_system,99,0.0016984336667295716,10 generated_text,99,0.0016984336667295716,14 textual_content,99,0.0016984336667295716,15 typing,99,0.0016984336667295716,6 unsupervised_manner,99,0.0016984336667295716,19 question_answer_pair,99,0.0016984336667295716,20 introduces,99,0.0016984336667295716,10 viterbi,99,0.0016984336667295716,7 agency,99,0.0016984336667295716,6 checker,99,0.0016984336667295716,7 spoken_dialog,99,0.0016984336667295716,13 important_information,99,0.0016984336667295716,21 state_of_art,99,0.0016984336667295716,12 plausibility,99,0.0016984336667295716,12 exposure,99,0.0016984336667295716,8 lexicographic,99,0.0016984336667295716,13 india,99,0.0016984336667295716,5 u.s.,99,0.0016984336667295716,4 cl,99,0.0016984336667295716,2 complex_word,98,0.0016812777711060407,12 open_information_extraction,98,0.0016812777711060407,27 deep_learning_method,98,0.0016812777711060407,20 low_resource_scenario,98,0.0016812777711060407,21 subcategorization,98,0.0016812777711060407,17 trois,98,0.0016812777711060407,5 deficiency,98,0.0016812777711060407,10 informed,98,0.0016812777711060407,8 hindi_english,98,0.0016812777711060407,13 inner,98,0.0016812777711060407,5 statistique,98,0.0016812777711060407,11 structured_prediction,98,0.0016812777711060407,21 budget,98,0.0016812777711060407,6 retrieved,98,0.0016812777711060407,9 comparative_analysis,98,0.0016812777711060407,20 briefly,98,0.0016812777711060407,7 prerequisite,98,0.0016812777711060407,12 new_challenge,98,0.0016812777711060407,13 price,98,0.0016812777711060407,5 croatian,98,0.0016812777711060407,8 important_aspect,98,0.0016812777711060407,16 presented,98,0.0016812777711060407,9 small_scale,98,0.0016812777711060407,11 tuples,98,0.0016812777711060407,6 generalizable,98,0.0016812777711060407,13 prevalence,98,0.0016812777711060407,10 large_scale_dataset,98,0.0016812777711060407,19 important_part,98,0.0016812777711060407,14 declarative,98,0.0016812777711060407,11 rich_set,98,0.0016812777711060407,8 vulnerable,98,0.0016812777711060407,10 semantic_content,98,0.0016812777711060407,16 cependant,98,0.0016812777711060407,9 sentiment_classification,97,0.0016641218754825096,24 different_strategy,97,0.0016641218754825096,18 separation,97,0.0016641218754825096,10 transformer_based_language,97,0.0016641218754825096,26 aforementioned,97,0.0016641218754825096,14 stack,97,0.0016641218754825096,5 second_stage,97,0.0016641218754825096,12 lookup,97,0.0016641218754825096,6 more_data,97,0.0016641218754825096,9 large_language_model,97,0.0016641218754825096,20 different_context,97,0.0016641218754825096,17 food,97,0.0016641218754825096,4 non_linear,97,0.0016641218754825096,10 grammaires,97,0.0016641218754825096,10 focused,97,0.0016641218754825096,7 consiste,97,0.0016641218754825096,8 such_method,97,0.0016641218754825096,11 new_resource,97,0.0016641218754825096,12 ground_truth,97,0.0016641218754825096,12 burden,97,0.0016641218754825096,6 present_work,97,0.0016641218754825096,12 biased,97,0.0016641218754825096,6 nearest_neighbor,97,0.0016641218754825096,16 current_model,97,0.0016641218754825096,13 hashtags,97,0.0016641218754825096,8 black,96,0.0016469659798589785,5 present_experiment,96,0.0016469659798589785,18 user_generated_content,96,0.0016469659798589785,22 malayalam,96,0.0016469659798589785,9 reuse,96,0.0016469659798589785,5 grand,96,0.0016469659798589785,5 british,96,0.0016469659798589785,7 faithful,96,0.0016469659798589785,8 transformer_based_language_model,96,0.0016469659798589785,32 dropout,96,0.0016469659798589785,7 vice,96,0.0016469659798589785,4 isolated,96,0.0016469659798589785,8 percent,96,0.0016469659798589785,7 probe,96,0.0016469659798589785,5 high_degree,96,0.0016469659798589785,11 hyperparameters,96,0.0016469659798589785,15 stimulus,96,0.0016469659798589785,8 semeval_2015,96,0.0016469659798589785,12 chinese_english_translation,96,0.0016469659798589785,27 resource_poor,96,0.0016469659798589785,13 semantic_web,96,0.0016469659798589785,12 gaze,96,0.0016469659798589785,4 geographical,96,0.0016469659798589785,12 analyser,96,0.0016469659798589785,8 regime,96,0.0016469659798589785,6 recent_approach,96,0.0016469659798589785,15 partof_speech,96,0.0016469659798589785,13 tape,96,0.0016469659798589785,4 rare_word,96,0.0016469659798589785,9 professional_translator,96,0.0016469659798589785,23 offensive_language_identification,95,0.0016298100842354476,33 utilized,95,0.0016298100842354476,8 adversarial_example,95,0.0016298100842354476,19 taiwan,95,0.0016298100842354476,6 cloud,95,0.0016298100842354476,5 tradeoff,95,0.0016298100842354476,8 multiple_domain,95,0.0016298100842354476,15 f_scores,95,0.0016298100842354476,8 questionnaire,95,0.0016298100842354476,13 grid,95,0.0016298100842354476,4 l'objectif,95,0.0016298100842354476,10 bart,95,0.0016298100842354476,4 indispensable,95,0.0016298100842354476,13 atomic,95,0.0016298100842354476,6 first_place,95,0.0016298100842354476,11 nave_bayes,95,0.0016298100842354476,10 coordinate,95,0.0016298100842354476,10 filler,95,0.0016298100842354476,6 improved_performance,95,0.0016298100842354476,20 economic,95,0.0016298100842354476,8 trajectory,95,0.0016298100842354476,10 richness,95,0.0016298100842354476,8 future_direction,95,0.0016298100842354476,16 rfrence,95,0.0016298100842354476,7 *_work,95,0.0016298100842354476,6 preliminary_evaluation,95,0.0016298100842354476,22 portability,95,0.0016298100842354476,11 reduced,95,0.0016298100842354476,7 distortion,95,0.0016298100842354476,10 text_corpus,95,0.0016298100842354476,11 novel_feature,95,0.0016298100842354476,13 present_study,95,0.0016298100842354476,13 orthogonal,95,0.0016298100842354476,10 open_ended,95,0.0016298100842354476,10 semantic_resource,95,0.0016298100842354476,17 exception,95,0.0016298100842354476,9 norwegian,95,0.0016298100842354476,9 english_spanish,95,0.0016298100842354476,15 memory_based,95,0.0016298100842354476,12 adapted,95,0.0016298100842354476,7 surprise,95,0.0016298100842354476,8 asian_language,95,0.0016298100842354476,14 d'etection,95,0.0016298100842354476,10 speaking,95,0.0016298100842354476,8 cela,94,0.0016126541886119165,4 dveloppement,94,0.0016126541886119165,12 low_quality,94,0.0016126541886119165,11 thought,94,0.0016126541886119165,7 named_entity_recognition,94,0.0016126541886119165,24 semi_structured,94,0.0016126541886119165,15 differentiable,94,0.0016126541886119165,14 li,94,0.0016126541886119165,2 lexical_semantic,94,0.0016126541886119165,16 brazilian_portuguese,94,0.0016126541886119165,20 curation,94,0.0016126541886119165,8 inductive_bias,94,0.0016126541886119165,14 infrequent,94,0.0016126541886119165,10 naturalness,94,0.0016126541886119165,11 force,94,0.0016126541886119165,5 metaphorical,94,0.0016126541886119165,12 new_evaluation,94,0.0016126541886119165,14 operational,94,0.0016126541886119165,11 understanding_task,94,0.0016126541886119165,18 different_system,94,0.0016126541886119165,16 encouraging_result,94,0.0016126541886119165,18 neural_mt,94,0.0016126541886119165,9 slight,94,0.0016126541886119165,6 china,94,0.0016126541886119165,5 freebase,94,0.0016126541886119165,8 actor,94,0.0016126541886119165,5 irony,94,0.0016126541886119165,5 thai,94,0.0016126541886119165,4 unavailable,94,0.0016126541886119165,11 facet,94,0.0016126541886119165,5 bert_based_model,94,0.0016126541886119165,16 new_benchmark,94,0.0016126541886119165,13 left_to_right,93,0.0015954982929883854,13 rdf,93,0.0015954982929883854,3 softmax,93,0.0015954982929883854,7 ted,93,0.0015954982929883854,3 target_side,93,0.0015954982929883854,11 code_switched,93,0.0015954982929883854,13 pitch,93,0.0015954982929883854,5 such_resource,93,0.0015954982929883854,13 important_problem,93,0.0015954982929883854,17 semantic_interpretation,93,0.0015954982929883854,23 adaptable,93,0.0015954982929883854,9 clarification,93,0.0015954982929883854,13 latent_space,93,0.0015954982929883854,12 apr,93,0.0015954982929883854,3 unambiguous,93,0.0015954982929883854,11 biomedical_literature,93,0.0015954982929883854,21 binary_classifier,93,0.0015954982929883854,17 composite,93,0.0015954982929883854,9 t5,93,0.0015954982929883854,2 statistical_parser,93,0.0015954982929883854,18 harmful,93,0.0015954982929883854,7 accent,93,0.0015954982929883854,6 era,93,0.0015954982929883854,3 transferability,93,0.0015954982929883854,15 current_method,93,0.0015954982929883854,14 several_experiment,93,0.0015954982929883854,18 sort,93,0.0015954982929883854,4 speech_to_speech,92,0.0015783423973648545,16 inefficient,92,0.0015783423973648545,11 grade,92,0.0015783423973648545,5 color,92,0.0015783423973648545,5 ultimate,92,0.0015783423973648545,8 current_work,92,0.0015783423973648545,12 interpolation,92,0.0015783423973648545,13 cross_document,92,0.0015783423973648545,14 contact,92,0.0015783423973648545,7 cross_entropy,92,0.0015783423973648545,13 substitute,92,0.0015783423973648545,10 novel_way,92,0.0015783423973648545,9 various_feature,92,0.0015783423973648545,15 more_attention,92,0.0015783423973648545,14 second_order,92,0.0015783423973648545,12 submitted,92,0.0015783423973648545,9 natural_language_sentence,92,0.0015783423973648545,25 mi,92,0.0015783423973648545,2 several_approach,92,0.0015783423973648545,16 decision_making,92,0.0015783423973648545,15 implemented,92,0.0015783423973648545,11 travaux,91,0.0015611865017413234,7 englishgerman,91,0.0015611865017413234,13 male,91,0.0015611865017413234,4 rhetorical_structure_theory,91,0.0015611865017413234,27 l'apprentissage,91,0.0015611865017413234,15 umls,91,0.0015611865017413234,4 little_work,91,0.0015611865017413234,11 systeme,91,0.0015611865017413234,7 best_performing_model,91,0.0015611865017413234,21 first_approach,91,0.0015611865017413234,14 comparative_evaluation,91,0.0015611865017413234,22 great_success,91,0.0015611865017413234,13 mbert,91,0.0015611865017413234,5 parsed,91,0.0015611865017413234,6 discriminative_training,91,0.0015611865017413234,23 verbnet,91,0.0015611865017413234,7 indication,91,0.0015611865017413234,10 combinatorial,91,0.0015611865017413234,13 utilizing,91,0.0015611865017413234,9 available_datasets,91,0.0015611865017413234,18 linear_time,91,0.0015611865017413234,11 appropriateness,91,0.0015611865017413234,15 dramatic,91,0.0015611865017413234,8 detecting,91,0.0015611865017413234,9 dictionary_based,91,0.0015611865017413234,16 proper_name,91,0.0015611865017413234,11 rte,91,0.0015611865017413234,3 statistical_translation,90,0.0015440306061177923,23 sql,90,0.0015440306061177923,3 race,90,0.0015440306061177923,4 versa,90,0.0015440306061177923,5 counterfactual,90,0.0015440306061177923,14 bleu_score,90,0.0015440306061177923,10 morphological_information,90,0.0015440306061177923,25 hybrid_system,90,0.0015440306061177923,13 post_edited,90,0.0015440306061177923,11 content_selection,90,0.0015440306061177923,17 l'aide,90,0.0015440306061177923,6 geographic,90,0.0015440306061177923,10 important_component,90,0.0015440306061177923,19 real_world_application,90,0.0015440306061177923,22 permettent,90,0.0015440306061177923,10 geometric,90,0.0015440306061177923,9 embedding_based,90,0.0015440306061177923,15 sm,90,0.0015440306061177923,2 cheap,90,0.0015440306061177923,5 lfg,90,0.0015440306061177923,3 huge_amount,90,0.0015440306061177923,11 labeled_training,90,0.0015440306061177923,16 out_of_domain_data,90,0.0015440306061177923,18 same_language,90,0.0015440306061177923,13 dialect_identification,90,0.0015440306061177923,22 doctor,90,0.0015440306061177923,6 available_corpus,90,0.0015440306061177923,16 overhead,90,0.0015440306061177923,8 cognition,90,0.0015440306061177923,9 certaines,90,0.0015440306061177923,9 task_based,90,0.0015440306061177923,10 polynomial,90,0.0015440306061177923,10 semantic_type,90,0.0015440306061177923,13 architectural,90,0.0015440306061177923,13 scholarly,89,0.0015268747104942614,9 sighan,89,0.0015268747104942614,6 grammar_based,89,0.0015268747104942614,13 phrase_level,89,0.0015268747104942614,12 non_expert,89,0.0015268747104942614,10 novel_dataset,89,0.0015268747104942614,13 hypernymy,89,0.0015268747104942614,9 morphological_inflection,89,0.0015268747104942614,24 dravidian,89,0.0015268747104942614,9 propaganda,89,0.0015268747104942614,10 sport,89,0.0015268747104942614,5 large_volume,89,0.0015268747104942614,12 autoencoders,89,0.0015268747104942614,12 abusive_language,89,0.0015268747104942614,16 europe,89,0.0015268747104942614,6 acyclic,89,0.0015268747104942614,7 figurative_language,89,0.0015268747104942614,19 semeval_2014,88,0.0015097188148707303,12 persian,88,0.0015097188148707303,7 unexplored,88,0.0015097188148707303,10 pervasive,88,0.0015097188148707303,9 dedicated,88,0.0015097188148707303,9 tremendous,88,0.0015097188148707303,10 alors,88,0.0015097188148707303,5 same_data,88,0.0015097188148707303,9 preliminary_study,88,0.0015097188148707303,17 _score,88,0.0015097188148707303,6 poor_performance,88,0.0015097188148707303,16 friend,88,0.0015097188148707303,6 many_task,88,0.0015097188148707303,9 realisation,88,0.0015097188148707303,11 added,88,0.0015097188148707303,5 multiple_sentence,88,0.0015097188148707303,17 different_language_pair,88,0.0015097188148707303,23 lexeme,88,0.0015097188148707303,6 resource_rich,88,0.0015097188148707303,13 transparency,88,0.0015097188148707303,12 significant_margin,88,0.0015097188148707303,18 identified,88,0.0015097188148707303,10 caractristiques,88,0.0015097188148707303,15 liu,88,0.0015097188148707303,3 conduct,88,0.0015097188148707303,7 technological,88,0.0015097188148707303,13 non_autoregressive,88,0.0015097188148707303,18 read,87,0.0014925629192471992,4 regular_expression,87,0.0014925629192471992,18 stereotype,87,0.0014925629192471992,10 nlp_community,87,0.0014925629192471992,13 benchmark_datasets,87,0.0014925629192471992,18 chosen,87,0.0014925629192471992,6 biology,87,0.0014925629192471992,7 ngrams,87,0.0014925629192471992,6 xlnet,87,0.0014925629192471992,5 bit,87,0.0014925629192471992,3 english_hindi,87,0.0014925629192471992,13 single_task,87,0.0014925629192471992,11 well_established,87,0.0014925629192471992,16 all_words,87,0.0014925629192471992,9 meta,87,0.0014925629192471992,4 arc,87,0.0014925629192471992,3 automatic_post_editing,87,0.0014925629192471992,22 semantic_graph,87,0.0014925629192471992,14 new_way,87,0.0014925629192471992,7 telugu,87,0.0014925629192471992,6 regional,87,0.0014925629192471992,8 cross_validation,87,0.0014925629192471992,16 disadvantage,87,0.0014925629192471992,12 indonesian,87,0.0014925629192471992,10 couple,87,0.0014925629192471992,6 apprentissage,87,0.0014925629192471992,13 dcrit,86,0.0014754070236236683,5 egyptian,86,0.0014754070236236683,8 commentary,86,0.0014754070236236683,10 medline,86,0.0014754070236236683,7 trust,86,0.0014754070236236683,5 procedural,86,0.0014754070236236683,10 security,86,0.0014754070236236683,8 maximal,86,0.0014754070236236683,7 syntactic_relation,86,0.0014754070236236683,18 load,86,0.0014754070236236683,4 court,86,0.0014754070236236683,5 try,86,0.0014754070236236683,3 long_document,86,0.0014754070236236683,13 multidimensional,86,0.0014754070236236683,16 abstract_meaning,86,0.0014754070236236683,16 eye_tracking,86,0.0014754070236236683,12 multilingual_language_model,86,0.0014754070236236683,27 semantic_category,86,0.0014754070236236683,17 pattern_based,86,0.0014754070236236683,13 additional_data,86,0.0014754070236236683,15 end_to_end_model,86,0.0014754070236236683,16 random_forest,86,0.0014754070236236683,13 faire,86,0.0014754070236236683,5 valency,86,0.0014754070236236683,7 chinese_sentence,86,0.0014754070236236683,16 wiktionary,86,0.0014754070236236683,10 modal,86,0.0014754070236236683,5 layout,86,0.0014754070236236683,6 collected,86,0.0014754070236236683,9 standard_datasets,86,0.0014754070236236683,17 run_time,86,0.0014754070236236683,8 unconstrained,85,0.0014582511280001372,13 standalone,85,0.0014582511280001372,10 cqa,85,0.0014582511280001372,3 multilingual_setting,85,0.0014582511280001372,20 nuanced,85,0.0014582511280001372,7 explosion,85,0.0014582511280001372,9 analytical,85,0.0014582511280001372,10 crowd_sourced,85,0.0014582511280001372,13 constraint_based,85,0.0014582511280001372,16 new_state_of_the_art,85,0.0014582511280001372,20 ungrammatical,85,0.0014582511280001372,13 exact_match,85,0.0014582511280001372,11 indomain,85,0.0014582511280001372,8 stacked,85,0.0014582511280001372,7 learned_representation,85,0.0014582511280001372,22 additive,85,0.0014582511280001372,8 context_information,85,0.0014582511280001372,19 se_meval,85,0.0014582511280001372,8 english_wikipedia,85,0.0014582511280001372,17 first_study,85,0.0014582511280001372,11 recent_progress,85,0.0014582511280001372,15 influential,85,0.0014582511280001372,11 first_work,85,0.0014582511280001372,10 african,85,0.0014582511280001372,7 enterprise,85,0.0014582511280001372,10 nouvelle,85,0.0014582511280001372,8 adverbial,85,0.0014582511280001372,9 genia,85,0.0014582511280001372,5 d'annotation,84,0.0014410952323766061,12 anglais,84,0.0014410952323766061,7 aggregate,84,0.0014410952323766061,9 switchboard,84,0.0014410952323766061,11 pooling,84,0.0014410952323766061,7 medical_text,84,0.0014410952323766061,12 maximum_entropy_model,84,0.0014410952323766061,21 _and,84,0.0014410952323766061,4 emoji,84,0.0014410952323766061,5 high_resource_language,84,0.0014410952323766061,22 vocal,84,0.0014410952323766061,5 computational_method,84,0.0014410952323766061,20 anaphor,84,0.0014410952323766061,7 prague,84,0.0014410952323766061,6 authentic,84,0.0014410952323766061,9 transferable,84,0.0014410952323766061,12 sequence_tosequence,84,0.0014410952323766061,19 transformer_model,84,0.0014410952323766061,17 situated,84,0.0014410952323766061,8 reproducible,84,0.0014410952323766061,12 controversial,84,0.0014410952323766061,13 sigmorphon,84,0.0014410952323766061,10 various_method,84,0.0014410952323766061,14 inadequate,84,0.0014410952323766061,10 sur_le,84,0.0014410952323766061,6 consumption,84,0.0014410952323766061,11 final_system,84,0.0014410952323766061,12 united_state,84,0.0014410952323766061,12 inversion,84,0.0014410952323766061,9 recent_development,84,0.0014410952323766061,18 deep_learning_architecture,84,0.0014410952323766061,26 hand_crafted_feature,83,0.0014239393367530752,20 learnt,83,0.0014239393367530752,6 politics,83,0.0014239393367530752,8 variable_model,83,0.0014239393367530752,14 construire,83,0.0014239393367530752,10 fifth,83,0.0014239393367530752,5 tail,83,0.0014239393367530752,4 maximum_likelihood,83,0.0014239393367530752,18 abuse,83,0.0014239393367530752,5 nombre,83,0.0014239393367530752,6 random_field,83,0.0014239393367530752,12 describe,83,0.0014239393367530752,8 reply,83,0.0014239393367530752,5 vocabulary_size,83,0.0014239393367530752,15 priori,83,0.0014239393367530752,6 linear_regression,83,0.0014239393367530752,17 instructional,83,0.0014239393367530752,13 grammaire,83,0.0014239393367530752,9 linguistic_pattern,83,0.0014239393367530752,18 most_language,83,0.0014239393367530752,13 explanatory,83,0.0014239393367530752,11 late,83,0.0014239393367530752,4 unlabeled_text,83,0.0014239393367530752,14 vise,83,0.0014239393367530752,4 grouping,83,0.0014239393367530752,8 analyseur,83,0.0014239393367530752,9 tractable,83,0.0014239393367530752,9 utiliss,82,0.0014067834411295441,7 membership,82,0.0014067834411295441,10 factored,82,0.0014067834411295441,8 toxicity,82,0.0014067834411295441,8 nd,82,0.0014067834411295441,2 youtube,82,0.0014067834411295441,7 supervised_method,82,0.0014067834411295441,17 vote,82,0.0014067834411295441,4 valuable_resource,82,0.0014067834411295441,17 short_answer,82,0.0014067834411295441,12 textbook,82,0.0014067834411295441,8 arabic_text,82,0.0014067834411295441,11 interpreter,82,0.0014067834411295441,11 reduces,82,0.0014067834411295441,7 partition,82,0.0014067834411295441,9 goal_oriented,82,0.0014067834411295441,13 intractable,82,0.0014067834411295441,11 large_text,82,0.0014067834411295441,10 natural_language_description,82,0.0014067834411295441,28 continuous_space,82,0.0014067834411295441,16 main_idea,82,0.0014067834411295441,9 neural_text,82,0.0014067834411295441,11 homogeneous,82,0.0014067834411295441,11 wall_street_journal,82,0.0014067834411295441,19 lexical_similarity,82,0.0014067834411295441,18 predictive_model,82,0.0014067834411295441,16 later,82,0.0014067834411295441,5 proposed_system,82,0.0014067834411295441,15 deep_learning_approach,82,0.0014067834411295441,22 human_written,82,0.0014067834411295441,13 branch,82,0.0014067834411295441,6 sub_word,82,0.0014067834411295441,8 handful,82,0.0014067834411295441,7 cascaded,82,0.0014067834411295441,8 multi,82,0.0014067834411295441,5 rulebased,82,0.0014067834411295441,9 evaluate,81,0.0013896275455060132,8 interplay,81,0.0013896275455060132,9 template_based,81,0.0013896275455060132,14 cooperative,81,0.0013896275455060132,11 older,81,0.0013896275455060132,5 hospital,81,0.0013896275455060132,8 optimisation,81,0.0013896275455060132,12 telephone,81,0.0013896275455060132,9 siamese,81,0.0013896275455060132,7 factuality,81,0.0013896275455060132,10 feeling,81,0.0013896275455060132,7 ethical,81,0.0013896275455060132,7 omission,81,0.0013896275455060132,8 complex_sentence,81,0.0013896275455060132,16 computing,81,0.0013896275455060132,9 drift,81,0.0013896275455060132,5 forward,81,0.0013896275455060132,7 efficient_algorithm,81,0.0013896275455060132,19 english_translation,81,0.0013896275455060132,19 indigenous,81,0.0013896275455060132,10 specific_language,81,0.0013896275455060132,17 young,81,0.0013896275455060132,5 conversational_speech,81,0.0013896275455060132,21 co_reference,81,0.0013896275455060132,12 well_studied,81,0.0013896275455060132,12 inappropriate,81,0.0013896275455060132,13 free_word,81,0.0013896275455060132,9 recent_success,81,0.0013896275455060132,14 learns,81,0.0013896275455060132,6 kappa,81,0.0013896275455060132,5 embedded,81,0.0013896275455060132,8 explainability,81,0.0013896275455060132,14 experimental_study,80,0.0013724716498824821,18 multiclass,80,0.0013724716498824821,10 analyze,80,0.0013724716498824821,7 micro,80,0.0013724716498824821,5 adjunct,80,0.0013724716498824821,7 subspace,80,0.0013724716498824821,8 phrase_based_model,80,0.0013724716498824821,18 pre_trained_bert,80,0.0013724716498824821,16 consortium,80,0.0013724716498824821,10 wang,80,0.0013724716498824821,4 ressource,80,0.0013724716498824821,9 contextual_representation,80,0.0013724716498824821,25 parallel_training,80,0.0013724716498824821,17 state_ofthe_art_performance,80,0.0013724716498824821,27 s'emantique,80,0.0013724716498824821,11 heritage,80,0.0013724716498824821,8 xlm_roberta,80,0.0013724716498824821,11 l'approche,80,0.0013724716498824821,10 hoc,80,0.0013724716498824821,3 visual_question_answering,80,0.0013724716498824821,25 feature_rich,80,0.0013724716498824821,12 treat,80,0.0013724716498824821,5 valuons,80,0.0013724716498824821,7 ingredient,80,0.0013724716498824821,10 energy,80,0.0013724716498824821,6 word_net,80,0.0013724716498824821,8 well_defined,80,0.0013724716498824821,12 creative_common_attribution,80,0.0013724716498824821,27 preferred,80,0.0013724716498824821,9 misinformation,80,0.0013724716498824821,14 human_rating,80,0.0013724716498824821,12 reveal,80,0.0013724716498824821,6 inspiration,80,0.0013724716498824821,11 visualisation,79,0.001355315754258951,13 achievement,79,0.001355315754258951,11 significant_progress,79,0.001355315754258951,20 vast_amount,79,0.001355315754258951,11 low_resourced,79,0.001355315754258951,13 cross_lingual_information,79,0.001355315754258951,25 residual,79,0.001355315754258951,8 best_performing_system,79,0.001355315754258951,22 free_word_order,79,0.001355315754258951,15 donc,79,0.001355315754258951,4 favor,79,0.001355315754258951,5 discourse_structure,79,0.001355315754258951,19 state_of_the,79,0.001355315754258951,12 repetitive,79,0.001355315754258951,10 extensive_analysis,79,0.001355315754258951,18 merging,79,0.001355315754258951,7 native_language_identification,79,0.001355315754258951,30 reporting,79,0.001355315754258951,9 clip,79,0.001355315754258951,4 open_question,79,0.001355315754258951,13 automatic_acquisition,79,0.001355315754258951,21 round,79,0.001355315754258951,5 such_task,79,0.001355315754258951,9 prsent,79,0.001355315754258951,6 pdtb,79,0.001355315754258951,4 on_going,79,0.001355315754258951,8 permutation,79,0.001355315754258951,11 scaling,79,0.001355315754258951,7 penn_discourse,79,0.001355315754258951,14 absa,79,0.001355315754258951,4 perceived,79,0.001355315754258951,9 alphabet,79,0.001355315754258951,8 nouveau,79,0.001355315754258951,7 automatic_analysis,78,0.0013381598586354201,18 specific_feature,78,0.0013381598586354201,16 outline,78,0.0013381598586354201,7 target_language,78,0.0013381598586354201,15 sarcasm_detection,78,0.0013381598586354201,17 unexpected,78,0.0013381598586354201,10 lexico_syntactic,78,0.0013381598586354201,16 rewriting,78,0.0013381598586354201,9 um,78,0.0013381598586354201,2 reprsentations,78,0.0013381598586354201,14 learnable,78,0.0013381598586354201,9 supervised_training,78,0.0013381598586354201,19 fairness,78,0.0013381598586354201,8 various_aspect,78,0.0013381598586354201,14 tedious,78,0.0013381598586354201,7 wikidata,78,0.0013381598586354201,8 human_subject,78,0.0013381598586354201,13 transitive,78,0.0013381598586354201,10 significant_challenge,78,0.0013381598586354201,21 relative_error,78,0.0013381598586354201,14 edinburgh,78,0.0013381598586354201,9 quantitative_evaluation,78,0.0013381598586354201,23 attentional,78,0.0013381598586354201,11 contribute,78,0.0013381598586354201,10 fiction,78,0.0013381598586354201,7 linguistic_theory,78,0.0013381598586354201,17 cover,78,0.0013381598586354201,5 impressive_performance,77,0.001321003963011889,22 lexicalization,77,0.001321003963011889,14 real_user,77,0.001321003963011889,9 semeval_2013,77,0.001321003963011889,12 estonian,77,0.001321003963011889,8 adapter,77,0.001321003963011889,7 bigger,77,0.001321003963011889,6 official_evaluation,77,0.001321003963011889,19 quelques,77,0.001321003963011889,8 probing,77,0.001321003963011889,7 analytic,77,0.001321003963011889,8 multinomial,77,0.001321003963011889,11 sequenceto_sequence,77,0.001321003963011889,19 sen,77,0.001321003963011889,3 gru,77,0.001321003963011889,3 normalisation,77,0.001321003963011889,13 proceeding,77,0.001321003963011889,10 differential,77,0.001321003963011889,12 important_feature,77,0.001321003963011889,17 iso,77,0.001321003963011889,3 notation,77,0.001321003963011889,8 narrow,77,0.001321003963011889,6 other_feature,77,0.001321003963011889,13 retrieval_based,77,0.001321003963011889,15 nuance,77,0.001321003963011889,6 task_oriented_dialog,77,0.001321003963011889,20 computational_resource,77,0.001321003963011889,22 rich_morphology,77,0.001321003963011889,15 multilayer,77,0.001321003963011889,10 final_model,77,0.001321003963011889,11 expressiveness,77,0.001321003963011889,14 topological,77,0.001321003963011889,11 co_training,77,0.001321003963011889,11 interdisciplinary,77,0.001321003963011889,17 contradiction,77,0.001321003963011889,13 first_one,77,0.001321003963011889,9 several_type,77,0.001321003963011889,12 different_genre,77,0.001321003963011889,15 select,77,0.001321003963011889,6 standard_benchmark,77,0.001321003963011889,18 easy_to_use,77,0.001321003963011889,11 out_of_vocabulary_word,76,0.001303848067388358,22 department,76,0.001303848067388358,10 faithfulness,76,0.001303848067388358,12 subtrees,76,0.001303848067388358,8 rd,76,0.001303848067388358,2 pointwise,76,0.001303848067388358,9 adjustment,76,0.001303848067388358,10 utilisation,76,0.001303848067388358,11 cross_language_information,76,0.001303848067388358,26 cancer,76,0.001303848067388358,6 various_kind,76,0.001303848067388358,12 simultaneous_translation,76,0.001303848067388358,24 different_translation,76,0.001303848067388358,21 wmt14,76,0.001303848067388358,5 slu,76,0.001303848067388358,3 formalization,76,0.001303848067388358,13 consonant,76,0.001303848067388358,9 global_context,76,0.001303848067388358,14 previous_system,76,0.001303848067388358,15 national_corpus,76,0.001303848067388358,15 semeval_2010,76,0.001303848067388358,12 quadratic,76,0.001303848067388358,9 simple_model,76,0.001303848067388358,12 aggressive,76,0.001303848067388358,10 medication,76,0.001303848067388358,10 d'amliorer,76,0.001303848067388358,10 comprehensive_experiment,76,0.001303848067388358,24 encoder_decoder_model,76,0.001303848067388358,21 poem,76,0.001303848067388358,4 solver,76,0.001303848067388358,6 nlg_system,76,0.001303848067388358,10 weakly_supervised,76,0.001303848067388358,17 language_agnostic,76,0.001303848067388358,17 beam_search,76,0.001303848067388358,11 qualit,76,0.001303848067388358,6 appearance,76,0.001303848067388358,10 ebmt,76,0.001303848067388358,4 synonymous,76,0.001303848067388358,10 last_decade,76,0.001303848067388358,11 relaxation,76,0.001303848067388358,10 imperfect,76,0.001303848067388358,9 adapt,76,0.001303848067388358,5 inaccurate,76,0.001303848067388358,10 instantiation,76,0.001303848067388358,13 chinese_corpus,76,0.001303848067388358,14 fact_checking,76,0.001303848067388358,13 consecutive,76,0.001303848067388358,11 strong_result,76,0.001303848067388358,13 binary_classification_task,76,0.001303848067388358,26 determiner,76,0.001303848067388358,10 return,76,0.001303848067388358,6 standard_evaluation,76,0.001303848067388358,19 lr,76,0.001303848067388358,2 higher_performance,76,0.001303848067388358,18 marking,76,0.001303848067388358,7 grammatical_relation,76,0.001303848067388358,20 spearman,75,0.001286692171764827,8 une_analyse,75,0.001286692171764827,11 mood,75,0.001286692171764827,4 tac,75,0.001286692171764827,3 semantic_processing,75,0.001286692171764827,19 macro_averaged,75,0.001286692171764827,14 current_system,75,0.001286692171764827,14 primitive,75,0.001286692171764827,9 second_step,75,0.001286692171764827,11 route,75,0.001286692171764827,5 unbalanced,75,0.001286692171764827,10 applies,75,0.001286692171764827,7 gpu,75,0.001286692171764827,3 refined,75,0.001286692171764827,7 ed,75,0.001286692171764827,2 allows,75,0.001286692171764827,6 duc,75,0.001286692171764827,3 ape,75,0.001286692171764827,3 wmt19,75,0.001286692171764827,5 complex_question,75,0.001286692171764827,16 noisy_data,75,0.001286692171764827,10 online_review,75,0.001286692171764827,13 invariant,75,0.001286692171764827,9 most_work,75,0.001286692171764827,9 pronominal,75,0.001286692171764827,10 assertion,75,0.001286692171764827,9 canada,75,0.001286692171764827,6 example_based_machine_translation,75,0.001286692171764827,33 international_workshop,75,0.001286692171764827,22 particulirement,75,0.001286692171764827,15 suboptimal,75,0.001286692171764827,10 optimized,75,0.001286692171764827,9 gnration,75,0.001286692171764827,8 current_study,75,0.001286692171764827,13 historical_text,74,0.001269536276141296,15 lexical_sample_task,74,0.001269536276141296,19 apparent,74,0.001269536276141296,8 average_accuracy,74,0.001269536276141296,16 advent,74,0.001269536276141296,6 utilis,74,0.001269536276141296,6 suggested,74,0.001269536276141296,9 projective,74,0.001269536276141296,10 lexicographer,74,0.001269536276141296,13 loop,74,0.001269536276141296,4 speech_to_speech_translation,74,0.001269536276141296,28 contextualized_word,74,0.001269536276141296,19 acceptance,74,0.001269536276141296,10 surprisal,74,0.001269536276141296,9 related_word,74,0.001269536276141296,12 colloquial,74,0.001269536276141296,10 passive,74,0.001269536276141296,7 prepositional_phrase,74,0.001269536276141296,20 programme,74,0.001269536276141296,9 multilingual_word,74,0.001269536276141296,17 wat,74,0.001269536276141296,3 final_result,74,0.001269536276141296,12 d'informations,74,0.001269536276141296,14 same_meaning,74,0.001269536276141296,12 sketch,74,0.001269536276141296,6 noisy_channel,74,0.001269536276141296,13 zeroshot,74,0.001269536276141296,8 new_annotation,74,0.001269536276141296,14 context_based,74,0.001269536276141296,13 literary_text,74,0.001269536276141296,13 example_based_machine,74,0.001269536276141296,21 threat,74,0.001269536276141296,6 qa_system,74,0.001269536276141296,9 romance,74,0.001269536276141296,7 similar_performance,74,0.001269536276141296,19 good_quality,74,0.001269536276141296,12 state_of_the_art_accuracy,74,0.001269536276141296,25 retriever,74,0.001269536276141296,9 limited_data,74,0.001269536276141296,12 equation,74,0.001269536276141296,8 processor,74,0.001269536276141296,9 resumo,74,0.001269536276141296,6 c'est,74,0.001269536276141296,5 pause,74,0.001269536276141296,5 non_parallel,74,0.001269536276141296,12 formality,73,0.0012523803805177649,9 domaines,73,0.0012523803805177649,8 pedagogical,73,0.0012523803805177649,11 academia,73,0.0012523803805177649,8 user_interface,73,0.0012523803805177649,14 online_discussion,73,0.0012523803805177649,17 l'identification,73,0.0012523803805177649,16 benchmarking,73,0.0012523803805177649,12 multiple_datasets,73,0.0012523803805177649,17 inexpensive,73,0.0012523803805177649,11 english_speaker,73,0.0012523803805177649,15 encyclopedia,73,0.0012523803805177649,12 integral_part,73,0.0012523803805177649,13 expense,73,0.0012523803805177649,7 statistical_parsing,73,0.0012523803805177649,19 new_datasets,73,0.0012523803805177649,12 ensuite,73,0.0012523803805177649,7 violation,73,0.0012523803805177649,9 suicide,73,0.0012523803805177649,7 syntactic_category,73,0.0012523803805177649,18 predictive_power,73,0.0012523803805177649,16 propositional,73,0.0012523803805177649,13 same_domain,73,0.0012523803805177649,11 psycholinguistics,73,0.0012523803805177649,17 comprhension,73,0.0012523803805177649,12 overall_quality,73,0.0012523803805177649,15 outil,73,0.0012523803805177649,5 annotated_training_data,73,0.0012523803805177649,23 semantic_meaning,73,0.0012523803805177649,16 detailed_description,73,0.0012523803805177649,20 scientific_publication,73,0.0012523803805177649,22 societal,73,0.0012523803805177649,8 investment,73,0.0012523803805177649,10 high_dimensional,73,0.0012523803805177649,16 multiple_task,73,0.0012523803805177649,13 transformerbased,73,0.0012523803805177649,16 definite,73,0.0012523803805177649,8 deviation,73,0.0012523803805177649,9 el,73,0.0012523803805177649,2 gigaword,73,0.0012523803805177649,8 emergent,73,0.0012523803805177649,8 abstract_meaning_representation,73,0.0012523803805177649,31 semantic_level,73,0.0012523803805177649,14 non_parametric,73,0.0012523803805177649,14 l'annotation,73,0.0012523803805177649,12 naturalistic,72,0.001235224484894234,12 statistiques,72,0.001235224484894234,12 information_theoretic,72,0.001235224484894234,21 internal_structure,72,0.001235224484894234,18 nl,72,0.001235224484894234,2 n_gram_feature,72,0.001235224484894234,14 sanskrit,72,0.001235224484894234,8 rule_based_machine,72,0.001235224484894234,18 anger,72,0.001235224484894234,5 english_japanese,72,0.001235224484894234,16 semantic_classification,72,0.001235224484894234,23 optional,72,0.001235224484894234,8 syntactic_knowledge,72,0.001235224484894234,19 cognitive_science,72,0.001235224484894234,17 chinese_to_english_translation,72,0.001235224484894234,30 stateof_the_art_performance,72,0.001235224484894234,27 special_case,72,0.001235224484894234,12 ainsi_que,72,0.001235224484894234,9 hotel,72,0.001235224484894234,5 clinical_domain,72,0.001235224484894234,15 near,72,0.001235224484894234,4 travers,72,0.001235224484894234,7 clir,72,0.001235224484894234,4 boundary_detection,72,0.001235224484894234,18 key_role,72,0.001235224484894234,8 puis,72,0.001235224484894234,4 neural_sequence,72,0.001235224484894234,15 nonparametric,72,0.001235224484894234,13 user_friendly,72,0.001235224484894234,13 york,72,0.001235224484894234,4 new_york,72,0.001235224484894234,8 generalisation,72,0.001235224484894234,14 large_quantity,72,0.001235224484894234,14 such_approach,72,0.001235224484894234,13 masking,72,0.001235224484894234,7 partie,72,0.001235224484894234,6 predominant,72,0.001235224484894234,11 progressive,72,0.001235224484894234,11 dbpedia,72,0.001235224484894234,7 proliferation,72,0.001235224484894234,13 early_stage,72,0.001235224484894234,11 initial_experiment,72,0.001235224484894234,18 smm4h,72,0.001235224484894234,5 pro,72,0.001235224484894234,3 textual_description,72,0.001235224484894234,19 spoken_dialog_system,72,0.001235224484894234,20 xlm_r,72,0.001235224484894234,5 zero_shot_setting,72,0.001235224484894234,17 negative_example,71,0.0012180685892707029,16 transition_based_dependency,71,0.0012180685892707029,27 supplementary,71,0.0012180685892707029,13 variational_autoencoder,71,0.0012180685892707029,23 text_analysis,71,0.0012180685892707029,13 math,71,0.0012180685892707029,4 state_ofthe_art_result,71,0.0012180685892707029,22 associative,71,0.0012180685892707029,11 signature,71,0.0012180685892707029,9 k_means,71,0.0012180685892707029,7 dnn,71,0.0012180685892707029,3 surge,71,0.0012180685892707029,5 asymmetric,71,0.0012180685892707029,10 second_place,71,0.0012180685892707029,12 predictable,71,0.0012180685892707029,11 lexical_choice,71,0.0012180685892707029,14 local_feature,71,0.0012180685892707029,13 persuasive,71,0.0012180685892707029,10 wmt16,71,0.0012180685892707029,5 multilingual_translation,71,0.0012180685892707029,24 promising_performance,71,0.0012180685892707029,21 entits,71,0.0012180685892707029,6 elicitation,71,0.0012180685892707029,11 men,71,0.0012180685892707029,3 limited_training,71,0.0012180685892707029,16 human_robot,71,0.0012180685892707029,11 feed_forward,71,0.0012180685892707029,12 wordlevel,71,0.0012180685892707029,9 bilingual_lexicon_induction,71,0.0012180685892707029,27 different_machine,71,0.0012180685892707029,17 supervised_system,71,0.0012180685892707029,17 ilp,71,0.0012180685892707029,3 text_normalization,71,0.0012180685892707029,18 official_test,71,0.0012180685892707029,13 mix,71,0.0012180685892707029,3 shift_reduce,71,0.0012180685892707029,12 bilingual_data,71,0.0012180685892707029,14 descent,71,0.0012180685892707029,7 comparaison,71,0.0012180685892707029,11 anonymous,71,0.0012180685892707029,9 landscape,71,0.0012180685892707029,9 humorous,71,0.0012180685892707029,8 imitation,71,0.0012180685892707029,9 syntactic_representation,71,0.0012180685892707029,24 spell,71,0.0012180685892707029,5 manuellement,71,0.0012180685892707029,12 recommender,71,0.0012180685892707029,11 linguistic_research,71,0.0012180685892707029,19 suggest,71,0.0012180685892707029,7 state_of_theart_performance,71,0.0012180685892707029,27 rapid_development,71,0.0012180685892707029,17 multilingue,71,0.0012180685892707029,11 various_domain,71,0.0012180685892707029,14 second_approach,71,0.0012180685892707029,15 abstractive_summary,71,0.0012180685892707029,19 reusable,70,0.0012009126936471718,8 single_language,70,0.0012009126936471718,15 transition_based_parser,70,0.0012009126936471718,23 cooperation,70,0.0012009126936471718,11 automatic_approach,70,0.0012009126936471718,18 pre_existing,70,0.0012009126936471718,12 word_aligned,70,0.0012009126936471718,12 novel_algorithm,70,0.0012009126936471718,15 japan,70,0.0012009126936471718,5 multiple_choice_question,70,0.0012009126936471718,24 classroom,70,0.0012009126936471718,9 high_frequency,70,0.0012009126936471718,14 full_sentence,70,0.0012009126936471718,13 accordance,70,0.0012009126936471718,10 minimization,70,0.0012009126936471718,12 practical_use,70,0.0012009126936471718,13 justification,70,0.0012009126936471718,13 latent_representation,70,0.0012009126936471718,21 automatic_system,70,0.0012009126936471718,16 noun_compound,70,0.0012009126936471718,13 circumstance,70,0.0012009126936471718,12 crisis,70,0.0012009126936471718,6 tudions,70,0.0012009126936471718,7 digital_humanity,70,0.0012009126936471718,16 understandable,70,0.0012009126936471718,14 syntactical,70,0.0012009126936471718,11 ranker,70,0.0012009126936471718,6 past_work,70,0.0012009126936471718,9 low_cost,70,0.0012009126936471718,8 enfin,70,0.0012009126936471718,5 indo_european,70,0.0012009126936471718,13 bible,70,0.0012009126936471718,5 rule_based_method,70,0.0012009126936471718,17 comparons,70,0.0012009126936471718,9 pp,70,0.0012009126936471718,2 competitor,70,0.0012009126936471718,10 require,70,0.0012009126936471718,7 slavic,70,0.0012009126936471718,6 atis,70,0.0012009126936471718,4 code_mixing,70,0.0012009126936471718,11 joint_training,70,0.0012009126936471718,14 derived,70,0.0012009126936471718,7 nlp_pipeline,70,0.0012009126936471718,12 web_scale,70,0.0012009126936471718,9 gf,69,0.0011837567980236409,2 man,69,0.0011837567980236409,3 limited_number,69,0.0011837567980236409,14 unseen_word,69,0.0011837567980236409,11 distant_language,69,0.0011837567980236409,16 solid,69,0.0011837567980236409,5 data_to_text_generation,69,0.0011837567980236409,23 constitution,69,0.0011837567980236409,12 several_model,69,0.0011837567980236409,13 joint_inference,69,0.0011837567980236409,15 conversational_system,69,0.0011837567980236409,21 corpus_based_approach,69,0.0011837567980236409,21 impressive_result,69,0.0011837567980236409,17 fonde,69,0.0011837567980236409,5 dravidian_language,69,0.0011837567980236409,18 human_reference,69,0.0011837567980236409,15 semi_supervised_approach,69,0.0011837567980236409,24 lexical_simplification,69,0.0011837567980236409,22 natural_question,69,0.0011837567980236409,16 exemple,69,0.0011837567980236409,7 specialist,69,0.0011837567980236409,10 current_state_of_the_art,69,0.0011837567980236409,24 various_way,69,0.0011837567980236409,11 clinician,69,0.0011837567980236409,9 shortage,69,0.0011837567980236409,8 nous_prsentons_dans,69,0.0011837567980236409,19 real_data,69,0.0011837567980236409,9 disparate,69,0.0011837567980236409,9 vqa,69,0.0011837567980236409,3 unsupervised_system,69,0.0011837567980236409,19 first_experiment,69,0.0011837567980236409,16 considerable_improvement,69,0.0011837567980236409,24 safety,69,0.0011837567980236409,6 main_task,69,0.0011837567980236409,9 efficient_method,69,0.0011837567980236409,16 mise,69,0.0011837567980236409,4 rule_based_machine_translation,69,0.0011837567980236409,30 b.,69,0.0011837567980236409,2 utilises,68,0.0011666009024001098,8 summarizers,68,0.0011666009024001098,11 human_language_technology,68,0.0011666009024001098,25 semantic_vector,68,0.0011666009024001098,15 daily_life,68,0.0011666009024001098,10 rgles,68,0.0011666009024001098,5 text_only,68,0.0011666009024001098,9 wikipedia_article,68,0.0011666009024001098,17 ad_hoc,68,0.0011666009024001098,6 large_improvement,68,0.0011666009024001098,17 manual_effort,68,0.0011666009024001098,13 a.,68,0.0011666009024001098,2 plural,68,0.0011666009024001098,6 traditional_machine,68,0.0011666009024001098,19 rsum,68,0.0011666009024001098,4 hierarchical_model,68,0.0011666009024001098,18 interlingua,68,0.0011666009024001098,11 unigrams,68,0.0011666009024001098,8 week,68,0.0011666009024001098,4 amliorer,68,0.0011666009024001098,8 impairment,68,0.0011666009024001098,10 veracity,68,0.0011666009024001098,8 other_baseline,68,0.0011666009024001098,14 preprocessing_step,68,0.0011666009024001098,18 dozen,68,0.0011666009024001098,5 web_page,68,0.0011666009024001098,8 enriched,68,0.0011666009024001098,8 sub_optimal,68,0.0011666009024001098,11 para,68,0.0011666009024001098,4 human_generated,68,0.0011666009024001098,15 grapheme_to_phoneme,68,0.0011666009024001098,19 important_research,68,0.0011666009024001098,18 strong_correlation,68,0.0011666009024001098,18 en_de,68,0.0011666009024001098,5 lsa,68,0.0011666009024001098,3 unlabeled_corpus,68,0.0011666009024001098,16 germanenglish,68,0.0011666009024001098,13 north,68,0.0011666009024001098,5 more_language,68,0.0011666009024001098,13 abundance,68,0.0011666009024001098,9 d'autres,68,0.0011666009024001098,8 sd,68,0.0011666009024001098,2 dsambigusation,68,0.0011666009024001098,14 facial,68,0.0011666009024001098,6 absent,68,0.0011666009024001098,6 initial_result,68,0.0011666009024001098,14 versatile,68,0.0011666009024001098,9 phonemic,68,0.0011666009024001098,8 une_valuation,67,0.0011494450067765787,13 tight,67,0.0011494450067765787,5 implicit_discourse,67,0.0011494450067765787,18 footprint,67,0.0011494450067765787,9 semeval_2007,67,0.0011494450067765787,12 significant_performance_improvement,67,0.0011494450067765787,35 descriptor,67,0.0011494450067765787,10 vardial,67,0.0011494450067765787,7 chapter,67,0.0011494450067765787,7 different_part,67,0.0011494450067765787,14 lowest,67,0.0011494450067765787,6 studied,67,0.0011494450067765787,7 pubmed,67,0.0011494450067765787,6 multi_sentence,67,0.0011494450067765787,14 new_technique,67,0.0011494450067765787,13 persona,67,0.0011494450067765787,7 valuable_information,67,0.0011494450067765787,20 recursion,67,0.0011494450067765787,9 strongest,67,0.0011494450067765787,9 large_text_corpus,67,0.0011494450067765787,17 specific_information,67,0.0011494450067765787,20 instructor,67,0.0011494450067765787,10 neural_based,67,0.0011494450067765787,12 speech_translation,67,0.0011494450067765787,18 user_feedback,67,0.0011494450067765787,13 multiwoz,67,0.0011494450067765787,8 chemical,67,0.0011494450067765787,8 observable,67,0.0011494450067765787,10 l'information,67,0.0011494450067765787,13 deception,67,0.0011494450067765787,9 different_modality,67,0.0011494450067765787,18 align,67,0.0011494450067765787,5 spcifiques,67,0.0011494450067765787,10 reported,67,0.0011494450067765787,8 environmental,67,0.0011494450067765787,13 statistical_language_model,67,0.0011494450067765787,26 new_information,67,0.0011494450067765787,15 college,67,0.0011494450067765787,7 grande,66,0.0011322891111530478,6 outside,66,0.0011322891111530478,7 wmt20,66,0.0011322891111530478,5 two_level,66,0.0011322891111530478,9 linguistic_expression,66,0.0011322891111530478,21 previous_result,66,0.0011322891111530478,15 effet,66,0.0011322891111530478,5 office,66,0.0011322891111530478,6 hot,66,0.0011322891111530478,3 open_source_software,66,0.0011322891111530478,20 tracker,66,0.0011322891111530478,7 nous_valuons,66,0.0011322891111530478,12 url,66,0.0011322891111530478,3 worth,66,0.0011322891111530478,5 lstm_based,66,0.0011322891111530478,10 shortest,66,0.0011322891111530478,8 factoid_question,66,0.0011322891111530478,16 browser,66,0.0011322891111530478,7 division,66,0.0011322891111530478,8 various_approach,66,0.0011322891111530478,16 catalan,66,0.0011322891111530478,7 grce,66,0.0011322891111530478,4 potential_application,66,0.0011322891111530478,21 gaussian_mixture,66,0.0011322891111530478,16 structural_feature,66,0.0011322891111530478,18 interlingual,66,0.0011322891111530478,12 natural_language_interface,66,0.0011322891111530478,26 semantic_composition,66,0.0011322891111530478,20 supervised_machine_learning,66,0.0011322891111530478,27 common_approach,66,0.0011322891111530478,15 victim,66,0.0011322891111530478,6 latent_topic,66,0.0011322891111530478,12 song,66,0.0011322891111530478,4 intelligibility,66,0.0011322891111530478,15 ltag,66,0.0011322891111530478,4 manuscript,66,0.0011322891111530478,10 authorship_attribution,66,0.0011322891111530478,22 long_sentence,66,0.0011322891111530478,13 medical_record,66,0.0011322891111530478,14 fear,66,0.0011322891111530478,4 lens,66,0.0011322891111530478,4 nous_tudions,66,0.0011322891111530478,12 automatic_construction,66,0.0011322891111530478,22 giza++,66,0.0011322891111530478,6 public_health,66,0.0011322891111530478,13 discourse_representation,66,0.0011322891111530478,24 unstable,66,0.0011322891111530478,8 le_corpus,66,0.0011322891111530478,9 monolingual_model,66,0.0011322891111530478,17 neural_method,66,0.0011322891111530478,13 undesirable,66,0.0011322891111530478,11 optical,66,0.0011322891111530478,7 prospect,66,0.0011322891111530478,8 possible_solution,66,0.0011322891111530478,17 such_feature,66,0.0011322891111530478,12 fmeasure,66,0.0011322891111530478,8 contextualized_representation,66,0.0011322891111530478,29 unique_challenge,65,0.0011151332155295167,16 commonality,65,0.0011151332155295167,11 maximum_entropy_classifier,65,0.0011151332155295167,26 great_deal,65,0.0011151332155295167,10 parliament,65,0.0011151332155295167,10 agglutinative_language,65,0.0011151332155295167,22 same_topic,65,0.0011151332155295167,10 high_coverage,65,0.0011151332155295167,13 ligne,65,0.0011151332155295167,5 previous_state,65,0.0011151332155295167,14 dvelopp,65,0.0011151332155295167,7 rich_source,65,0.0011151332155295167,11 content_based,65,0.0011151332155295167,13 multidocument,65,0.0011151332155295167,13 press,65,0.0011151332155295167,5 much_work,65,0.0011151332155295167,9 automatic_word,65,0.0011151332155295167,14 qualitative_evaluation,65,0.0011151332155295167,22 customization,65,0.0011151332155295167,13 adjective_noun,65,0.0011151332155295167,14 open_domain_dialogue,65,0.0011151332155295167,20 developmental,65,0.0011151332155295167,13 exam,65,0.0011151332155295167,4 rational,65,0.0011151332155295167,8 pitfall,65,0.0011151332155295167,7 available_online,65,0.0011151332155295167,16 tabular,65,0.0011151332155295167,7 n'est,65,0.0011151332155295167,5 interact,65,0.0011151332155295167,8 labeled_training_data,65,0.0011151332155295167,21 continuation,65,0.0011151332155295167,12 personal_name,65,0.0011151332155295167,13 source_language,65,0.0011151332155295167,15 relative_clause,65,0.0011151332155295167,15 multi_head_attention,65,0.0011151332155295167,20 acronym,65,0.0011151332155295167,7 specified,65,0.0011151332155295167,9 contenu,65,0.0011151332155295167,7 optimum,65,0.0011151332155295167,7 intermediate_representation,65,0.0011151332155295167,27 complex_language,65,0.0011151332155295167,16 yahoo,65,0.0011151332155295167,5 ted_talk,65,0.0011151332155295167,8 various_level,65,0.0011151332155295167,13 global_information,65,0.0011151332155295167,18 different_setting,65,0.0011151332155295167,17 such_corpus,65,0.0011151332155295167,11 aspect_term,65,0.0011151332155295167,11 user_utterance,65,0.0011151332155295167,14 long_text,65,0.0011151332155295167,9 online_news,65,0.0011151332155295167,11 choix,65,0.0011151332155295167,5 zero_shot_learning,64,0.0010979773199059858,18 pre_trained_embeddings,64,0.0010979773199059858,22 automatic_recognition,64,0.0010979773199059858,21 fewer_parameter,64,0.0010979773199059858,15 bot,64,0.0010979773199059858,3 available_training,64,0.0010979773199059858,18 dissemination,64,0.0010979773199059858,13 qu'il,64,0.0010979773199059858,5 long_tail,64,0.0010979773199059858,9 distributional_representation,64,0.0010979773199059858,29 specific_type,64,0.0010979773199059858,13 vast_majority,64,0.0010979773199059858,13 cross_lingual_word_embeddings,64,0.0010979773199059858,29 hmms,64,0.0010979773199059858,4 important_factor,64,0.0010979773199059858,16 macro_f1,64,0.0010979773199059858,8 white,64,0.0010979773199059858,5 election,64,0.0010979773199059858,8 catastrophic,64,0.0010979773199059858,12 divergent,64,0.0010979773199059858,9 repair,64,0.0010979773199059858,6 polynomial_time,64,0.0010979773199059858,15 tree_adjoining,64,0.0010979773199059858,14 optical_character,64,0.0010979773199059858,17 volunteer,64,0.0010979773199059858,9 bpe,64,0.0010979773199059858,3 neural_system,64,0.0010979773199059858,13 phrase_based_smt_system,64,0.0010979773199059858,23 trick,64,0.0010979773199059858,5 standard_approach,64,0.0010979773199059858,17 compositional_semantics,64,0.0010979773199059858,23 joy,64,0.0010979773199059858,3 semi_supervised_method,64,0.0010979773199059858,22 inspection,64,0.0010979773199059858,10 utilisons,64,0.0010979773199059858,9 reformulation,64,0.0010979773199059858,13 nous_utilisons,64,0.0010979773199059858,14 impractical,64,0.0010979773199059858,11 human_user,64,0.0010979773199059858,10 permis,64,0.0010979773199059858,6 finance,64,0.0010979773199059858,7 sentiment_lexicon,64,0.0010979773199059858,17 lexico_semantic,64,0.0010979773199059858,15 concreteness,64,0.0010979773199059858,12 hateful,64,0.0010979773199059858,7 higher_correlation,64,0.0010979773199059858,18 freedom,64,0.0010979773199059858,7 adverse_drug,64,0.0010979773199059858,12 cws,64,0.0010979773199059858,3 resource_poor_language,64,0.0010979773199059858,22 contributes,64,0.0010979773199059858,11 dissimilar,64,0.0010979773199059858,10 sein,64,0.0010979773199059858,4 multilingual_text,64,0.0010979773199059858,17 cfg,64,0.0010979773199059858,3 different_technique,64,0.0010979773199059858,19 jeu,64,0.0010979773199059858,3 heart,64,0.0010979773199059858,5 relaxed,64,0.0010979773199059858,7 multi_dimensional,63,0.0010808214242824547,17 arithmetic,63,0.0010808214242824547,10 levenshtein,63,0.0010808214242824547,11 hierarchical_attention,63,0.0010808214242824547,22 conception,63,0.0010808214242824547,10 dictionnaire,63,0.0010808214242824547,12 variational_inference,63,0.0010808214242824547,21 feed,63,0.0010808214242824547,4 html,63,0.0010808214242824547,4 networking,63,0.0010808214242824547,10 grammatical_structure,63,0.0010808214242824547,21 common_practice,63,0.0010808214242824547,15 que_le,63,0.0010808214242824547,6 formal_language,63,0.0010808214242824547,15 john,63,0.0010808214242824547,4 montre,63,0.0010808214242824547,6 wealth,63,0.0010808214242824547,6 lyric,63,0.0010808214242824547,5 albert,63,0.0010808214242824547,6 customized,63,0.0010808214242824547,10 analogous,63,0.0010808214242824547,9 more_information,63,0.0010808214242824547,16 toolkits,63,0.0010808214242824547,8 empathy,63,0.0010808214242824547,7 many_study,63,0.0010808214242824547,10 successive,63,0.0010808214242824547,10 annotated_data,63,0.0010808214242824547,14 profiling,63,0.0010808214242824547,9 calibration,63,0.0010808214242824547,11 ontology_based,63,0.0010808214242824547,14 multi_step,63,0.0010808214242824547,10 genuine,63,0.0010808214242824547,7 hallucination,63,0.0010808214242824547,13 d'obtenir,63,0.0010808214242824547,9 opendomain,63,0.0010808214242824547,10 penn_discourse_treebank,63,0.0010808214242824547,23 indic,63,0.0010808214242824547,5 journalist,63,0.0010808214242824547,10 few_shot_setting,63,0.0010808214242824547,16 rbmt,63,0.0010808214242824547,4 best_translation,63,0.0010808214242824547,16 fall,63,0.0010808214242824547,4 machine_readable,63,0.0010808214242824547,16 contextualized_embeddings,63,0.0010808214242824547,25 campagne,63,0.0010808214242824547,8 senseval_2,63,0.0010808214242824547,10 encode,63,0.0010808214242824547,6 mail,63,0.0010808214242824547,4 detect,63,0.0010808214242824547,6 unlikely,63,0.0010808214242824547,8 meet,63,0.0010808214242824547,4 less_resourced,63,0.0010808214242824547,14 labeler,63,0.0010808214242824547,7 closed_track,63,0.0010808214242824547,12 disability,63,0.0010808214242824547,10 japanese_language,62,0.0010636655286589236,17 conditional_probability,62,0.0010636655286589236,23 neural_network_approach,62,0.0010636655286589236,23 fidelity,62,0.0010636655286589236,8 end_to_end_system,62,0.0010636655286589236,17 d'entits,62,0.0010636655286589236,8 different_combination,62,0.0010636655286589236,21 graphic,62,0.0010636655286589236,7 taxonomic,62,0.0010636655286589236,9 morphologique,62,0.0010636655286589236,13 adversarial_network,62,0.0010636655286589236,19 fever,62,0.0010636655286589236,5 peer,62,0.0010636655286589236,4 calcul,62,0.0010636655286589236,6 linear_classifier,62,0.0010636655286589236,17 text_to_sql,62,0.0010636655286589236,11 different_granularity,62,0.0010636655286589236,21 noisy_text,62,0.0010636655286589236,10 specialised,62,0.0010636655286589236,11 ptb,62,0.0010636655286589236,3 fscore,62,0.0010636655286589236,6 lexical_complexity,62,0.0010636655286589236,18 substring,62,0.0010636655286589236,9 vague,62,0.0010636655286589236,5 licence,62,0.0010636655286589236,7 longitudinal,62,0.0010636655286589236,12 turn_taking,62,0.0010636655286589236,11 healthy,62,0.0010636655286589236,7 taskspecific,62,0.0010636655286589236,12 uas,62,0.0010636655286589236,3 continual,62,0.0010636655286589236,9 imperative,62,0.0010636655286589236,10 vector_space,62,0.0010636655286589236,12 involvement,62,0.0010636655286589236,11 effective_feature,62,0.0010636655286589236,17 text_document,62,0.0010636655286589236,13 stateof_the_art_result,62,0.0010636655286589236,22 nlp_researcher,62,0.0010636655286589236,14 same_task,62,0.0010636655286589236,9 le_attention,62,0.0010636655286589236,12 exemplar,62,0.0010636655286589236,8 large_model,62,0.0010636655286589236,11 offense,62,0.0010636655286589236,7 fine_grained_entity,62,0.0010636655286589236,19 new_system,62,0.0010636655286589236,10 full_use,62,0.0010636655286589236,8 localisation,62,0.0010636655286589236,12 sadness,62,0.0010636655286589236,7 tree_structured,62,0.0010636655286589236,15 unseen_data,62,0.0010636655286589236,11 senseval_3,62,0.0010636655286589236,10 systematic_study,62,0.0010636655286589236,16 conventional_method,62,0.0010636655286589236,19 adversarial_learning,62,0.0010636655286589236,20 relative_error_reduction,62,0.0010636655286589236,24 end_user,62,0.0010636655286589236,8 paired,62,0.0010636655286589236,6 well,62,0.0010636655286589236,4 f1_measure,62,0.0010636655286589236,10 forgetting,62,0.0010636655286589236,10 unnecessary,62,0.0010636655286589236,11 multi_view,62,0.0010636655286589236,10 disponibles,61,0.0010465096330353927,11 illness,61,0.0010465096330353927,7 semantic_unit,61,0.0010465096330353927,13 correct_translation,61,0.0010465096330353927,19 differ,61,0.0010465096330353927,6 monolingual_text,61,0.0010465096330353927,16 noun_noun,61,0.0010465096330353927,9 cpu,61,0.0010465096330353927,3 open_problem,61,0.0010465096330353927,12 significant_amount,61,0.0010465096330353927,18 light_verb,61,0.0010465096330353927,10 infeasible,61,0.0010465096330353927,10 out_ofdomain,61,0.0010465096330353927,12 distributional_information,61,0.0010465096330353927,26 wild,61,0.0010465096330353927,4 someone,61,0.0010465096330353927,7 leurs,61,0.0010465096330353927,5 user_generated_text,61,0.0010465096330353927,19 deceptive,61,0.0010465096330353927,9 keyboard,61,0.0010465096330353927,8 second_language_learner,61,0.0010465096330353927,23 algorithme,61,0.0010465096330353927,10 advice,61,0.0010465096330353927,6 regardless,61,0.0010465096330353927,10 mesures,61,0.0010465096330353927,7 symmetric,61,0.0010465096330353927,9 described,61,0.0010465096330353927,9 cleaning,61,0.0010465096330353927,8 deft,61,0.0010465096330353927,4 raters,61,0.0010465096330353927,6 con,61,0.0010465096330353927,3 tree_adjoining_grammar,61,0.0010465096330353927,22 annot,61,0.0010465096330353927,5 framing,61,0.0010465096330353927,7 offensive_language_detection,61,0.0010465096330353927,28 state_of_theart_result,61,0.0010465096330353927,22 similarity_based,61,0.0010465096330353927,16 neural_word,61,0.0010465096330353927,11 final_submission,61,0.0010465096330353927,16 recognizers,61,0.0010465096330353927,11 disaster,61,0.0010465096330353927,8 automatiques,61,0.0010465096330353927,12 lexical_relation,61,0.0010465096330353927,16 annual,61,0.0010465096330353927,6 suffer,61,0.0010465096330353927,6 mert,61,0.0010465096330353927,4 optical_character_recognition,61,0.0010465096330353927,29 carlo,61,0.0010465096330353927,5 real_world_scenario,61,0.0010465096330353927,19 emoticon,61,0.0010465096330353927,8 l'tude,61,0.0010465096330353927,6 harm,61,0.0010465096330353927,4 such_knowledge,61,0.0010465096330353927,14 animal,61,0.0010465096330353927,6 certain_type,61,0.0010465096330353927,12 trace,61,0.0010465096330353927,5 scientific_document,61,0.0010465096330353927,19 documentlevel,61,0.0010465096330353927,13 anthology,61,0.0010465096330353927,9 updated,61,0.0010465096330353927,7 reranker,61,0.0010465096330353927,8 encyclopedic,61,0.0010465096330353927,12 interannotator,60,0.0010293537374118616,14 computational_linguist,60,0.0010293537374118616,22 driven,60,0.0010293537374118616,6 gibbs,60,0.0010293537374118616,5 overt,60,0.0010293537374118616,5 mobile_device,60,0.0010293537374118616,13 human_level,60,0.0010293537374118616,11 c.,60,0.0010293537374118616,2 mitigation,60,0.0010293537374118616,10 acoustic_feature,60,0.0010293537374118616,16 empty,60,0.0010293537374118616,5 different_meaning,60,0.0010293537374118616,17 model_agnostic,60,0.0010293537374118616,14 basic_idea,60,0.0010293537374118616,10 maxent,60,0.0010293537374118616,6 backward,60,0.0010293537374118616,8 different_text,60,0.0010293537374118616,14 best_accuracy,60,0.0010293537374118616,13 weaker,60,0.0010293537374118616,6 machine_generated,60,0.0010293537374118616,17 main_focus,60,0.0010293537374118616,10 opensource,60,0.0010293537374118616,10 adversary,60,0.0010293537374118616,9 long_range_dependency,60,0.0010293537374118616,21 cosine_similarity,60,0.0010293537374118616,17 positive_result,60,0.0010293537374118616,15 expressive_power,60,0.0010293537374118616,16 alternate,60,0.0010293537374118616,9 neighbour,60,0.0010293537374118616,9 large_scale_datasets,60,0.0010293537374118616,20 scientific_text,60,0.0010293537374118616,15 paradigmatic,60,0.0010293537374118616,12 light_weight,60,0.0010293537374118616,12 multiple_document,60,0.0010293537374118616,17 such_language,60,0.0010293537374118616,13 several_technique,60,0.0010293537374118616,17 thinking,60,0.0010293537374118616,8 small_training,60,0.0010293537374118616,14 pronoun_resolution,60,0.0010293537374118616,18 cross_language_information_retrieval,60,0.0010293537374118616,36 additional_training_data,60,0.0010293537374118616,24 physician,60,0.0010293537374118616,9 inflected_form,60,0.0010293537374118616,14 instant,60,0.0010293537374118616,7 ongoing_work,60,0.0010293537374118616,12 f1_scores,60,0.0010293537374118616,9 important_issue,60,0.0010293537374118616,15 unimodal,60,0.0010293537374118616,8 pbsmt,60,0.0010293537374118616,5 antonym,60,0.0010293537374118616,7 informational,60,0.0010293537374118616,13 subjective_evaluation,60,0.0010293537374118616,21 ibm_model,60,0.0010293537374118616,9 syntactic_complexity,60,0.0010293537374118616,20 promising_approach,60,0.0010293537374118616,18 pagerank,60,0.0010293537374118616,8 inquiry,60,0.0010293537374118616,7 offenseval,60,0.0010293537374118616,10 uk,60,0.0010293537374118616,2 subsequence,60,0.0010293537374118616,11 similar_result,59,0.0010121978417883305,14 pertinence,59,0.0010121978417883305,10 idiosyncratic,59,0.0010121978417883305,13 in_house,59,0.0010121978417883305,8 new_perspective,59,0.0010121978417883305,15 stop,59,0.0010121978417883305,4 various_model,59,0.0010121978417883305,13 misspelling,59,0.0010121978417883305,11 experimental_setting,59,0.0010121978417883305,20 web_interface,59,0.0010121978417883305,13 code_mixed_text,59,0.0010121978417883305,15 diver,59,0.0010121978417883305,5 better_model,59,0.0010121978417883305,12 completeness,59,0.0010121978417883305,12 unsupervised_machine,59,0.0010121978417883305,20 instrument,59,0.0010121978417883305,10 mtl,59,0.0010121978417883305,3 subtree,59,0.0010121978417883305,7 resource_rich_language,59,0.0010121978417883305,22 unchanged,59,0.0010121978417883305,9 restoration,59,0.0010121978417883305,11 cf,59,0.0010121978417883305,2 east,59,0.0010121978417883305,4 non_linguistic,59,0.0010121978417883305,14 urgent,59,0.0010121978417883305,6 fly,59,0.0010121978417883305,3 different_degree,59,0.0010121978417883305,16 official_result,59,0.0010121978417883305,15 new_insight,59,0.0010121978417883305,11 discourse_analysis,59,0.0010121978417883305,18 creativecommons.orglicensesby4.0,59,0.0010121978417883305,32 sr,59,0.0010121978417883305,2 proof_of_concept,59,0.0010121978417883305,16 theorem,59,0.0010121978417883305,7 icelandic,59,0.0010121978417883305,9 cross_sentence,59,0.0010121978417883305,14 grant,59,0.0010121978417883305,5 machine_translated,59,0.0010121978417883305,18 state_of_the_art_machine,59,0.0010121978417883305,24 embodied,59,0.0010121978417883305,8 slection,59,0.0010121978417883305,8 nothing,59,0.0010121978417883305,7 experimental_setup,59,0.0010121978417883305,18 inability,59,0.0010121978417883305,9 acyclic_graph,59,0.0010121978417883305,13 submitted_system,59,0.0010121978417883305,16 ineffective,59,0.0010121978417883305,11 inferred,59,0.0010121978417883305,8 several_task,59,0.0010121978417883305,12 proprits,59,0.0010121978417883305,8 elegant,59,0.0010121978417883305,7 transductive,59,0.0010121978417883305,12 priority,59,0.0010121978417883305,8 radiology,59,0.0010121978417883305,9 topic_based,58,0.0009950419461647996,11 syntactic_property,58,0.0009950419461647996,18 novice,58,0.0009950419461647996,6 unified_model,58,0.0009950419461647996,13 multi_stage,58,0.0009950419461647996,11 slang,58,0.0009950419461647996,5 lexical_level,58,0.0009950419461647996,13 standard_test,58,0.0009950419461647996,13 combinaison,58,0.0009950419461647996,11 disjoint,58,0.0009950419461647996,8 non_english_language,58,0.0009950419461647996,20 syntactic_construction,58,0.0009950419461647996,22 content_word,58,0.0009950419461647996,12 comprehensive_evaluation,58,0.0009950419461647996,24 implicit_discourse_relation,58,0.0009950419461647996,27 gnralement,58,0.0009950419461647996,10 computational_analysis,58,0.0009950419461647996,22 past_decade,58,0.0009950419461647996,11 relative_importance,58,0.0009950419461647996,19 outstanding,58,0.0009950419461647996,11 monte,58,0.0009950419461647996,5 top_performing,58,0.0009950419461647996,14 understand,58,0.0009950419461647996,10 nous_comparons,58,0.0009950419461647996,14 linear_chain,58,0.0009950419461647996,12 key_feature,58,0.0009950419461647996,11 japanese_to_english,58,0.0009950419461647996,19 several_way,58,0.0009950419461647996,11 topology,58,0.0009950419461647996,8 taiwanese,58,0.0009950419461647996,9 scalar,58,0.0009950419461647996,6 neural_translation,58,0.0009950419461647996,18 ici,58,0.0009950419461647996,3 le_traitement,58,0.0009950419461647996,13 subwords,58,0.0009950419461647996,8 mr,58,0.0009950419461647996,2 human_assessment,58,0.0009950419461647996,16 linguistically_motivated,58,0.0009950419461647996,24 human_intervention,58,0.0009950419461647996,18 politician,58,0.0009950419461647996,10 authoring,58,0.0009950419461647996,9 constructed,58,0.0009950419461647996,11 click,58,0.0009950419461647996,5 rewrite,58,0.0009950419461647996,7 hyperparameter,58,0.0009950419461647996,14 generated_summary,58,0.0009950419461647996,17 aspect_level,58,0.0009950419461647996,12 different_set,58,0.0009950419461647996,13 unsupervised_fashion,58,0.0009950419461647996,20 cible,58,0.0009950419461647996,5 text_similarity,58,0.0009950419461647996,15 terme,58,0.0009950419461647996,5 long_standing,58,0.0009950419461647996,13 shallow_parsing,58,0.0009950419461647996,15 superficial,58,0.0009950419461647996,11 semantic_task,58,0.0009950419461647996,13 rseau,58,0.0009950419461647996,5 different_annotation,58,0.0009950419461647996,20 small_subset,58,0.0009950419461647996,12 span_based,58,0.0009950419461647996,10 aggression,58,0.0009950419461647996,10 interpersonal,58,0.0009950419461647996,13 geometry,58,0.0009950419461647996,8 lie,58,0.0009950419461647996,3 arabe,58,0.0009950419461647996,5 wisdom,58,0.0009950419461647996,6 simple_baseline,58,0.0009950419461647996,15 babelnet,58,0.0009950419461647996,8 similar_task,58,0.0009950419461647996,12 postediting,58,0.0009950419461647996,11 next_step,58,0.0009950419461647996,9 speech_to_text,57,0.0009778860505412685,14 lexicography,57,0.0009778860505412685,12 sub,57,0.0009778860505412685,3 human_evaluator,57,0.0009778860505412685,15 soit,57,0.0009778860505412685,4 diacritic,57,0.0009778860505412685,9 macro_f1_score,57,0.0009778860505412685,14 semeval_2015_task,57,0.0009778860505412685,17 datadriven,57,0.0009778860505412685,10 textual_inference,57,0.0009778860505412685,17 efficient_way,57,0.0009778860505412685,13 boosting,57,0.0009778860505412685,8 theoretic,57,0.0009778860505412685,9 same_entity,57,0.0009778860505412685,11 utilisant_de,57,0.0009778860505412685,12 unsupervised_domain_adaptation,57,0.0009778860505412685,30 unsupervised_domain,57,0.0009778860505412685,19 stateof_the_art_method,57,0.0009778860505412685,22 certainty,57,0.0009778860505412685,9 opinionated,57,0.0009778860505412685,11 graded,57,0.0009778860505412685,6 collins,57,0.0009778860505412685,7 noticeable,57,0.0009778860505412685,10 several_machine,57,0.0009778860505412685,15 better_accuracy,57,0.0009778860505412685,15 annotated_datasets,57,0.0009778860505412685,18 placement,57,0.0009778860505412685,9 different_evaluation,57,0.0009778860505412685,20 limited_training_data,57,0.0009778860505412685,21 natural_language_query,57,0.0009778860505412685,22 credibility,57,0.0009778860505412685,11 long_time,57,0.0009778860505412685,9 pivot_language,57,0.0009778860505412685,14 collocational,57,0.0009778860505412685,13 modlisation,57,0.0009778860505412685,11 chineseenglish,57,0.0009778860505412685,14 discours,57,0.0009778860505412685,8 hidden_layer,57,0.0009778860505412685,12 authority,57,0.0009778860505412685,9 modularity,57,0.0009778860505412685,10 same_word,57,0.0009778860505412685,9 linkage,57,0.0009778860505412685,7 highest_accuracy,57,0.0009778860505412685,16 less_resourced_language,57,0.0009778860505412685,23 moderation,57,0.0009778860505412685,10 supervised_classification,57,0.0009778860505412685,25 cohesive,57,0.0009778860505412685,8 speculation,57,0.0009778860505412685,11 fois,57,0.0009778860505412685,4 semantic_lexicon,57,0.0009778860505412685,16 higher_precision,57,0.0009778860505412685,16 ready,57,0.0009778860505412685,5 l'anglais,57,0.0009778860505412685,9 class_based,57,0.0009778860505412685,11 linguistic_unit,57,0.0009778860505412685,15 esl,57,0.0009778860505412685,3 naturel,57,0.0009778860505412685,7 joint_modeling,57,0.0009778860505412685,14 taux,56,0.0009607301549177375,4 multiple_level,56,0.0009607301549177375,14 irish,56,0.0009607301549177375,5 automated_system,56,0.0009607301549177375,16 reciprocal,56,0.0009607301549177375,10 multiparty,56,0.0009607301549177375,10 closest,56,0.0009607301549177375,7 positive_impact,56,0.0009607301549177375,15 grading,56,0.0009607301549177375,7 importante,56,0.0009607301549177375,10 technical_term,56,0.0009607301549177375,14 alignment_model,56,0.0009607301549177375,15 consuming,56,0.0009607301549177375,9 clarity,56,0.0009607301549177375,7 corporate,56,0.0009607301549177375,9 baseline_model,56,0.0009607301549177375,14 great_potential,56,0.0009607301549177375,15 reinforcement_learning,56,0.0009607301549177375,22 strategic,56,0.0009607301549177375,9 contour,56,0.0009607301549177375,7 detected,56,0.0009607301549177375,8 follow_up,56,0.0009607301549177375,9 user_query,56,0.0009607301549177375,10 geolocation,56,0.0009607301549177375,11 eleven,56,0.0009607301549177375,6 directional,56,0.0009607301549177375,11 bilingual_word_embeddings,56,0.0009607301549177375,25 transitivity,56,0.0009607301549177375,12 new_sentence,56,0.0009607301549177375,12 vertex,56,0.0009607301549177375,6 generated_question,56,0.0009607301549177375,18 emotional_state,56,0.0009607301549177375,15 neural_sequence_to_sequence,56,0.0009607301549177375,27 effective_use,56,0.0009607301549177375,13 tels,56,0.0009607301549177375,4 snli,56,0.0009607301549177375,4 statistical_technique,56,0.0009607301549177375,21 browsing,56,0.0009607301549177375,8 interoperable,56,0.0009607301549177375,13 user_satisfaction,56,0.0009607301549177375,17 regulation,56,0.0009607301549177375,10 first_model,56,0.0009607301549177375,11 available_dataset,56,0.0009607301549177375,17 continuous_speech,56,0.0009607301549177375,17 calculus,56,0.0009607301549177375,8 main_feature,56,0.0009607301549177375,12 nontrivial,56,0.0009607301549177375,10 svm_based,56,0.0009607301549177375,9 german_language,56,0.0009607301549177375,15 et_al,56,0.0009607301549177375,5 generated_sentence,56,0.0009607301549177375,18 formal_semantics,56,0.0009607301549177375,16 sociolinguistic,56,0.0009607301549177375,15 human_computer_interaction,56,0.0009607301549177375,26 original_model,56,0.0009607301549177375,14 new_training,56,0.0009607301549177375,12 high_recall,56,0.0009607301549177375,11 electronic_dictionary,56,0.0009607301549177375,21 several_study,56,0.0009607301549177375,13 marathi,56,0.0009607301549177375,7 kong,56,0.0009607301549177375,4 longest,56,0.0009607301549177375,7 parallelism,56,0.0009607301549177375,11 crf_based,56,0.0009607301549177375,9 ordinal,56,0.0009607301549177375,7 este,56,0.0009607301549177375,4 d'autre,56,0.0009607301549177375,7 biggest,56,0.0009607301549177375,7 serbian,56,0.0009607301549177375,7 word_sense,55,0.0009435742592942064,10 contributor,55,0.0009435742592942064,11 high_cost,55,0.0009435742592942064,9 crowd_sourcing,55,0.0009435742592942064,14 hit,55,0.0009435742592942064,3 lingual,55,0.0009435742592942064,7 sub_sentential,55,0.0009435742592942064,14 avoir,55,0.0009435742592942064,5 natural_language_task,55,0.0009435742592942064,21 asymmetry,55,0.0009435742592942064,9 certains,55,0.0009435742592942064,8 advertisement,55,0.0009435742592942064,13 red,55,0.0009435742592942064,3 log_likelihood,55,0.0009435742592942064,14 languageindependent,55,0.0009435742592942064,19 new_research,55,0.0009435742592942064,12 adaptability,55,0.0009435742592942064,12 expressivity,55,0.0009435742592942064,12 dominance,55,0.0009435742592942064,9 optimality,55,0.0009435742592942064,10 hong,55,0.0009435742592942064,4 rnn_based,55,0.0009435742592942064,9 hint,55,0.0009435742592942064,4 van,55,0.0009435742592942064,3 reach,55,0.0009435742592942064,5 bilingual_parallel,55,0.0009435742592942064,18 interference,55,0.0009435742592942064,12 peculiarity,55,0.0009435742592942064,11 first_language,55,0.0009435742592942064,14 compute,55,0.0009435742592942064,7 linguistic_rule,55,0.0009435742592942064,15 tat,55,0.0009435742592942064,3 quantization,55,0.0009435742592942064,12 papier,55,0.0009435742592942064,6 indo_european_language,55,0.0009435742592942064,22 syntactic_constraint,55,0.0009435742592942064,20 pipelined,55,0.0009435742592942064,9 query_expansion,55,0.0009435742592942064,15 moyen,55,0.0009435742592942064,5 non_projective_dependency,55,0.0009435742592942064,25 general_approach,55,0.0009435742592942064,16 open_source_toolkit,55,0.0009435742592942064,19 drawn,55,0.0009435742592942064,5 continuum,55,0.0009435742592942064,9 random_walk,55,0.0009435742592942064,11 mlm,55,0.0009435742592942064,3 favorable,55,0.0009435742592942064,9 graph_based_approach,55,0.0009435742592942064,20 overall_system,55,0.0009435742592942064,14 recent_effort,55,0.0009435742592942064,13 hardware,55,0.0009435742592942064,8 earlier_work,55,0.0009435742592942064,12 neuron,55,0.0009435742592942064,6 applique,55,0.0009435742592942064,8 different_category,55,0.0009435742592942064,18 single_system,55,0.0009435742592942064,13 short_paper,55,0.0009435742592942064,11 genetic_algorithm,55,0.0009435742592942064,17 laptop,55,0.0009435742592942064,6 empirical_comparison,55,0.0009435742592942064,20 whole_sentence,55,0.0009435742592942064,14 kernel_based,55,0.0009435742592942064,12 subgraph,55,0.0009435742592942064,8 viz,55,0.0009435742592942064,3 relevant_sentence,55,0.0009435742592942064,17 inferior,55,0.0009435742592942064,8 reinflection,55,0.0009435742592942064,12 user_experience,55,0.0009435742592942064,15 multilabel,55,0.0009435742592942064,10 evident,55,0.0009435742592942064,7 web_document,55,0.0009435742592942064,12 menes,55,0.0009435742592942064,5 grammatical_function,55,0.0009435742592942064,20 driver,55,0.0009435742592942064,6 negligible,55,0.0009435742592942064,10 state_of_the_art_parser,55,0.0009435742592942064,23 extraire,55,0.0009435742592942064,8 dictionary_definition,55,0.0009435742592942064,21 first_method,55,0.0009435742592942064,12 free_form,54,0.0009264183636706754,9 philosophy,54,0.0009264183636706754,10 morphological_complexity,54,0.0009264183636706754,24 original_document,54,0.0009264183636706754,17 btec,54,0.0009264183636706754,4 darpa,54,0.0009264183636706754,5 dst,54,0.0009264183636706754,3 evolutionary,54,0.0009264183636706754,12 well_suited,54,0.0009264183636706754,11 polysemous_word,54,0.0009264183636706754,15 economy,54,0.0009264183636706754,7 persuasion,54,0.0009264183636706754,10 vector_based,54,0.0009264183636706754,12 angle,54,0.0009264183636706754,5 employ,54,0.0009264183636706754,6 d'autre_part,54,0.0009264183636706754,12 back,54,0.0009264183636706754,4 slower,54,0.0009264183636706754,6 essence,54,0.0009264183636706754,7 pe,54,0.0009264183636706754,2 spatial_relation,54,0.0009264183636706754,16 tutoring,54,0.0009264183636706754,8 automatic_processing,54,0.0009264183636706754,20 western,54,0.0009264183636706754,7 proper_noun,54,0.0009264183636706754,11 several_benchmark,54,0.0009264183636706754,17 phylogenetic,54,0.0009264183636706754,12 moins,54,0.0009264183636706754,5 unsegmented,54,0.0009264183636706754,11 uma,54,0.0009264183636706754,3 fine_grained_sentiment,54,0.0009264183636706754,22 preferable,54,0.0009264183636706754,10 semantic_evaluation,54,0.0009264183636706754,19 various_application,54,0.0009264183636706754,19 disparity,54,0.0009264183636706754,9 gradient_based,54,0.0009264183636706754,14 wordnet_based,54,0.0009264183636706754,13 manning,54,0.0009264183636706754,7 rescoring,54,0.0009264183636706754,9 unbiased,54,0.0009264183636706754,8 defense,54,0.0009264183636706754,7 tous,54,0.0009264183636706754,4 vu,54,0.0009264183636706754,2 analogical,54,0.0009264183636706754,10 such_text,54,0.0009264183636706754,9 connectivity,54,0.0009264183636706754,12 such_case,54,0.0009264183636706754,9 lexical_ambiguity,54,0.0009264183636706754,17 *_*,54,0.0009264183636706754,3 social_medium_user,54,0.0009264183636706754,18 final_output,54,0.0009264183636706754,12 domain_specific_corpus,54,0.0009264183636706754,22 chen,54,0.0009264183636706754,4 manual_analysis,54,0.0009264183636706754,15 significant_increase,54,0.0009264183636706754,20 tend,54,0.0009264183636706754,4 important_word,54,0.0009264183636706754,14 raw_corpus,54,0.0009264183636706754,10 different_perspective,54,0.0009264183636706754,21 affinity,54,0.0009264183636706754,8 conceptnet,54,0.0009264183636706754,10 rsolution,54,0.0009264183636706754,9 deep_model,54,0.0009264183636706754,10 large_training,54,0.0009264183636706754,14 pertinent,53,0.0009092624680471444,9 intra_sentential,53,0.0009092624680471444,16 nonlinear,53,0.0009092624680471444,9 labor_intensive,53,0.0009092624680471444,15 situational,53,0.0009092624680471444,11 unbounded,53,0.0009092624680471444,9 translational,53,0.0009092624680471444,13 efficace,53,0.0009092624680471444,8 bipartite,53,0.0009092624680471444,9 unsatisfactory,53,0.0009092624680471444,14 patron,53,0.0009092624680471444,6 key_factor,53,0.0009092624680471444,10 numeric,53,0.0009092624680471444,7 ralisation,53,0.0009092624680471444,10 autres,53,0.0009092624680471444,6 hierarchical_clustering,53,0.0009092624680471444,23 autre,53,0.0009092624680471444,5 wide_web,53,0.0009092624680471444,8 logistic_regression_model,53,0.0009092624680471444,25 structuring,53,0.0009092624680471444,11 german_text,53,0.0009092624680471444,11 alexa,53,0.0009092624680471444,5 telles,53,0.0009092624680471444,6 learned_model,53,0.0009092624680471444,13 international_license,53,0.0009092624680471444,21 syntactic_parse,53,0.0009092624680471444,15 prose,53,0.0009092624680471444,5 draft,53,0.0009092624680471444,5 happy,53,0.0009092624680471444,5 yelp,53,0.0009092624680471444,4 sign_language,53,0.0009092624680471444,13 selfattention,53,0.0009092624680471444,13 glossary,53,0.0009092624680471444,8 new_set,53,0.0009092624680471444,7 s'appuie,53,0.0009092624680471444,8 traiter,53,0.0009092624680471444,7 elaborate,53,0.0009092624680471444,9 plm,53,0.0009092624680471444,3 preliminary_analysis,53,0.0009092624680471444,20 apple,53,0.0009092624680471444,5 weather,53,0.0009092624680471444,7 brand,53,0.0009092624680471444,5 single_document_summarization,53,0.0009092624680471444,29 cross_lingual_information_retrieval,53,0.0009092624680471444,35 multiple_model,53,0.0009092624680471444,14 sl,53,0.0009092624680471444,2 download,53,0.0009092624680471444,8 summary_sentence,53,0.0009092624680471444,16 gcn,53,0.0009092624680471444,3 arabic_tweet,53,0.0009092624680471444,12 d'abord,53,0.0009092624680471444,7 monotonic,53,0.0009092624680471444,9 extensibility,53,0.0009092624680471444,13 susceptible,53,0.0009092624680471444,11 first_system,53,0.0009092624680471444,12 big_data,53,0.0009092624680471444,8 special_attention,53,0.0009092624680471444,17 mrr,53,0.0009092624680471444,3 cours,53,0.0009092624680471444,5 averaged,53,0.0009092624680471444,8 l'ensemble,53,0.0009092624680471444,10 common_word,53,0.0009092624680471444,11 unannotated_corpus,53,0.0009092624680471444,18 outlier,53,0.0009092624680471444,7 publisher,53,0.0009092624680471444,9 lee,53,0.0009092624680471444,3 positive_effect,53,0.0009092624680471444,15 computer_aided,53,0.0009092624680471444,14 advantageous,53,0.0009092624680471444,12 useful_feature,53,0.0009092624680471444,14 high_order,53,0.0009092624680471444,10 afterwards,53,0.0009092624680471444,10 similarit,53,0.0009092624680471444,9 high_quality_translation,53,0.0009092624680471444,24 bayesian_network,53,0.0009092624680471444,16 simulator,53,0.0009092624680471444,9 dfinition,53,0.0009092624680471444,9 complex_model,53,0.0009092624680471444,13 comprehensive_analysis,53,0.0009092624680471444,22 ordered,52,0.0008921065724236133,7 open_ie,52,0.0008921065724236133,7 chunker,52,0.0008921065724236133,7 unsupervised_algorithm,52,0.0008921065724236133,22 empirical_investigation,52,0.0008921065724236133,23 ddi,52,0.0008921065724236133,3 wmt21,52,0.0008921065724236133,5 first_phase,52,0.0008921065724236133,11 graphbased,52,0.0008921065724236133,10 hmm_based,52,0.0008921065724236133,9 same_sentence,52,0.0008921065724236133,13 pcfgs,52,0.0008921065724236133,5 better_generalization,52,0.0008921065724236133,21 zero_shot_transfer,52,0.0008921065724236133,18 fewshot,52,0.0008921065724236133,7 citizen,52,0.0008921065724236133,7 major_problem,52,0.0008921065724236133,13 summary_generation,52,0.0008921065724236133,18 emnlp,52,0.0008921065724236133,5 different_form,52,0.0008921065724236133,14 specific_word,52,0.0008921065724236133,13 lexical_overlap,52,0.0008921065724236133,15 new_measure,52,0.0008921065724236133,11 sector,52,0.0008921065724236133,6 robust_model,52,0.0008921065724236133,12 rc,52,0.0008921065724236133,2 important_resource,52,0.0008921065724236133,18 vae,52,0.0008921065724236133,3 up_to_date,52,0.0008921065724236133,10 billion,52,0.0008921065724236133,7 episode,52,0.0008921065724236133,7 deep_reinforcement,52,0.0008921065724236133,18 highest_score,52,0.0008921065724236133,13 k_best,52,0.0008921065724236133,6 cultural_heritage,52,0.0008921065724236133,17 automatic_question,52,0.0008921065724236133,18 vaswani,52,0.0008921065724236133,7 trouble,52,0.0008921065724236133,7 predictability,52,0.0008921065724236133,14 synchronous_grammar,52,0.0008921065724236133,19 ensemble_approach,52,0.0008921065724236133,17 literacy,52,0.0008921065724236133,8 sixth,52,0.0008921065724236133,5 sizable,52,0.0008921065724236133,7 heterogeneity,52,0.0008921065724236133,13 small_size,52,0.0008921065724236133,10 post_editing_effort,52,0.0008921065724236133,19 dp,52,0.0008921065724236133,2 multiword_expression,52,0.0008921065724236133,20 external_data,52,0.0008921065724236133,13 cumulative,52,0.0008921065724236133,10 winner,52,0.0008921065724236133,6 timing,52,0.0008921065724236133,6 dictionary_entry,52,0.0008921065724236133,16 personalization,52,0.0008921065724236133,15 restrictive,52,0.0008921065724236133,11 different_size,52,0.0008921065724236133,14 posterior_probability,52,0.0008921065724236133,21 two_fold,52,0.0008921065724236133,8 many_to_many,52,0.0008921065724236133,12 alignment_error,52,0.0008921065724236133,15 com,52,0.0008921065724236133,3 celles,52,0.0008921065724236133,6 customizable,52,0.0008921065724236133,12 small_data,52,0.0008921065724236133,10 creativity,52,0.0008921065724236133,10 laborious,52,0.0008921065724236133,9 wellknown,52,0.0008921065724236133,9 new_translation,52,0.0008921065724236133,15 heuristic_rule,52,0.0008921065724236133,14 reproduction,52,0.0008921065724236133,12 auto_encoder,52,0.0008921065724236133,12 new_york_time,52,0.0008921065724236133,13 montr,52,0.0008921065724236133,5 negative_sentiment,52,0.0008921065724236133,18 aspectual,52,0.0008921065724236133,9 france,52,0.0008921065724236133,6 checkpoint,52,0.0008921065724236133,10 legal_document,52,0.0008921065724236133,14 understudied,52,0.0008921065724236133,12 different_classifier,52,0.0008921065724236133,20 inferential,52,0.0008921065724236133,11 lower_level,51,0.0008749506768000823,11 saliency,51,0.0008749506768000823,8 effective_strategy,51,0.0008749506768000823,18 many_researcher,51,0.0008749506768000823,15 grammatical_framework,51,0.0008749506768000823,21 surveillance,51,0.0008749506768000823,12 open_domain_question_answering,51,0.0008749506768000823,30 parallel_training_data,51,0.0008749506768000823,22 un_analyseur,51,0.0008749506768000823,12 analyst,51,0.0008749506768000823,7 low_resource_language_pair,51,0.0008749506768000823,26 informal_text,51,0.0008749506768000823,13 top_ranked,51,0.0008749506768000823,10 different_class,51,0.0008749506768000823,15 standard_language,51,0.0008749506768000823,17 predictive_performance,51,0.0008749506768000823,22 large_data_set,51,0.0008749506768000823,14 font,51,0.0008749506768000823,4 baseline_method,51,0.0008749506768000823,15 death,51,0.0008749506768000823,5 transformer_architecture,51,0.0008749506768000823,24 slavic_language,51,0.0008749506768000823,15 unlabelled_data,51,0.0008749506768000823,15 covid_19_pandemic,51,0.0008749506768000823,17 available_training_data,51,0.0008749506768000823,23 baseline_system,51,0.0008749506768000823,15 finitestate,51,0.0008749506768000823,11 er,51,0.0008749506768000823,2 debiasing,51,0.0008749506768000823,9 grapheme,51,0.0008749506768000823,8 same_way,51,0.0008749506768000823,8 worst,51,0.0008749506768000823,5 unlexicalized,51,0.0008749506768000823,13 multilingual_machine,51,0.0008749506768000823,20 searching,51,0.0008749506768000823,9 further_investigation,51,0.0008749506768000823,21 same_corpus,51,0.0008749506768000823,11 molecular,51,0.0008749506768000823,9 first_task,51,0.0008749506768000823,10 key_issue,51,0.0008749506768000823,9 catgories,51,0.0008749506768000823,9 subclass,51,0.0008749506768000823,8 additional_resource,51,0.0008749506768000823,19 front,51,0.0008749506768000823,5 flaw,51,0.0008749506768000823,4 parametric,51,0.0008749506768000823,10 non_compositional,51,0.0008749506768000823,17 english_verb,51,0.0008749506768000823,12 marked,51,0.0008749506768000823,6 emojis,51,0.0008749506768000823,6 slt,51,0.0008749506768000823,3 hand_annotated,51,0.0008749506768000823,14 tongue,51,0.0008749506768000823,6 adjectival,51,0.0008749506768000823,10 comparables,51,0.0008749506768000823,11 natural_language_application,51,0.0008749506768000823,28 visant,51,0.0008749506768000823,6 vidence,51,0.0008749506768000823,7 bilstm_crf,51,0.0008749506768000823,10 prosodic_feature,51,0.0008749506768000823,16 fake_news_detection,51,0.0008749506768000823,19 principe,51,0.0008749506768000823,8 similar_sentence,51,0.0008749506768000823,16 blind_test,51,0.0008749506768000823,10 medical_language,51,0.0008749506768000823,16 cantonese,51,0.0008749506768000823,9 contiguous,51,0.0008749506768000823,10 complex_word_identification,51,0.0008749506768000823,27 computer_assisted_translation,51,0.0008749506768000823,29 top_k,51,0.0008749506768000823,5 coarse_to_fine,51,0.0008749506768000823,14 open_access,51,0.0008749506768000823,11 under_explored,51,0.0008749506768000823,14 film,51,0.0008749506768000823,4 stateof_the_art_model,51,0.0008749506768000823,21 segmental,51,0.0008749506768000823,9 assist,51,0.0008749506768000823,6 intellectual,51,0.0008749506768000823,12 original_sentence,51,0.0008749506768000823,17 frequent_word,51,0.0008749506768000823,13 parse_tree,51,0.0008749506768000823,10 break,51,0.0008749506768000823,5 dev,50,0.0008577947811765513,3 phrase_based_mt,50,0.0008577947811765513,15 novel_data,50,0.0008577947811765513,10 utilize,50,0.0008577947811765513,7 mature,50,0.0008577947811765513,6 english_to_chinese,50,0.0008577947811765513,18 sentence_aligned,50,0.0008577947811765513,16 bottom,50,0.0008577947811765513,6 _which,50,0.0008577947811765513,6 massive_amount,50,0.0008577947811765513,14 parts_of_speech,50,0.0008577947811765513,15 safe,50,0.0008577947811765513,4 editorial,50,0.0008577947811765513,9 tutor,50,0.0008577947811765513,5 une_tude,50,0.0008577947811765513,8 screen,50,0.0008577947811765513,6 column,50,0.0008577947811765513,6 finer_grained,50,0.0008577947811765513,13 ralise,50,0.0008577947811765513,6 elementary_tree,50,0.0008577947811765513,15 objectif,50,0.0008577947811765513,8 dot,50,0.0008577947811765513,3 ranked_list,50,0.0008577947811765513,11 incoherent,50,0.0008577947811765513,10 lesser,50,0.0008577947811765513,6 microsoft_research,50,0.0008577947811765513,18 indigenous_language,50,0.0008577947811765513,19 statistical_mt_system,50,0.0008577947811765513,21 soft_constraint,50,0.0008577947811765513,15 bow,50,0.0008577947811765513,3 auc,50,0.0008577947811765513,3 bitexts,50,0.0008577947811765513,7 standardization,50,0.0008577947811765513,15 imdb,50,0.0008577947811765513,4 new_text,50,0.0008577947811765513,8 statistical_measure,50,0.0008577947811765513,19 chinese_language_processing,50,0.0008577947811765513,27 second_part,50,0.0008577947811765513,11 crosslingual_transfer,50,0.0008577947811765513,21 dog,50,0.0008577947811765513,3 routine,50,0.0008577947811765513,7 ample,50,0.0008577947811765513,5 anyone,50,0.0008577947811765513,6 lower_bound,50,0.0008577947811765513,11 therefore,50,0.0008577947811765513,9 simplest,50,0.0008577947811765513,8 post_hoc,50,0.0008577947811765513,8 other_resource,50,0.0008577947811765513,14 automated_evaluation,50,0.0008577947811765513,20 hybrid_method,50,0.0008577947811765513,13 two_phase,50,0.0008577947811765513,9 sensible,50,0.0008577947811765513,8 non_verbal,50,0.0008577947811765513,10 substantial_gain,50,0.0008577947811765513,16 supervise,50,0.0008577947811765513,9 copying,50,0.0008577947811765513,7 prise,50,0.0008577947811765513,5 ldc,50,0.0008577947811765513,3 obtains,50,0.0008577947811765513,7 first_version,50,0.0008577947811765513,13 final_translation,50,0.0008577947811765513,17 key_aspect,50,0.0008577947811765513,10 hedge,50,0.0008577947811765513,5 s'agit,50,0.0008577947811765513,6 historical_linguistics,50,0.0008577947811765513,22 textuelles,50,0.0008577947811765513,10 child_directed,50,0.0008577947811765513,14 zhang,50,0.0008577947811765513,5 bleu_point,50,0.0008577947811765513,10 english_to_german,50,0.0008577947811765513,17 seq2seq_model,50,0.0008577947811765513,13 manifold,50,0.0008577947811765513,8 reflection,50,0.0008577947811765513,10 trade,50,0.0008577947811765513,5 different_layer,50,0.0008577947811765513,15 depuis,50,0.0008577947811765513,6 second_language_acquisition,49,0.0008406388855530203,27 denotation,49,0.0008406388855530203,10 social_interaction,49,0.0008406388855530203,18 finer,49,0.0008406388855530203,5 qa_datasets,49,0.0008406388855530203,11 data_driven_method,49,0.0008406388855530203,18 une_reprsentation,49,0.0008406388855530203,17 semantic_role_label,49,0.0008406388855530203,19 bilingual_text,49,0.0008406388855530203,14 small_datasets,49,0.0008406388855530203,14 semantic_concept,49,0.0008406388855530203,16 satisfactory_result,49,0.0008406388855530203,19 littrature,49,0.0008406388855530203,10 app,49,0.0008406388855530203,3 edited,49,0.0008406388855530203,6 new_paradigm,49,0.0008406388855530203,12 new_tool,49,0.0008406388855530203,8 large_document,49,0.0008406388855530203,14 open_source_tool,49,0.0008406388855530203,16 md,49,0.0008406388855530203,2 sure,49,0.0008406388855530203,4 significant_performance_gain,49,0.0008406388855530203,28 comprises,49,0.0008406388855530203,9 portuguese_language,49,0.0008406388855530203,19 conventional_approach,49,0.0008406388855530203,21 clark,49,0.0008406388855530203,5 convex,49,0.0008406388855530203,6 whilst,49,0.0008406388855530203,6 distractors,49,0.0008406388855530203,11 agenda,49,0.0008406388855530203,6 more_detail,49,0.0008406388855530203,11 smooth,49,0.0008406388855530203,6 morphological_tagging,49,0.0008406388855530203,21 injection,49,0.0008406388855530203,9 offensive_content,49,0.0008406388855530203,17 next_word,49,0.0008406388855530203,9 k_nearest,49,0.0008406388855530203,9 translationese,49,0.0008406388855530203,14 essential_component,49,0.0008406388855530203,19 apis,49,0.0008406388855530203,4 essential_task,49,0.0008406388855530203,14 nomm'ees,49,0.0008406388855530203,8 annotated_sentence,49,0.0008406388855530203,18 vary,49,0.0008406388855530203,4 intern,49,0.0008406388855530203,6 mlp,49,0.0008406388855530203,3 fundamental_problem,49,0.0008406388855530203,19 english_russian,49,0.0008406388855530203,15 same_model,49,0.0008406388855530203,10 social_bias,49,0.0008406388855530203,11 segmented,49,0.0008406388855530203,9 misogyny,49,0.0008406388855530203,8 grammatical_error_detection,49,0.0008406388855530203,27 average_improvement,49,0.0008406388855530203,19 monolingual_word,49,0.0008406388855530203,16 upcoming,49,0.0008406388855530203,8 overfitting,49,0.0008406388855530203,11 main_finding,49,0.0008406388855530203,12 real_valued,49,0.0008406388855530203,11 hyponym,49,0.0008406388855530203,7 dmonstration,49,0.0008406388855530203,12 complementary_information,49,0.0008406388855530203,25 finite_state_automaton,49,0.0008406388855530203,22 further_experiment,49,0.0008406388855530203,18 labeled_example,49,0.0008406388855530203,15 primary_submission,49,0.0008406388855530203,18 charge,49,0.0008406388855530203,6 handle,49,0.0008406388855530203,6 bilingual_terminology,49,0.0008406388855530203,21 alignment_quality,49,0.0008406388855530203,17 parliamentary,49,0.0008406388855530203,13 global_feature,49,0.0008406388855530203,14 semcor,49,0.0008406388855530203,6 kit,49,0.0008406388855530203,3 language_dependent,49,0.0008406388855530203,18 bracketing,49,0.0008406388855530203,10 powerful_tool,49,0.0008406388855530203,13 contradictory,49,0.0008406388855530203,13 face_to_face,49,0.0008406388855530203,12 formalisme,49,0.0008406388855530203,10 first_part,49,0.0008406388855530203,10 cration,49,0.0008406388855530203,7 timeml,49,0.0008406388855530203,6 simple_feature,49,0.0008406388855530203,14 considerable_attention,49,0.0008406388855530203,22 linguistic_processing,49,0.0008406388855530203,21 door,49,0.0008406388855530203,4 tonal,48,0.0008234829899294892,5 encoded,48,0.0008234829899294892,7 noisy_channel_model,48,0.0008234829899294892,19 principled_way,48,0.0008234829899294892,14 linguistic_characteristic,48,0.0008234829899294892,25 agglomerative,48,0.0008234829899294892,13 large_vocabulary,48,0.0008234829899294892,16 back_off,48,0.0008234829899294892,8 social_medium_content,48,0.0008234829899294892,21 contest,48,0.0008234829899294892,7 phrase_structure,48,0.0008234829899294892,16 different_sens,48,0.0008234829899294892,14 axiom,48,0.0008234829899294892,5 wmt17,48,0.0008234829899294892,5 verb_noun,48,0.0008234829899294892,9 spcifique,48,0.0008234829899294892,9 transformation_based,48,0.0008234829899294892,20 hotpotqa,48,0.0008234829899294892,8 comparability,48,0.0008234829899294892,13 test_set,48,0.0008234829899294892,8 timely,48,0.0008234829899294892,6 limited_resource,48,0.0008234829899294892,16 _an,48,0.0008234829899294892,3 herein,48,0.0008234829899294892,6 rumor,48,0.0008234829899294892,5 holder,48,0.0008234829899294892,6 nlp_method,48,0.0008234829899294892,10 rich_resource,48,0.0008234829899294892,13 tagsets,48,0.0008234829899294892,7 unprecedented,48,0.0008234829899294892,13 nommes,48,0.0008234829899294892,6 curated,48,0.0008234829899294892,7 unsupervised_machine_translation,48,0.0008234829899294892,32 cost_effective,48,0.0008234829899294892,14 critical_role,48,0.0008234829899294892,13 many_downstream,48,0.0008234829899294892,15 negated,48,0.0008234829899294892,7 syntagmatic,48,0.0008234829899294892,11 proportional,48,0.0008234829899294892,12 syntactic_context,48,0.0008234829899294892,17 individual_sentence,48,0.0008234829899294892,19 visual_scene,48,0.0008234829899294892,12 user_review,48,0.0008234829899294892,11 systematic_comparison,48,0.0008234829899294892,21 incorporate,48,0.0008234829899294892,11 lexical_meaning,48,0.0008234829899294892,15 confident,48,0.0008234829899294892,9 prior_research,48,0.0008234829899294892,14 hashtag,48,0.0008234829899294892,7 money,48,0.0008234829899294892,5 rwth,48,0.0008234829899294892,4 significant_impact,48,0.0008234829899294892,18 asset,48,0.0008234829899294892,5 hand_written,48,0.0008234829899294892,12 lexicaux,48,0.0008234829899294892,8 bilingual_lexicon_extraction,48,0.0008234829899294892,28 final_prediction,48,0.0008234829899294892,16 post_editors,48,0.0008234829899294892,12 open_track,48,0.0008234829899294892,10 several_feature,48,0.0008234829899294892,15 tl,48,0.0008234829899294892,2 generated_response,48,0.0008234829899294892,18 compressed,48,0.0008234829899294892,10 actionable,48,0.0008234829899294892,10 many_domain,48,0.0008234829899294892,11 max,48,0.0008234829899294892,3 wmt18,48,0.0008234829899294892,5 bnc,48,0.0008234829899294892,3 multi_class_classification,48,0.0008234829899294892,26 useful_resource,48,0.0008234829899294892,15 negotiation,48,0.0008234829899294892,11 error_prone,48,0.0008234829899294892,11 linguistic_representation,48,0.0008234829899294892,25 shot,48,0.0008234829899294892,4 council,48,0.0008234829899294892,7 ultimate_goal,48,0.0008234829899294892,13 interactive_system,48,0.0008234829899294892,18 becomes,48,0.0008234829899294892,7 second_method,48,0.0008234829899294892,13 learning_based_approach,48,0.0008234829899294892,23 couverture,48,0.0008234829899294892,10 endeavor,48,0.0008234829899294892,8 factual_knowledge,48,0.0008234829899294892,17 promising_direction,47,0.0008063270943059582,19 locuteurs,47,0.0008063270943059582,9 cmu,47,0.0008063270943059582,3 semantic_equivalence,47,0.0008063270943059582,20 pretrained_transformer,47,0.0008063270943059582,22 semi_automated,47,0.0008063270943059582,14 biaffine,47,0.0008063270943059582,8 parmi,47,0.0008063270943059582,5 avant,47,0.0008063270943059582,5 individual_model,47,0.0008063270943059582,16 l'adaptation,47,0.0008063270943059582,12 different_target,47,0.0008063270943059582,16 different_user,47,0.0008063270943059582,14 syntax_based_machine_translation,47,0.0008063270943059582,32 visual_context,47,0.0008063270943059582,14 single_domain,47,0.0008063270943059582,13 continuous_vector,47,0.0008063270943059582,17 excerpt,47,0.0008063270943059582,7 executable,47,0.0008063270943059582,10 domain_specific_knowledge,47,0.0008063270943059582,25 different_sentence,47,0.0008063270943059582,18 syntax_based_machine,47,0.0008063270943059582,20 future_study,47,0.0008063270943059582,12 different_architecture,47,0.0008063270943059582,22 co_occurring,47,0.0008063270943059582,12 contraintes,47,0.0008063270943059582,11 gaussian_mixture_model,47,0.0008063270943059582,22 ideology,47,0.0008063270943059582,8 heterogeneous_graph,47,0.0008063270943059582,19 other_application,47,0.0008063270943059582,17 linearization,47,0.0008063270943059582,13 wide_margin,47,0.0008063270943059582,11 various_source,47,0.0008063270943059582,14 s'emantiques,47,0.0008063270943059582,12 workbench,47,0.0008063270943059582,9 further_development,47,0.0008063270943059582,19 public_opinion,47,0.0008063270943059582,14 one_to_many,47,0.0008063270943059582,11 morphological_analyser,47,0.0008063270943059582,22 aspect_category,47,0.0008063270943059582,15 linguistic_variation,47,0.0008063270943059582,20 e2e,47,0.0008063270943059582,3 severity,47,0.0008063270943059582,8 lieu,47,0.0008063270943059582,4 main_component,47,0.0008063270943059582,14 minimalist,47,0.0008063270943059582,10 detailed_error,47,0.0008063270943059582,14 nn,47,0.0008063270943059582,2 kannada,47,0.0008063270943059582,7 celui,47,0.0008063270943059582,5 rhetorical_relation,47,0.0008063270943059582,19 credit,47,0.0008063270943059582,6 progression,47,0.0008063270943059582,11 different_topic,47,0.0008063270943059582,15 second_phase,47,0.0008063270943059582,12 marketing,47,0.0008063270943059582,9 qg,47,0.0008063270943059582,2 planner,47,0.0008063270943059582,7 web_application,47,0.0008063270943059582,15 bridging,47,0.0008063270943059582,8 simple_sentence,47,0.0008063270943059582,15 provide,47,0.0008063270943059582,7 finite_state_machine,47,0.0008063270943059582,20 human_robot_interaction,47,0.0008063270943059582,23 syntactic_level,47,0.0008063270943059582,15 answer_selection,47,0.0008063270943059582,16 lexical_category,47,0.0008063270943059582,16 self,47,0.0008063270943059582,4 designer,47,0.0008063270943059582,8 delay,47,0.0008063270943059582,5 autonomous,47,0.0008063270943059582,10 best_score,47,0.0008063270943059582,10 phrase_based_translation_system,47,0.0008063270943059582,31 multilingual_resource,47,0.0008063270943059582,21 singular_value,47,0.0008063270943059582,14 regularizer,47,0.0008063270943059582,11 lexical_representation,47,0.0008063270943059582,22 pyramid,47,0.0008063270943059582,7 new_version,47,0.0008063270943059582,11 multilingual_data,47,0.0008063270943059582,17 commission,47,0.0008063270943059582,10 qu'une,47,0.0008063270943059582,6 subsystem,47,0.0008063270943059582,9 infinite,47,0.0008063270943059582,8 mit,47,0.0008063270943059582,3 long_sequence,47,0.0008063270943059582,13 exprience,47,0.0008063270943059582,9 profit,47,0.0008063270943059582,6 fouille,47,0.0008063270943059582,7 tale,47,0.0008063270943059582,4 median,47,0.0008063270943059582,6 berkeley,47,0.0008063270943059582,8 main_result,47,0.0008063270943059582,11 lorsque,46,0.0007891711986824273,7 alignment_based,46,0.0007891711986824273,15 possible_translation,46,0.0007891711986824273,20 nouvelles,46,0.0007891711986824273,9 vulnerability,46,0.0007891711986824273,13 violence,46,0.0007891711986824273,8 shallow_discourse,46,0.0007891711986824273,17 end_to_end_speech,46,0.0007891711986824273,17 several_datasets,46,0.0007891711986824273,16 word_by_word,46,0.0007891711986824273,12 high_correlation,46,0.0007891711986824273,16 stand_alone,46,0.0007891711986824273,11 naive_bayes_classifier,46,0.0007891711986824273,22 similar_context,46,0.0007891711986824273,15 byte,46,0.0007891711986824273,4 identifiable,46,0.0007891711986824273,12 previous_year,46,0.0007891711986824273,13 user_interaction,46,0.0007891711986824273,16 multiple_word,46,0.0007891711986824273,13 polar,46,0.0007891711986824273,5 negative_sample,46,0.0007891711986824273,15 general_language,46,0.0007891711986824273,16 japanese_sentence,46,0.0007891711986824273,17 context_vector,46,0.0007891711986824273,14 rich_information,46,0.0007891711986824273,16 entire_document,46,0.0007891711986824273,15 neural_net,46,0.0007891711986824273,10 ongoing_project,46,0.0007891711986824273,15 codemixed,46,0.0007891711986824273,9 tokenizer,46,0.0007891711986824273,9 abstractive_summarization_model,46,0.0007891711986824273,31 rsultat,46,0.0007891711986824273,7 in_domain_training,46,0.0007891711986824273,18 main_advantage,46,0.0007891711986824273,14 leaf,46,0.0007891711986824273,4 one_to_one,46,0.0007891711986824273,10 tested,46,0.0007891711986824273,6 visible,46,0.0007891711986824273,7 modified_version,46,0.0007891711986824273,16 medical_concept,46,0.0007891711986824273,15 sinica,46,0.0007891711986824273,6 document_classification,46,0.0007891711986824273,23 same_text,46,0.0007891711986824273,9 short_term_memory_network,46,0.0007891711986824273,25 ironic,46,0.0007891711986824273,6 unification_based,46,0.0007891711986824273,17 give,46,0.0007891711986824273,4 polysynthetic,46,0.0007891711986824273,13 equality,46,0.0007891711986824273,8 human_being,46,0.0007891711986824273,11 implicit_relation,46,0.0007891711986824273,17 hub,46,0.0007891711986824273,3 english_to_japanese,46,0.0007891711986824273,19 corpus_based_study,46,0.0007891711986824273,18 latvian,46,0.0007891711986824273,7 variable_length,46,0.0007891711986824273,15 graphical_user,46,0.0007891711986824273,14 nation,46,0.0007891711986824273,6 catastrophic_forgetting,46,0.0007891711986824273,23 ax,46,0.0007891711986824273,2 house,46,0.0007891711986824273,5 natural_language_instruction,46,0.0007891711986824273,28 past_year,46,0.0007891711986824273,9 pre_processing_step,46,0.0007891711986824273,19 commitment,46,0.0007891711986824273,10 new_application,46,0.0007891711986824273,15 mots_cls,46,0.0007891711986824273,8 explicit_discourse,46,0.0007891711986824273,18 diagram,46,0.0007891711986824273,7 standard_word,46,0.0007891711986824273,13 bilingue,46,0.0007891711986824273,8 porte,46,0.0007891711986824273,5 detailed_error_analysis,46,0.0007891711986824273,23 pronounced,46,0.0007891711986824273,10 probabilistic_approach,46,0.0007891711986824273,22 code_mixed_data,46,0.0007891711986824273,15 deaf,46,0.0007891711986824273,4 ensembling,46,0.0007891711986824273,10 tempeval,46,0.0007891711986824273,8 online_community,46,0.0007891711986824273,16 source_target,46,0.0007891711986824273,13 on_the_fly,46,0.0007891711986824273,10 multilingual_nmt,46,0.0007891711986824273,16 wizard_of_oz,46,0.0007891711986824273,12 vaswani_et,46,0.0007891711986824273,10 false_positive,46,0.0007891711986824273,14 1_best,46,0.0007891711986824273,6 impression,46,0.0007891711986824273,10 observe,46,0.0007891711986824273,7 propos,46,0.0007891711986824273,6 elles,46,0.0007891711986824273,5 better_quality,46,0.0007891711986824273,14 different_data_set,46,0.0007891711986824273,18 backoff,46,0.0007891711986824273,7 discriminant,46,0.0007891711986824273,12 few_example,46,0.0007891711986824273,11 euclidean,46,0.0007891711986824273,9 graphical_user_interface,46,0.0007891711986824273,24 discursive,46,0.0007891711986824273,10 bird,46,0.0007891711986824273,4 assistive,46,0.0007891711986824273,9 bilingual_sentence,46,0.0007891711986824273,18 labeled_data,46,0.0007891711986824273,12 fail,46,0.0007891711986824273,4 indo_aryan,46,0.0007891711986824273,10 cohen,46,0.0007891711986824273,5 duplicate,46,0.0007891711986824273,9 visual_representation,45,0.0007720153030588961,21 english_datasets,45,0.0007720153030588961,16 first_author,45,0.0007720153030588961,12 cky,45,0.0007720153030588961,3 annotated_resource,45,0.0007720153030588961,18 gpt,45,0.0007720153030588961,3 twofold,45,0.0007720153030588961,7 neighboring,45,0.0007720153030588961,11 multilingual_parsing,45,0.0007720153030588961,20 question_answering_system,45,0.0007720153030588961,25 dfi,45,0.0007720153030588961,3 multimodal_machine,45,0.0007720153030588961,18 switch,45,0.0007720153030588961,6 uima,45,0.0007720153030588961,4 hinders,45,0.0007720153030588961,7 replication,45,0.0007720153030588961,11 minimum_error,45,0.0007720153030588961,13 un_modle,45,0.0007720153030588961,8 negative_sampling,45,0.0007720153030588961,17 hybrid_machine,45,0.0007720153030588961,14 english_dataset,45,0.0007720153030588961,15 state_of_theart_method,45,0.0007720153030588961,22 critres,45,0.0007720153030588961,7 negative_effect,45,0.0007720153030588961,15 pdf,45,0.0007720153030588961,3 little_research,45,0.0007720153030588961,15 morphological_reinflection,45,0.0007720153030588961,26 twelve,45,0.0007720153030588961,6 popular_approach,45,0.0007720153030588961,16 syntax_aware,45,0.0007720153030588961,12 oov_word,45,0.0007720153030588961,8 non_neural,45,0.0007720153030588961,10 next_generation,45,0.0007720153030588961,15 entropy_based,45,0.0007720153030588961,13 transform,45,0.0007720153030588961,9 centroid,45,0.0007720153030588961,8 pre_trained_bert_model,45,0.0007720153030588961,22 articulatory,45,0.0007720153030588961,12 vaswani_et_al.,45,0.0007720153030588961,14 non_experts,45,0.0007720153030588961,11 central_role,45,0.0007720153030588961,12 built_in,45,0.0007720153030588961,8 several_language_pair,45,0.0007720153030588961,21 current_paper,45,0.0007720153030588961,13 centrality,45,0.0007720153030588961,10 low_rank,45,0.0007720153030588961,8 na,45,0.0007720153030588961,2 presidential,45,0.0007720153030588961,12 corpus_level,45,0.0007720153030588961,12 argue,45,0.0007720153030588961,5 binding,45,0.0007720153030588961,7 confirmation,45,0.0007720153030588961,12 island,45,0.0007720153030588961,6 statistical_information,45,0.0007720153030588961,23 theoretical_framework,45,0.0007720153030588961,21 adaption,45,0.0007720153030588961,8 lengthy,45,0.0007720153030588961,7 expert_annotation,45,0.0007720153030588961,17 many_people,45,0.0007720153030588961,11 similar_meaning,45,0.0007720153030588961,15 semeval_2014_task,45,0.0007720153030588961,17 natural_way,45,0.0007720153030588961,11 clpsych,45,0.0007720153030588961,7 tourism,45,0.0007720153030588961,7 future_improvement,45,0.0007720153030588961,18 surrogate,45,0.0007720153030588961,9 other_researcher,45,0.0007720153030588961,16 crucial_step,45,0.0007720153030588961,12 irrespective,45,0.0007720153030588961,12 singular_value_decomposition,45,0.0007720153030588961,28 unaligned,45,0.0007720153030588961,9 free_grammar,45,0.0007720153030588961,12 word_to_word,45,0.0007720153030588961,12 experimental_data,45,0.0007720153030588961,17 multilingual_system,45,0.0007720153030588961,19 annots,45,0.0007720153030588961,6 intonation,45,0.0007720153030588961,10 segmenters,45,0.0007720153030588961,10 gated_recurrent,45,0.0007720153030588961,15 stemmer,45,0.0007720153030588961,7 null,45,0.0007720153030588961,4 undergraduate,45,0.0007720153030588961,13 phonetic_transcription,45,0.0007720153030588961,22 subject_verb,45,0.0007720153030588961,12 tiny,45,0.0007720153030588961,4 statistical_word,45,0.0007720153030588961,16 multitude,45,0.0007720153030588961,9 lexical_acquisition,45,0.0007720153030588961,19 politeness,45,0.0007720153030588961,10 conversational_context,45,0.0007720153030588961,22 unsupervised_setting,45,0.0007720153030588961,20 selector,45,0.0007720153030588961,8 recorded,45,0.0007720153030588961,8 arabic_to_english,45,0.0007720153030588961,17 cambridge,45,0.0007720153030588961,9 linear_combination,45,0.0007720153030588961,18 stacking,44,0.0007548594074353652,8 advertising,44,0.0007548594074353652,11 semantic_search,44,0.0007548594074353652,15 telle,44,0.0007548594074353652,5 dag,44,0.0007548594074353652,3 unsupervised_way,44,0.0007548594074353652,16 ct,44,0.0007548594074353652,2 proposes,44,0.0007548594074353652,8 cooccurrences,44,0.0007548594074353652,13 missing,44,0.0007548594074353652,7 robotic,44,0.0007548594074353652,7 new_data_set,44,0.0007548594074353652,12 better_representation,44,0.0007548594074353652,21 conclude,44,0.0007548594074353652,8 deeper_understanding,44,0.0007548594074353652,20 traductions,44,0.0007548594074353652,11 pmi,44,0.0007548594074353652,3 open_challenge,44,0.0007548594074353652,14 unseen_test,44,0.0007548594074353652,11 notre_approche,44,0.0007548594074353652,14 linguistic_context,44,0.0007548594074353652,18 african_language,44,0.0007548594074353652,16 linguistic_description,44,0.0007548594074353652,22 negative_impact,44,0.0007548594074353652,15 multilingual_machine_translation,44,0.0007548594074353652,32 alternative_method,44,0.0007548594074353652,18 stratgies,44,0.0007548594074353652,9 structured_representation,44,0.0007548594074353652,25 textual_representation,44,0.0007548594074353652,22 contextualization,44,0.0007548594074353652,17 disentanglement,44,0.0007548594074353652,15 light_verb_construction,44,0.0007548594074353652,23 pathway,44,0.0007548594074353652,7 novel_word,44,0.0007548594074353652,10 resolvers,44,0.0007548594074353652,9 see,44,0.0007548594074353652,3 rponse,44,0.0007548594074353652,6 frequency_based,44,0.0007548594074353652,15 bilingual_parallel_corpus,44,0.0007548594074353652,25 principal_component,44,0.0007548594074353652,19 salient_information,44,0.0007548594074353652,19 n_ary,44,0.0007548594074353652,5 tel,44,0.0007548594074353652,3 stochastic_gradient,44,0.0007548594074353652,19 narrative_text,44,0.0007548594074353652,14 pr,44,0.0007548594074353652,2 asian_translation,44,0.0007548594074353652,17 ethic,44,0.0007548594074353652,5 graduate,44,0.0007548594074353652,8 stakeholder,44,0.0007548594074353652,11 abusive_language_detection,44,0.0007548594074353652,26 rigid,44,0.0007548594074353652,5 owl,44,0.0007548594074353652,3 concordance,44,0.0007548594074353652,11 binary_classification_problem,44,0.0007548594074353652,29 mt_quality,44,0.0007548594074353652,10 main_objective,44,0.0007548594074353652,14 thmatique,44,0.0007548594074353652,9 donn,44,0.0007548594074353652,4 few_study,44,0.0007548594074353652,9 emergency,44,0.0007548594074353652,9 multilinguality,44,0.0007548594074353652,15 keystroke,44,0.0007548594074353652,9 serial,44,0.0007548594074353652,6 animation,44,0.0007548594074353652,9 clausal,44,0.0007548594074353652,7 graph_based_method,44,0.0007548594074353652,18 itg,44,0.0007548594074353652,3 connotation,44,0.0007548594074353652,11 excellent_performance,44,0.0007548594074353652,21 epoch,44,0.0007548594074353652,5 real_world_data,44,0.0007548594074353652,15 diffrences,44,0.0007548594074353652,10 cross_lingual_setting,44,0.0007548594074353652,21 knowledge_base,44,0.0007548594074353652,14 distinguish,44,0.0007548594074353652,11 neural_generation,44,0.0007548594074353652,17 occupation,44,0.0007548594074353652,10 random_baseline,44,0.0007548594074353652,15 pos_tagging,44,0.0007548594074353652,11 set_up,44,0.0007548594074353652,6 relative_position,44,0.0007548594074353652,17 overall_result,44,0.0007548594074353652,14 ideological,44,0.0007548594074353652,11 capsule,44,0.0007548594074353652,7 muc,44,0.0007548594074353652,3 worldwide,44,0.0007548594074353652,9 le_systme,44,0.0007548594074353652,9 such_question,44,0.0007548594074353652,13 plagiarism,44,0.0007548594074353652,10 committee,44,0.0007548594074353652,9 verse,44,0.0007548594074353652,5 manifest,44,0.0007548594074353652,8 transport,44,0.0007548594074353652,9 chinese_english_translation_task,44,0.0007548594074353652,32 produit,44,0.0007548594074353652,7 interdependency,44,0.0007548594074353652,15 algebra,44,0.0007548594074353652,7 large_scale_knowledge,44,0.0007548594074353652,21 legal_domain,44,0.0007548594074353652,12 encoder_decoder_architecture,44,0.0007548594074353652,28 automatic_machine,44,0.0007548594074353652,17 speech_synthesis,44,0.0007548594074353652,16 inclusive,44,0.0007548594074353652,9 semantic_distance,44,0.0007548594074353652,17 such_representation,44,0.0007548594074353652,19 systran,44,0.0007548594074353652,7 significant_reduction,44,0.0007548594074353652,21 saving,44,0.0007548594074353652,6 ensemble_learning,44,0.0007548594074353652,17 distributional_word,44,0.0007548594074353652,19 pearson_correlation,44,0.0007548594074353652,19 packed,44,0.0007548594074353652,6 ehrs,44,0.0007548594074353652,4 unsupervised_technique,44,0.0007548594074353652,22 specific_aspect,44,0.0007548594074353652,15 linguistic_complexity,44,0.0007548594074353652,21 larger_corpus,44,0.0007548594074353652,13 different_component,44,0.0007548594074353652,19