|
1 | | -,domain,type,data size,avg word number,avg vocabulary size,avg keyword number,avg keyword number (tractable only),avg keyword number (tractable only and multiwords),avg vocabulary diversity |
2 | | -citeulike180,BI,Full,183,3799.2677595628415,1023.1857923497267,16.469945355191257,7.775956284153006,1.0546448087431695,0.2693113139431527 |
3 | | -fao30,AG,Full,30,3672.7,983.3666666666667,31.933333333333334,15.9,5.466666666666667,0.26775033808006826 |
4 | | -fao780,AG,Full,779,3567.3478818998715,942.2387676508343,7.961489088575096,4.193838254172015,1.5571245186136071,0.26412864650279744 |
5 | | -Inspec,CS,Abst,2000,85.3395,53.0095,13.4925,5.836,4.811,0.6211601895956738 |
6 | | -kdd,CS,Abst,755,52.688741721854306,33.71920529801324,4.079470198675497,0.7456953642384105,0.5576158940397351,0.6399698340874811 |
7 | | -Krapivin2009,CS,Full,2304,5451.236545138889,902.3663194444445,5.329861111111111,3.8094618055555554,2.9479166666666665,0.16553424383117712 |
8 | | -Nguyen2007,-,Full,209,3656.186602870813,752.933014354067,10.736842105263158,7.177033492822966,4.760765550239235,0.20593396785680168 |
9 | | -PubMed,BM,Full,500,2958.59,682.442,16.142,5.682,1.512,0.23066460712704362 |
10 | | -Schutz2008,BM,Full,1231,3207.568643379366,1101.2908204711616,43.56539398862713,28.499593826157597,10.148659626320065,0.34334131016784275 |
11 | | -SemEval2010,CS,Full,243,6221.6378600823045,1037.1851851851852,15.209876543209877,11.567901234567902,8.77366255144033,0.16670613245423843 |
12 | | -SemEval2017,-,Para,493,126.50507099391481,77.13590263691684,17.11764705882353,9.27789046653144,6.320486815415822,0.6097455385059406 |
13 | | -theses100,-,Full,100,3635.28,984.87,6.78,2.39,0.75,0.2709199841552783 |
14 | | -wiki20,CS,Report,20,4489.65,923.95,35.15,12.75,6.65,0.20579555199180338 |
15 | | -www,CS,Abst,1330,57.50375939849624,36.47744360902256,4.8007518796992485,0.8842105263157894,0.5428571428571428,0.6343488493723849 |
16 | | -500N-KPCrowd-v1.1,-,News,500,269.696,144.12,47.978,16.49,3.74,0.5343794494542002 |
| 1 | +,500N-KPCrowd-v1.1,Inspec,Krapivin2009,Nguyen2007,PubMed,Schutz2008,SemEval2010,SemEval2017,citeulike180,fao30,fao780,theses100,kdd,wiki20,www |
| 2 | +Data size,500,2000,2304,209,500,1231,243,493,183,30,779,100,755,20,1330 |
| 3 | +Domain,-,CS,CS,-,BM,BM,CS,-,BI,AG,AG,-,CS,CS,CS |
| 4 | +Type,News,Abst,Full,Full,Full,Full,Full,Para,Full,Full,Full,Full,Abst,Report,Abst |
| 5 | +Avg phrase,77.384,26.967,814.49609375,617.9856459330143,566.298,630.2558895207148,897.8312757201646,39.699797160243406,822.2677595628415,774.0,776.2708600770218,728.36,15.954966887417218,816.7,17.9 |
| 6 | +Std phrase,62.00755231421413,12.314946650310784,252.14317468513156,113.86454129909198,196.48920885381975,287.6595497592065,207.70384981408176,12.94657221855953,173.00291983671727,93.19942775217739,147.1711422801908,131.26046777305035,17.04914862119257,322.3617688250268,16.517061126928027 |
| 7 | +Avg word,447.302,137.762,9130.471788194445,5931.397129186603,4461.298,4200.692120227457,9740.218106995884,198.01825557809332,5521.131147540984,5437.833333333333,5590.523748395379,5396.72,81.93774834437086,7145.55,90.62781954887218 |
| 8 | +Std word,476.7283406679322,66.55563354067026,2524.422828713077,1023.0662095302862,1626.42691849219,2251.1355744927955,2443.441728214183,60.297350338210734,978.82878840376,927.5287626567466,902.3992981704127,958.4219747063399,93.01618511994454,3609.7554692111767,89.12352992882947 |
| 9 | +Avg vocab,197.14,76.232,1081.1414930555557,908.4784688995215,799.822,1217.1722177091794,1217.9053497942386,106.12576064908723,1171.120218579235,1125.0666666666666,1087.3196405648266,1134.03,48.10728476821192,1088.4,52.74661654135338 |
| 10 | +Std vocab,140.59065545049575,28.59461795513273,256.2237773449945,142.4035332525959,223.72044679912463,468.37048133960053,209.0611466958877,27.475683619235635,202.9375439628631,157.13941439230183,210.26987796235758,192.34289459192405,45.666634100960046,295.40470544661264,43.33231971821068 |
| 11 | +Avg keyword,47.978,13.4925,5.329861111111111,10.736842105263158,16.142,43.56539398862713,15.209876543209877,17.11764705882353,16.469945355191257,31.933333333333334,7.961489088575096,6.78,4.079470198675497,35.15,4.8007518796992485 |
| 12 | +Avg keyword (in candidate),16.49,5.836,3.8094618055555554,7.177033492822966,5.682,28.499593826157597,11.567901234567902,9.27789046653144,7.775956284153006,15.9,4.193838254172015,2.39,0.7456953642384105,12.75,0.8842105263157894 |
| 13 | +Std keyword (in candidate),11.971545430728654,3.540353654650908,2.146071359435905,4.258652751428725,2.6714932154134297,10.253637574384731,3.347887749806898,4.866770425384573,3.413100931015965,5.61159513863928,2.3493725225755795,1.5420440979427268,0.9272715155165945,3.1760824926314495,0.9818535567010371 |
| 14 | +Avg keyword (in candidate & multi),3.74,4.811,2.9479166666666665,4.760765550239235,1.512,10.148659626320065,8.77366255144033,6.320486815415822,1.0546448087431695,5.466666666666667,1.5571245186136071,0.75,0.5576158940397351,6.65,0.5428571428571428 |
| 15 | +Std keyword (in candidate & multi),3.778941650780024,3.1664300087006554,1.9007205779066374,3.2148268033683105,1.3303593499502333,4.928390150828587,3.285177736220138,3.4309659794374823,1.0012384460016208,2.6042699979499475,1.34546638502203,0.8170067319184096,0.763612630732103,2.650943228362313,0.7499659856232418 |
| 16 | +Vocab diversity,2.268956071827128,1.8071413579599118,8.445214476404585,6.528935282716778,5.577863574645359,3.4511896173028935,7.997516480768776,1.8658830275229359,4.714401698434547,4.833343209291301,5.1415642096663365,4.758886449212102,1.7032295366317007,6.565187431091511,1.7181731358601913 |
0 commit comments