% hep_vs_acl.tex (614 B)

  % Side-by-side summary of the two corpora (high-energy physics vs.
  % computational linguistics): cohort size, corpus size, vocabulary,
  % number of topics, time windows and author-selection settings.
  %
  % The horizontal rules (\toprule, \midrule, \bottomrule) are booktabs
  % commands. booktabs rules carry extra vertical padding, so vertical
  % column rules would be broken at every rule; the column spec therefore
  % uses none. @{} trims the outer padding so the rules end flush with
  % the text of the first and last columns.
  \begin{table}
    \centering % centre the tabular without the extra vertical space of a center environment
    \caption{Comparison of the high-energy physics corpus and the computational linguistics corpus.}
    \label{table:corpora} % kept after \caption so that \ref yields the table number
    \begin{tabular}{@{}lcc@{}}
      \toprule
      Cohort & High-energy physics & Computational linguistics \\
      \midrule
      Cohort size ($N$) & $2\,195$ & $578$ \\
      Number of abstracts ($D$) & $186\,162$ & $58\,289$ \\
      Vocabulary size ($V$) & $4\,751$ & $5\,966$ \\
      Valid topics ($K$) & $16$ & $14$ \\
      Initial time period & 2000--2009 & 2002--2011 \\
      Late time period & 2015--2019 & 2012--2022 \\
      Author disambiguation & Yes & No \\
      Minimum publications & $5$ & $3$ \\
      \bottomrule
    \end{tabular}
  \end{table}