collocatordb: use Evert's (2004) ll-function instead of Dunning's (1993)
diff --git a/templates/index.html.ep b/templates/index.html.ep
index 76cc8c3..f03db29 100644
--- a/templates/index.html.ep
+++ b/templates/index.html.ep
@@ -43,6 +43,7 @@
function () {
$("#lfmd_tt").attr("title",$("#lfmd_ttt").html());
$("#npmi_tt").attr("title",$("#npmi_ttt").html());
+ $("#ll_tt").attr("title",$("#ll_ttt").html());
}
);
});
@@ -711,6 +712,7 @@
<body onload="onload()">
<div style="display:none;" id="lfmd_ttt">PMI cubed [1], also called log-frequency biased mutual dependency [2]: $$\text{PMI}^3=\text{LFMD}=log_2\frac{p^3(w_1,w_2)}{p(w_1) p(w_2)}$$<p class="citation">[1] Daille, B. (1994): <a href="http://www.bdaille.com/index.php?option=com_docman&task=doc_download&gid=8&Itemid=">Approche mixte pour l’extraction automatique de terminologie: statistiques lexicales et filtres linguistiques</a>. PhD thesis, Université Paris 7.</p><p class="citation">[2] Thanopoulos, A., Fakotakis, N., Kokkinakis, G. (2002): <a href="http://citeseerx.ist.psu.edu/viewdoc/download?doi=10.1.1.11.8101&rep=rep1&type=pdf">Comparative evaluation of collocation extraction metrics</a>. In: Proc. of LREC 2002: 620–625.</p></div>
<div style="display:none;" id="npmi_ttt">Normalized pointwise mutual information: $$\frac{log_2\frac{p(w_1,w_2)}{p(w_1)p(w_2)}}{-log_2(p(w_1,w_2))}$$<p class="citation">Bouma, Gerlof (2009): <a href="https://svn.spraakdata.gu.se/repos/gerlof/pub/www/Docs/npmi-pfd.pdf">Normalized (pointwise) mutual information in collocation extraction</a>. In Proceedings of GSCL.</p></div>
+ <div style="display:none;" id="ll_ttt">Log-likelihood: $$2\cdot\sum_{ij}O_{ij}\cdot\log\frac{O_{ij}}{E_{ij}}$$<p class="citation">Evert, Stefan (2004): <a href="http://purl.org/stefan.evert/PUB/Evert2004phd.pdf">The Statistics of Word Cooccurrences: Word Pairs and Collocations</a>. PhD dissertation, IMS, University of Stuttgart. Published in 2005, URN urn:nbn:de:bsz:93-opus-23714.</p></div>
<div id="header">
<div id="pagetitle">
<h1>DeReKoVecs</h1>
@@ -886,9 +888,9 @@
<thead>
% if($collocators) {
<tr>
- <th>LLR</th>
- <th id="lfmd_tt">PMI³</th>
<th id="npmi_tt">nPMI</th>
+ <th id="ll_tt">LL</th>
+ <th id="lfmd_tt">MI³</th>
<th title="PMI³ restricted to left neighbour">l-PMI³</th>
<th title="PMI³ restricted to right neighbour">r-PMI³</th>
<th title="nPMI restricted to left neighbour">l-nPMI</th>