readabilite: increase penalty for high link density
This commit is contained in:
parent
94097f481a
commit
b5b355aa6e
@@ -125,7 +125,7 @@ def score_node(node):
|
||||
|
||||
if wc != 0:
|
||||
wca = count_words(' '.join([x.text_content() for x in node.findall('.//a')]))
|
||||
- score = score * ( 1 - float(wca)/wc )
|
||||
+ score = score * ( 1 - 2 * float(wca)/wc )
|
||||
|
||||
return score
|
||||
|
||||
|
Loading…
x
Reference in New Issue
Block a user