From 490afdddd1ded101860a8a9857a16f206bffc881 Mon Sep 17 00:00:00 2001 From: Joshua Peek Date: Mon, 10 Jun 2013 10:37:55 -0500 Subject: [PATCH] some air --- lib/linguist/classifier.rb | 20 ++++++++++---------- 1 file changed, 10 insertions(+), 10 deletions(-) diff --git a/lib/linguist/classifier.rb b/lib/linguist/classifier.rb index 09efce033a..f9ba6e8a23 100644 --- a/lib/linguist/classifier.rb +++ b/lib/linguist/classifier.rb @@ -132,7 +132,7 @@ def language_probability(language) private def verbosity - @verbosity ||= (ENV['LINGUIST_DEBUG']||0).to_i + @verbosity ||= (ENV['LINGUIST_DEBUG'] || 0).to_i end # Internal: show a table of probabilities for each pair. @@ -146,19 +146,19 @@ def verbosity # appear in one language vs. the least-likely language. Dashes # indicate the least-likely language (and zero points) for each token. def dump_all_tokens(tokens, languages) - maxlen = tokens.map{|tok| tok.size}.max + maxlen = tokens.map { |tok| tok.size }.max printf "%#{maxlen}s", "" - puts " #" + languages.map{|lang| sprintf("%10s", lang)}.join + puts " #" + languages.map { |lang| sprintf("%10s", lang) }.join tokmap = Hash.new(0) - tokens.each{|tok| tokmap[tok] += 1} - tokmap.sort.each{|tok, count| - arr = languages.map{|lang| [lang, token_probability(tok, lang)] } - min = arr.map{|a,b| b}.min + tokens.each { |tok| tokmap[tok] += 1 } + tokmap.sort.each { |tok, count| + arr = languages.map { |lang| [lang, token_probability(tok, lang)] } + min = arr.map { |a,b| b }.min minlog = Math.log(min) - if !arr.inject(true) {|result, n| result && n[1] == arr[0][1]} # if not all the same + if !arr.inject(true) { |result, n| result && n[1] == arr[0][1] } printf "%#{maxlen}s%5d", tok, count - puts arr.map{|ent| - ent[1] == min ? " -" : sprintf("%10.3f", count*(Math.log(ent[1])-minlog)) + puts arr.map { |ent| + ent[1] == min ? " -" : sprintf("%10.3f", count * (Math.log(ent[1]) - minlog)) }.join end }