class NlpToolz::Language

Constants

DataSourceException
HashSet

Load Java classes.

LanIKernel
Request
RequestException
Response

Public Class Methods

get_language(text = nil) click to toggle source
# File lib/nlp_toolz/language.rb, line 21
# Returns the first element of the value produced by +identify+ for +text+
# (+identify+ yields a [language, probability] pair, so this is the language).
#
# @param text [String, nil] the text to inspect
# @return [Object, Integer] the first element of identify's result, or -1
#   when +text+ is nil or empty
def self.get_language(text = nil)
  if text.nil? || text.empty?
    # Sentinel for "nothing to analyse".
    -1
  else
    identify(text).first
  end
end
identify(text) click to toggle source

Identifies the most probable language of the given text and stores that language together with its probability.

# File lib/nlp_toolz/language.rb, line 28
# Runs +text+ through the LanIKernel language identifier and remembers the
# best-scoring language.
#
# Stores the winning pair in the class-level instance variables @lang and
# @probability, and returns whatever +get_most_probability_lang+ returned.
#
# @param text [String] the text to evaluate
# @return [Array, nil] the value returned by +get_most_probability_lang+
def self.identify(text)
  # NOTE(review): an empty language set, modus 0 and reduce = true are passed
  # through to Request unchanged; their exact meaning is defined by the LanI
  # library — confirm against its documentation.
  request = Request.new(text, HashSet.new, 0, true)

  # The property file has to be set before the kernel instance is obtained.
  LanIKernel.propertyFile = File.join(MODELS, 'language', 'lanikernel')
  response = LanIKernel.getInstance.evaluate(request)

  best = get_most_probability_lang(response.getResult.toString)
  @lang, @probability = best
end

Private Class Methods

get_most_probability_lang(result) click to toggle source
# File lib/nlp_toolz/language.rb, line 43
# Parses a result string of the form "{lang=prob, lang=prob, ...}" and returns
# the entry with the highest probability.
#
# The input string is left untouched: the braces are stripped with the
# non-mutating +sub+, because +sub!+ returns nil when nothing was replaced
# (which broke the call chain for input without braces) and also modified the
# caller's string in place (failing on frozen strings).
#
# @param result [String] comma-and-space separated "key=value" pairs,
#   optionally wrapped in one pair of curly braces
# @return [Array(String, Float), nil] the [language, probability] pair with
#   the largest probability, or nil when +result+ contains no entries
def self.get_most_probability_lang(result)
  entries = result.sub('{', '').sub('}', '').split(', ')

  scored = entries.map do |entry|
    fields = entry.split('=')
    # to_f yields 0.0 for a missing or non-numeric value.
    [fields.first, fields.last.to_f]
  end

  scored.max_by(&:last)
end