X-Git-Url: https://git.netwichtig.de/gitweb/?a=blobdiff_plain;f=data%2Frbot%2Fplugins%2Ftranslator.rb;h=41f4cf8e8ea73670eaef192e3d95380032847d5e;hb=8b811d21babf8f9e5a10a953b595d55ebd08820d;hp=a32ea16dfa059d56789a83ae0f4942f4b54c1e08;hpb=834758616bf9e872c1a93dde83906cae9f893ee6;p=user%2Fhenk%2Fcode%2Fruby%2Frbot.git diff --git a/data/rbot/plugins/translator.rb b/data/rbot/plugins/translator.rb index a32ea16d..41f4cf8e 100644 --- a/data/rbot/plugins/translator.rb +++ b/data/rbot/plugins/translator.rb @@ -34,12 +34,12 @@ class Translator attr_reader :directions, :cache - def initialize(directions, cache={}) + def initialize(directions, cache={}, bot) @directions = directions @cache = cache + @bot = bot end - # whether the translator supports this direction def support?(from, to) from != to && @directions[from].include?(to) @@ -103,163 +103,29 @@ class Translator end end +class YandexTranslator < Translator + INFO = 'Yandex Translator ' + LANGUAGES = %w{ar az be bg ca cs da de el en es et fi fr he hr hu hy it ka lt lv mk nl no pl pt ro ru sk sl sq sr sv tr uk} -class NiftyTranslator < Translator - INFO = '@nifty Translation ' - - def initialize(cache={}) - require 'mechanize' - super(Translator::Direction.all_from_to(%w[ja en zh_CN ko], %w[ja]), cache) - @form = WWW::Mechanize.new. - get('http://nifty.amikai.com/amitext/indexUTF8.jsp'). - forms_with(:name => 'translateForm').last - end - - def do_translate(text, from, to) - @radio = @form.radiobuttons_with(:name => 'langpair').first - @radio.value = "#{from},#{to}".upcase - @radio.check - @form.fields_with(:name => 'sourceText').last.value = text - - @form.submit(@form.buttons_with(:name => 'translate').last). - forms_with(:name => 'translateForm').last.fields_with(:name => 'translatedText').last.value - end -end - - -class ExciteTranslator < Translator - INFO = 'Excite.jp Translation ' - - def initialize(cache={}) - require 'mechanize' - require 'iconv' - - super(Translator::Direction.all_from_to(%w[ja en zh_CN zh_TW ko], %w[ja]), cache) - - @forms = Hash.new do |h, k| - case k - when 'en' - h[k] = open_form('english') - when 'zh_CN', 'zh_TW' - # this way we don't need to fetch the same page twice - h['zh_CN'] = h['zh_TW'] = open_form('chinese') - when 'ko' - h[k] = open_form('korean') - end - end - end - - def open_form(name) - WWW::Mechanize.new.get("http://www.excite.co.jp/world/#{name}"). - forms_with(:name => 'world').first - end - - def do_translate(text, from, to) - non_ja_language = from != 'ja' ? from : to - form = @forms[non_ja_language] - - if non_ja_language =~ /zh_(CN|TW)/ - form_with_fields(:name => 'wb_lp').first.value = "#{from}#{to}".sub(/_(?:CN|TW)/, '').upcase - form_with_fields(:name => 'big5').first.value = ($1 == 'TW' ? 'yes' : 'no') - else - # the en<->ja page is in Shift_JIS while other pages are UTF-8 - text = Iconv.iconv('Shift_JIS', 'UTF-8', text) if non_ja_language == 'en' - form.fields_with(:name => 'wb_lp').first.value = "#{from}#{to}".upcase - end - form.fields_with(:name => 'before').first.value = text - result = form.submit.forms_with(:name => 'world').first.fields_with(:name => 'after').first.value - # the en<->ja page is in Shift_JIS while other pages are UTF-8 - if non_ja_language == 'en' - Iconv.iconv('UTF-8', 'Shift_JIS', result) - else - result - end - - end -end - - -class GoogleTranslator < Translator - INFO = 'Google Translate ' - - def initialize(cache={}) - require 'mechanize' - load_form! - - # we can probably safely assume that google translate is able to translate from - # any language in the source lang drop down list to any language in the target one - # so we create the language pairs based on that assumption - sl = @source_list.options.map { |o| o.value.sub('-', '_') } - tl = @target_list.options.map { |o| o.value.sub('-', '_') } - super(Translator::Direction.all_from_to(tl, sl), cache) - end - - def load_form! - agent = WWW::Mechanize.new - # without faking the user agent, Google Translate will serve non-UTF-8 text - agent.user_agent_alias = 'Linux Konqueror' - @form = agent.get('http://www.google.com/translate_t'). - forms_with(:action => '/translate_t').first - @source_list = @form.fields_with(:name => 'sl').last - @target_list = @form.fields_with(:name => 'tl').last - end - - def do_translate(text, from, to) - load_form! - - @source_list.value = from.sub('_', '-') - @target_list.value = to.sub('_', '-') - @form.fields_with(:name => 'text').last.value = text - @form.submit.parser.search('div#result_box').inner_html - end -end - - -class BabelfishTranslator < Translator - INFO = 'AltaVista Babel Fish Translation ' - - def initialize(cache) - require 'mechanize' - - @form = WWW::Mechanize.new.get('http://babelfish.altavista.com/babelfish/'). - forms_with(:name => 'frmTrText').first - @lang_list = @form.fields_with(:name => 'lp').first - language_pairs = @lang_list.options.map {|o| o.value.split('_')}. - reject {|p| p.empty?} - super(Translator::Direction.pairs(language_pairs), cache) - end - - def do_translate(text, from, to) - if @form.fields_with(:name => 'trtext').empty? - @form.add_field!('trtext', text) - else - @form.fields_with(:name => 'trtext').first.value = text - end - @lang_list.value = "#{from}_#{to}" - @form.submit.parser.search("div[@id='result']/div[@style]").inner_html - end -end - -class WorldlingoTranslator < Translator - INFO = 'WorldLingo Free Online Translator ' - - LANGUAGES = %w[en fr de it pt es ru nl el sv ar ja ko zh_CN zh_TW] - def initialize(cache) + URL = 'https://translate.yandex.net/api/v1.5/tr.json/translate?key=%s&lang=%s-%s&text=%s' + KEY = 'trnsl.1.1.20140326T031210Z.1e298c8adb4058ed.d93278fea8d79e0a0ba76b6ab4bfbf6ac43ada72' + def initialize(cache, bot) require 'uri' - super(Translator::Direction.all_to_all(LANGUAGES), cache) + require 'json' + super(Translator::Direction.all_to_all(LANGUAGES), cache, bot) end def translate(text, from, to) - response = Irc::Utils.bot.httputil.get_response(URI.escape( - "http://www.worldlingo.com/SEfpX0LV2xIxsIIELJ,2E5nOlz5RArCY,/texttranslate?wl_srcenc=utf-8&wl_trgenc=utf-8&wl_text=#{text}&wl_srclang=#{from.upcase}&wl_trglang=#{to.upcase}")) - # WorldLingo seems to respond an XML when error occurs - case response['Content-Type'] - when %r'text/plain' - response.body - else + res = @bot.httputil.get_response(URL % [KEY, from, to, URI.escape(text)]) + res = JSON.parse(res.body) + + if res['code'] != 200 raise Translator::NoTranslationError + else + res['text'].join(' ') end end + end class TranslatorPlugin < Plugin @@ -271,25 +137,18 @@ class TranslatorPlugin < Plugin :desc => _("Default destination language to be used with translate command")) TRANSLATORS = { - 'nifty' => NiftyTranslator, - 'excite' => ExciteTranslator, - 'google_translate' => GoogleTranslator, - 'babelfish' => BabelfishTranslator, - 'worldlingo' => WorldlingoTranslator, + 'yandex' => YandexTranslator, } def initialize super - + @failed_translators = [] @translators = {} TRANSLATORS.each_pair do |name, c| - begin - @translators[name] = c.new(@registry.sub_registry(name)) + watch_for_fail(name) do + @translators[name] = c.new(@registry.sub_registry(name), @bot) map "#{name} :from :to *phrase", :action => :cmd_translate, :thread => true - rescue Exception - warning _("Translator %{name} cannot be used: %{reason}") % - {:name => name, :reason => $!} end end @@ -301,20 +160,64 @@ class TranslatorPlugin < Plugin update_default end + def watch_for_fail(name, &block) + begin + yield + rescue Exception + debug 'Translator error: '+$!.to_s + debug $@.join("\n") + @failed_translators << { :name => name, :reason => $!.to_s } + + warning _("Translator %{name} cannot be used: %{reason}") % + {:name => name, :reason => $!} + map "#{name} [*args]", :action => :failed_translator, + :defaults => {:name => name, :reason => $!} + end + end + + def failed_translator(m, params) + m.reply _("Translator %{name} cannot be used: %{reason}") % + {:name => params[:name], :reason => params[:reason]} + end + def help(plugin, topic=nil) - if @translators.has_key?(plugin) - translator = @translators[plugin] - _('%{translator} => Look up phrase using %{info}, supported from -> to languages: %{directions}') % { - :translator => plugin, - :info => translator.class::INFO, - :directions => translator.directions.map do |source, targets| - _('%{source} -> %{targets}') % - {:source => source, :targets => targets.to_a.join(', ')} - end.join(' | ') - } + case (topic.intern rescue nil) + when :failed + unless @failed_translators.empty? + failed_list = @failed_translators.map { |t| _("%{bold}%{translator}%{bold}: %{reason}") % { + :translator => t[:name], + :reason => t[:reason], + :bold => Bold + }} + + _("Failed translators: %{list}") % { :list => failed_list.join(", ") } + else + _("None of the translators failed") + end else - _('Command: , where is one of: %{translators}. If "translator" is used in place of the translator name, the first translator in translator.default_list which supports the specified direction will be picked automatically. Use "help " to look up supported from and to languages') % - {:translators => @translators.keys.join(', ')} + if @translators.has_key?(plugin) + translator = @translators[plugin] + _('%{translator} => Look up phrase using %{info}, supported from -> to languages: %{directions}') % { + :translator => plugin, + :info => translator.class::INFO, + :directions => translator.directions.map do |source, targets| + _('%{source} -> %{targets}') % + {:source => source, :targets => targets.to_a.join(', ')} + end.join(' | ') + } + else + help_str = _('Command: , where is one of: %{translators}. If "translator" is used in place of the translator name, the first translator in translator.default_list which supports the specified direction will be picked automatically. Use "help " to look up supported from and to languages') % + {:translators => @translators.keys.join(', ')} + + help_str << "\n" + _("%{bold}Note%{bold}: %{failed_amt} translators failed, see %{reverse}%{prefix}help translate failed%{reverse} for details") % { + :failed_amt => @failed_translators.size, + :bold => Bold, + :reverse => Reverse, + :prefix => @bot.config['core.address_prefix'].first + } + + help_str + end end end @@ -328,20 +231,13 @@ class TranslatorPlugin < Plugin def cmd_translator(m, params) params[:to] = @bot.config['translator.destination'] if params[:to].nil? - - # Use google translate as translator if source language has not been given - # and auto-detect it - if params[:from].nil? - params[:from] = "auto" - translator = "google_translate" - else - translator = @default_translators.find {|t| @translators[t].support?(params[:from], params[:to])} - end + params[:from] ||= 'auto' + translator = @default_translators.find {|t| @translators[t].support?(params[:from], params[:to])} if translator - cmd_translate m, params.merge({:translator => translator, :show_provider => true}) + cmd_translate m, params.merge({:translator => translator, :show_provider => false}) else - m.reply _('None of the default translators (translator.default_list) supports translating from %{source} to %{target}') % {:source => from, :target => to} + m.reply _('None of the default translators (translator.default_list) supports translating from %{source} to %{target}') % {:source => params[:from], :target => params[:to]} end end @@ -351,35 +247,56 @@ class TranslatorPlugin < Plugin translator = @translators[tname] from, to, phrase = params[:from], params[:to], params[:phrase].to_s if translator - begin - translation = Timeout.timeout(@bot.config['translator.timeout']) do - translator.translate(phrase, from, to) + watch_for_fail(tname) do + begin + translation = Timeout.timeout(@bot.config['translator.timeout']) do + translator.translate(phrase, from, to) + end + m.reply(if params[:show_provider] + _('%{translation} (provided by %{translator})') % + {:translation => translation, :translator => tname.gsub("_", " ")} + else + translation + end) + + rescue Translator::UnsupportedDirectionError + m.reply _("%{translator} doesn't support translating from %{source} to %{target}") % + {:translator => tname, :source => from, :target => to} + rescue Translator::NoTranslationError + m.reply _('%{translator} failed to provide a translation') % + {:translator => tname} + rescue Timeout::Error + m.reply _('The translator timed out') end - m.reply(if params[:show_provider] - _('%{translation} (provided by %{translator})') % - {:translation => translation, :translator => tname.gsub("_", " ")} - else - translation - end) - - rescue Translator::UnsupportedDirectionError - m.reply _("%{translator} doesn't support translating from %{source} to %{target}") % - {:translator => tname, :source => from, :target => to} - rescue Translator::NoTranslationError - m.reply _('%{translator} failed to provide a translation') % - {:translator => tname} - rescue Timeout::Error - m.reply _('The translator timed out') end else m.reply _('No translator called %{name}') % {:name => tname} end end + + # URL translation has nothing to do with Translators so let's make it + # separate, and Google exclusive for now + def cmd_translate_url(m, params) + params[:to] = @bot.config['translator.destination'] if params[:to].nil? + params[:from] ||= 'auto' + + translate_url = "http://translate.google.com/translate?sl=%{from}&tl=%{to}&u=%{url}" % { + :from => params[:from], + :to => params[:to], + :url => CGI.escape(params[:url].to_s) + } + + m.reply(translate_url) + end end plugin = TranslatorPlugin.new req = Hash[*%w(from to).map { |e| [e.to_sym, /#{plugin.languages.join("|")}/] }.flatten] +plugin.map 'translate [:from] [:to] :url', + :action => :cmd_translate_url, :requirements => req.merge(:url => %r{^https?://[^\s]*}) +plugin.map 'translator [:from] [:to] :url', + :action => :cmd_translate_url, :requirements => req.merge(:url => %r{^https?://[^\s]*}) plugin.map 'translate [:from] [:to] *phrase', :action => :cmd_translator, :thread => true, :requirements => req plugin.map 'translator [:from] [:to] *phrase',