diff options
Diffstat (limited to 'scripts/romaji.pl')
-rw-r--r-- | scripts/romaji.pl | 273 |
1 files changed, 273 insertions, 0 deletions
diff --git a/scripts/romaji.pl b/scripts/romaji.pl new file mode 100644 index 0000000..7529ddd --- /dev/null +++ b/scripts/romaji.pl @@ -0,0 +1,273 @@ +#!/usr/bin/perl -w +# +# Copyright (c) 2002 Victor Ivanov <v0rbiz@yahoo.com> +# All rights reserved. +# +# Redistribution and use in source and binary forms, with or without +# modification, are permitted provided that the following conditions +# are met: +# 1. Redistributions of source code must retain the above copyright +# notice, this list of conditions and the following disclaimer. +# 2. Redistributions in binary form must reproduce the above copyright +# notice, this list of conditions and the following disclaimer in the +# documentation and/or other materials provided with the distribution. +# +# THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND +# ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE +# IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE +# ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE +# FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL +# DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS +# OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) +# HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT +# LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY +# OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF +# SUCH DAMAGE. +# + +use strict; +use vars qw($VERSION %IRSSI); + +$VERSION = '1.0b3'; +%IRSSI = ( + authors => 'Victor Ivanov', + contact => 'v0rbiz@yahoo.com', + name => 'romaji', + description => 'translates romaji to hiragana or katakana in text enclosed in ^R', + license => 'BSD 2-clause', + url => 'http://irssi.org/scripts/' +); + + +my(%hira) = ( + "a" => "あ", "i" => "い", "u" => "う", "e" => "え", "o" => "お", + "ka" => "か", "ki" => "き", "ku" => "く", "ke" => "け", "ko" => "こ", + "sa" => "さ", "shi" => "し", "su" => "す", "se" => "せ", "so" => "そ", + "ta" => "た", "chi" => "ち", "tsu" => "つ", "te" => "て", "to" => "と", + "na" => "な", "ni" => "に", "nu" => "ぬ", "ne" => "ね", "no" => "の", + "ha" => "は", "hi" => "ひ", "hu" => "ふ", "he" => "へ", "ho" => "ほ", "fu" => "ふ", + "ma" => "ま", "mi" => "み", "mu" => "む", "me" => "め", "mo" => "も", + "ya" => "や", "yu" => "ゆ", "yo" => "よ", + "ra" => "ら", "ri" => "り", "ru" => "る", "re" => "れ", "ro" => "ろ", + "wa" => "わ", "wi" => "ゐ", "we" => "ゑ", "wo" => "を", + "n" => "ん", + "m" => "ん", + + "ga" => "が", "gi" => "ぎ", "gu" => "ぐ", "ge" => "げ", "go" => "ご", + "za" => "ざ", "ji" => "じ", "zu" => "ず", "ze" => "ぜ", "zo" => "ぞ", + "da" => "だ", "dzi" => "ぢ", "dzu" => "づ", "de" => "で", "do" => "ど", + "ba" => "ば", "bi" => "び", "bu" => "ぶ", "be" => "べ", "bo" => "ぼ", + "pa" => "ぱ", "pi" => "ぴ", "pu" => "ぷ", "pe" => "ぺ", "po" => "ぽ", + + "fa" => "ふぁ", "fi" => "ふぃ", "fe" => "ふぇ", "fo" => "ふぉ", + "di" => "でぃ", + + "kya" => "きゃ", "kyu" => "きゅ", "kyo" => "きょ", + "sha" => "しゃ", "shu" => "しゅ", "sho" => "しょ", + "cha" => "ちゃ", "chu" => "ちゅ", "cho" => "ちょ", + "nya" => "にゃ", "nyu" => "にゅ", "nyo" => "にょ", + "hya" => "ひゃ", "hyu" => "ひゅ", "hyo" => "ひょ", + "mya" => "みゃ", "myu" => "みゅ", "myo" => "みょ", + "rya" => "りゃ", "ryu" => "りゅ", "ryo" => "りょ", + "gya" => "ぎゃ", "gyu" => "ぎゅ", "gyo" => "ぎょ", + "ja" => "じゃ", "ju" => "じゅ", "jo" => "じょ", + "jya" => "じゃ", "jyu" => "じゅ", "jyo" => "じょ", + "dza" => "ぢゃ", "dju" => "ぢゅ", "dzo" => "ぢょ", + "dja" => "ぢゃ", "djo" => "ぢょ", + "bya" => "びゃ", "byu" => "びゅ", "byo" => "びょ", + "pya" => "ぴゃ", "pyu" => "ぴゅ", "pyo" => "ぴょ", + + "TSU" => "っ" +); + +my(%kata) = ( + "a" => "ア", "i" => "イ", "u" => "ウ", "e" => "エ", "o" => "オ", + "ka" => "カ", "ki" => "キ", "ku" => "ク", "ke" => "ケ", "ko" => "コ", + "sa" => "サ", "shi" => "シ", "su" => "ス", "se" => "セ", "so" => "ソ", + "ta" => "タ", "chi" => "チ", "tsu" => "ツ", "te" => "テ", "to" => "ト", + "na" => "ナ", "ni" => "ニ", "nu" => "ヌ", "ne" => "ネ", "no" => "ノ", + "ha" => "ハ", "hi" => "ヒ", "hu" => "フ", "he" => "ヘ", "ho" => "ホ", "fu" => "フ", + "ma" => "マ", "mi" => "ミ", "mu" => "ム", "me" => "メ", "mo" => "モ", + "ya" => "ヤ", "yu" => "ユ", "yo" => "ヨ", "ye" => "エ", + "ra" => "ラ", "ri" => "リ", "ru" => "ル", "re" => "レ", "ro" => "ロ", + "wa" => "ワ", "wi" => "ヰ", "we" => "ヱ", "wo" => "ヲ", + "n" => "ン", + "m" => "ン", + + "ga" => "ガ", "gi" => "ギ", "gu" => "グ", "ge" => "ゲ", "go" => "ゴ", + "za" => "ザ", "ji" => "ジ", "zu" => "ズ", "ze" => "ゼ", "zo" => "ゾ", + "da" => "ダ", "dzi" => "ヂ", "dzu" => "ヅ", "de" => "デ", "do" => "ド", + "ba" => "バ", "bi" => "ビ", "bu" => "ブ", "be" => "ベ", "bo" => "ボ", + "pa" => "パ", "pi" => "ピ", "pu" => "プ", "pe" => "ペ", "po" => "ポ", + + "va" => "ヴァ", "vi" => "ヴィ", "vu" => "ヴ", "ve" => "ヴェ", "vo" => "ヴォ", + "fa" => "ファ", "fi" => "フィ", "fe" => "フェ", "fo" => "フォ", + "di" => "ディ", + + "dje" => "ヂェ", "dze" => "ヂェ", + + "kya" => "キャ", "kyu" => "キュ", "kyo" => "キョ", + "sha" => "シャ", "shu" => "シュ", "sho" => "ショ", + "cha" => "チャ", "chu" => "チュ", "cho" => "チョ", + "nya" => "ニャ", "nyu" => "ニュ", "nyo" => "ニョ", + "hya" => "ヒャ", "hyu" => "ヒュ", "hyo" => "ヒョ", + "mya" => "ミャ", "myu" => "ミュ", "myo" => "ミョ", + "rya" => "リャ", "ryu" => "リュ", "ryo" => "リョ", + "gya" => "ギャ", "gyu" => "ギュ", "gyo" => "ギョ", + "ja" => "ジャ", "ju" => "ジュ", "jo" => "ジョ", + "jya" => "ジャ", "jyu" => "ジュ", "jyo" => "ジョ", + "dza" => "ヂャ", "dju" => "ヂュ", "dzo" => "ヂョ", + "dja" => "ヂャ", "djo" => "ヂョ", + "bya" => "ビャ", "byu" => "ビュ", "byo" => "ビョ", + "pya" => "ピャ", "pyu" => "ピュ", "pyo" => "ピョ", + + "TSU" => "ッ" +); + +my(%comn) = ( + "-" => "ー", + "." => "。", + "," => "、", + "!" => "!", + "?" => "?", + "~" => "〜", + " " => " ", + "[" => "〔", "]" => "〕", + "{" => "【", "}" => "】", + "(" => "(", ")" => ")", + "0" => "0", "1" => "1", "2" => "2", "3" => "3", "4" => "4", + "5" => "5", "6" => "6", "7" => "7", "8" => "8", "9" => "9", + "*" => "★", # ☆ is uglier :P + # where to put ♪ ? +); + +my(@squot) = ( "「", "」" ); +my($squoti) = 0; +my(@dquot) = ( "『", "』" ); +my($dquoti) = 0; + +sub r2hk ($$) { + my($str) = ""; + my($pos) = 0; + my($inlen) = length($_[0]); + my($last) = ""; + my($href) = $_[1]; + my($inp) = lc($_[0]); + + while ($pos < $inlen) { + my($len); + my($p) = substr($inp, $pos, 3); + my($h) = ${$href}{$p}; + + # this could be done with another cycle, but this way's faster i guess + if ($h) { + $len = 3; + } else { + $p = substr($inp, $pos, 2); + $h = ${$href}{$p}; + if ($h) { + $len = 2; + } else { + $p = substr($inp, $pos, 1); + $h = ${$href}{$p}; + if (!$h) { + if ($p eq "'") { + $h = $squot[$squoti]; + $squoti = 1 - $squoti; + } elsif ($p eq "\"") { + $h = $dquot[$dquoti]; + $dquoti = 1 - $dquoti; + } else { + $h = $p; + } + } + $len = 1; + } + } + + if ($h ne $p) { + if ($last) { + if ($last eq substr($p, 0, 1)) { + $str .= ${$href}{"TSU"}; + } else { + $str .= $last; + } + $last = ""; + } + } else { + $str .= $last; + $last = $p; + $h = ""; + } + + $str .= $h; + + $pos += $len; + } + + $str .= $last; + + return $str; +} + +my($lock_ev) = 0; + +sub event1 { + my ($line, $server, $witem) = @_; + + return unless ref $witem; + if ($lock_ev) { return }; + $squoti = 0; + $dquoti = 0; + + my ($str) = ""; + my (@p) = split(//, $line); + my ($i); + my ($inside) = 0; + my ($empty) = 0; + + for ($i = 0; $i <= $#p; $i++) { + if ($inside) { + if (!$p[$i]) { + $empty++; + } else { + if ($empty == 0) { + $str .= r2hk($p[$i], \%hira); + } else { + $str .= r2hk($p[$i], \%kata); + } + $empty = 0; + $inside = 0; + } + } else { + $str .= $p[$i]; + $inside = 1; + } + } + + $lock_ev = 1; + Irssi::signal_emit('send command', $str, $server, $witem); + Irssi::signal_stop(); + $lock_ev = 0; +} + +sub cmd_romaji { + Irssi::print('%BRomaji (with ひらがな and カタカナ support) version '.$VERSION); + Irssi::print('(this is amateur product and comes with %Wno warranty%n, see the source)'); + Irssi::print('Text enclosed in Ctrl-Rs (like this) will be converted to hiragana.'); + Irssi::print('If the opening ^R is doubled, it will be converted to katakana.'); + Irssi::print('Example: genki -> げんき and genki -> ゲンキ'); +} + +Irssi::signal_add('send command', "event1"); +Irssi::command_bind('romaji', \&cmd_romaji); + +Irssi::print('%B'.$IRSSI{name}.' '.$VERSION.'%n loaded; type /romaji for more info'); + +# Add the common hash to hiragana and kitakana hashes +my($k, $v); + +while (($k, $v) = each %comn) { + $hira{$k} = $v; + $kata{$k} = $v; +} |