home *** CD-ROM | disk | FTP | other *** search
/ Source Code 1994 March / Source_Code_CD-ROM_Walnut_Creek_March_1994.iso / compsrcs / misc / volume36 / translit / part10 < prev    next >
Encoding:
Text File  |  1993-03-21  |  29.1 KB  |  604 lines

  1. Newsgroups: comp.sources.misc
  2. From: jkl@osc.edu (Jan Labanowski)
  3. Subject: v36i032:  translit - transliterate foreign alphabets, Part10/10
  4. Message-ID: <1993Mar19.224636.12570@sparky.imd.sterling.com>
  5. X-Md4-Signature: b458c29d412e027cbf355648b00c1308
  6. Date: Fri, 19 Mar 1993 22:46:36 GMT
  7. Approved: kent@sparky.imd.sterling.com
  8.  
  9. Submitted-by: jkl@osc.edu (Jan Labanowski)
  10. Posting-number: Volume 36, Issue 32
  11. Archive-name: translit/part10
  12. Environment: UNIX, MS-DOS, VMS
  13.  
  14. #! /bin/sh
  15. # This is a shell archive.  Remove anything before this line, then feed it
  16. # into a shell via "sh file" or similar.  To overwrite existing files,
  17. # type "sh file -c".
  18. # Contents:  alt-koi8.rus announcement gos-koi8.rus koi8-alt.rus
  19. #   koi8-gos.rus paths.h
  20. # Wrapped by kent@sparky on Fri Mar 19 16:00:17 1993
  21. PATH=/bin:/usr/bin:/usr/ucb:/usr/local/bin:/usr/lbin ; export PATH
  22. echo If this archive is complete, you will see the following message:
  23. echo '          "shar: End of archive 10 (of 10)."'
  24. if test -f 'alt-koi8.rus' -a "${1}" != "-c" ; then 
  25.   echo shar: Will not clobber existing file \"'alt-koi8.rus'\"
  26. else
  27.   echo shar: Extracting \"'alt-koi8.rus'\" \(5082 characters\)
  28.   sed "s/^X//" >'alt-koi8.rus' <<'END_OF_FILE'
  29. X# Jan Labanowski, jkl@osc.edu, Dec. 30, 1992
  30. X# File alt-koi8.rus
  31. X
  32. X# This is a transliteration data file for converting from ALT to KOI8
  33. X# KOI8 is meant to be GOST 19768-74 (as used by RELCOM).
  34. X# To be used with translit.c program by Jan Labanowski
  35. X
  36. X   1            file version number
  37. X
  38. X   "    "      # string delimiters
  39. X   [    ]     # list delimiters
  40. X   {    }      # regular expression delimiters
  41. X
  42. X
  43. X#starting sequence
  44. X""
  45. X
  46. X
  47. X#ending sequence
  48. X""
  49. X
  50. X   0     # number of input SHIFT sequences, only one set of input characters
  51. X
  52. X   0     # number of output SHIFT sequences, only one set of output characters
  53. X  
  54. X# conversion table
  55. X# inp_set_numb  inp_seq        out_set_numb  out_seq
  56. X     0         "\0xf0"              0       "\0xB3"  # capital Yo
  57. X     0         "\0xf1"              0       "\0xA3"  # small yo
  58. X     0         "\0x80"              0       "\0xE1"  # capital A
  59. X     0         "\0x81"              0       "\0xE2"  # capital Be
  60. X     0         "\0x82"              0       "\0xF7"  # capital Ve
  61. X     0         "\0x83"              0       "\0xE7"  # capital Ghe
  62. X     0         "\0x84"              0       "\0xE4"  # capital De
  63. X     0         "\0x85"              0       "\0xE5"  # capital Ie
  64. X     0         "\0x86"              0       "\0xF6"  # capital Zhe
  65. X     0         "\0x87"              0       "\0xFA"  # capital Ze
  66. X     0         "\0x88"              0       "\0xE9"  # capital I
  67. X     0         "\0x89"              0       "\0xEA"  # capital short I
  68. X     0         "\0x8a"              0       "\0xEB"  # capital Ka
  69. X     0         "\0x8b"              0       "\0xEC"  # capital El
  70. X     0         "\0x8c"              0       "\0xED"  # capital Em
  71. X     0         "\0x8d"              0       "\0xEE"  # capital En
  72. X     0         "\0x8e"              0       "\0xEF"  # capital O
  73. X     0         "\0x8f"              0       "\0xF0"  # capital Pe
  74. X     0         "\0x90"              0       "\0xF2"  # capital Er
  75. X     0         "\0x91"              0       "\0xF3"  # capital Es
  76. X     0         "\0x92"              0       "\0xF4"  # capital Te
  77. X     0         "\0x93"              0       "\0xF5"  # capital U
  78. X     0         "\0x94"              0       "\0xE6"  # capital Ef
  79. X     0         "\0x95"              0       "\0xE8"  # capital Kha
  80. X     0         "\0x96"              0       "\0xE3"  # capital Tse
  81. X     0         "\0x97"              0       "\0xFE"  # capital Che
  82. X     0         "\0x98"              0       "\0xFB"  # capital Sha
  83. X     0         "\0x99"              0       "\0xFD"  # capital Shcha
  84. X     0         "\0x9a"              0       "\0xFF"  # capital hard sign (Ier)
  85. X     0         "\0x9b"              0       "\0xF9"  # capital Y (Iery)
  86. X     0         "\0x9c"              0       "\0xF8"  # capital soft sign Ierik
  87. X     0         "\0x9d"              0       "\0xFC"  # capital reverse round E
  88. X     0         "\0x9e"              0       "\0xE0"  # capital Yu
  89. X     0         "\0x9f"              0       "\0xF1"  # capital Ya
  90. X     0         "\0xa0"              0       "\0xC1"  # small a
  91. X     0         "\0xa1"              0       "\0xC2"  # small be
  92. X     0         "\0xa2"              0       "\0xD7"  # small ve
  93. X     0         "\0xa3"              0       "\0xC7"  # small ghe
  94. X     0         "\0xa4"              0       "\0xC4"  # small de
  95. X     0         "\0xa5"              0       "\0xC5"  # small ie
  96. X     0         "\0xa6"              0       "\0xD6"  # small zhe
  97. X     0         "\0xa7"              0       "\0xDA"  # small z
  98. X     0         "\0xa8"              0       "\0xC9"  # small i
  99. X     0         "\0xa9"              0       "\0xCA"  # small short i
  100. X     0         "\0xaa"              0       "\0xCB"  # small ka
  101. X     0         "\0xab"              0       "\0xCC"  # small el
  102. X     0         "\0xac"              0       "\0xCD"  # small em
  103. X     0         "\0xad"              0       "\0xCE"  # small en
  104. X     0         "\0xae"              0       "\0xCF"  # small o
  105. X     0         "\0xaf"              0       "\0xD0"  # small pe
  106. X     0         "\0xe0"              0       "\0xD2"  # small er
  107. X     0         "\0xe1"              0       "\0xD3"  # small es
  108. X     0         "\0xe2"              0       "\0xD4"  # small te
  109. X     0         "\0xe3"              0       "\0xD5"  # small u
  110. X     0         "\0xe4"              0       "\0xC6"  # small ef
  111. X     0         "\0xe5"              0       "\0xC8"  # small kha
  112. X     0         "\0xe6"              0       "\0xC3"  # small tse
  113. X     0         "\0xe7"              0       "\0xDE"  # small che
  114. X     0         "\0xe8"              0       "\0xDB"  # small sha
  115. X     0         "\0xe9"              0       "\0xDD"  # small shcha
  116. X     0         "\0xea"              0       "\0xDF"  # small hard sign (ier)
  117. X     0         "\0xeb"              0       "\0xD9"  # small y (iery)
  118. X     0         "\0xec"              0       "\0xD8"  # small soft sign (ierik)
  119. X     0         "\0xed"              0       "\0xDC"  # small reverse rounded e
  120. X     0         "\0xee"              0       "\0xC0"  # small yu
  121. X     0         "\0xef"              0       "\0xD1"  # small ya
  122. END_OF_FILE
  123.   if test 5082 -ne `wc -c <'alt-koi8.rus'`; then
  124.     echo shar: \"'alt-koi8.rus'\" unpacked with wrong size!
  125.   fi
  126.   # end of 'alt-koi8.rus'
  127. fi
  128. if test -f 'announcement' -a "${1}" != "-c" ; then 
  129.   echo shar: Will not clobber existing file \"'announcement'\"
  130. else
  131.   echo shar: Extracting \"'announcement'\" \(2044 characters\)
  132.   sed "s/^X//" >'announcement' <<'END_OF_FILE'
  133. XTranslit --- general transliteration program is available. It transliterates
  134. Xbetween different alphabet representations of different languages.
  135. X
  136. XIt is frequently necessary to convert from one representation to another
  137. Xrepresentation of the foreign alphabet. E.g., in the Library of Congress
  138. Xtransliteration, the Russian letter sha is transliterated as two Latin
  139. Xletters "sh" while the popular word processors use a code 232 (decimal),
  140. Xthe RELCOM network uses a code 219, and the KOI7 set uses character "["
  141. Xfor the same letter. So if your screen driver, printer, word processor,
  142. Xetc. uses different codes than the text file which you have, you need to
  143. Xtransliterate.
  144. X
  145. XThe TRANSLIT program is a powerful tool for such tasks. It converts an input
  146. Xfile in one representation to the output file in another representation using
  147. Xappropriate, user defined, transliteration table. Transliteration table allows
  148. Xfor very elaborate transliteration tasks and includes provisions for plain
  149. Xcharacter sequences, character lists, regular expressions (flexible matches),
  150. XSHIFT-OUT/IN sequences and more. The program comes with documentation and
  151. Xexamples of popular transliteration schemes. The Russian language serves
  152. Xas an example. Other files will be added with your collaboration.
  153. X
  154. XHow to get the program?
  155. X
  156. XFirst, retrieve file: readme.doc --- it describes the files in the program
  157. Xdistribution and has detailed instructions on how to obtain the program.
  158. X
  159. XVia FTP (if you are on Internet):
  160. X---------------------------------
  161. X  ftp kekule.osc.edu           (or ftp 128.146.36.48)
  162. X  Login: anonymous
  163. X  Password: Your_email_address (Please...)
  164. X  ftp> ascii  
  165. X  ftp> cd pub/russian/translit
  166. X  ftp> get readme.doc
  167. X  ftp> quit
  168. X
  169. XVia E-mail:
  170. X-----------
  171. X  Send message:
  172. X     send translit/readme.doc from russian
  173. X  to OSCPOST@osc.edu or OSCPOST@OHSTPY.BITNET.  The file readme.doc will be
  174. Xforwarded to your mailbox.
  175. X
  176. XEnjoy,
  177. X
  178. XAuthor coordinates:
  179. XJan Labanowski
  180. XP.O. Box 21821
  181. XColumbus, OH 43221-0821, USA
  182. Xjkl@osc.edu, JKL@OHSTPY.BITNET
  183. X------------------------------
  184. END_OF_FILE
  185.   if test 2044 -ne `wc -c <'announcement'`; then
  186.     echo shar: \"'announcement'\" unpacked with wrong size!
  187.   fi
  188.   # end of 'announcement'
  189. fi
  190. if test -f 'gos-koi8.rus' -a "${1}" != "-c" ; then 
  191.   echo shar: Will not clobber existing file \"'gos-koi8.rus'\"
  192. else
  193.   echo shar: Extracting \"'gos-koi8.rus'\" \(5211 characters\)
  194.   sed "s/^X//" >'gos-koi8.rus' <<'END_OF_FILE'
  195. X# Jan Labanowski, jkl@osc.edu, Dec. 30, 1992
  196. X# File gos-koi8.rus
  197. X
  198. X# This is a transliteration data file for converting GOSTSCII 84
  199. X# (approx. ISO-8859-5?) to KOI8 used by RELCOM 
  200. X# KOI8 is meant to be GOST 19768-74
  201. X
  202. X# To be used with translit.c program by Jan Labanowski
  203. X
  204. X   1            file version number
  205. X
  206. X   "    "      # string delimiters
  207. X   [    ]     # list delimiters
  208. X   {    }      # regular expression delimiters
  209. X
  210. X
  211. X#starting sequence
  212. X""
  213. X
  214. X
  215. X#ending sequence
  216. X""
  217. X
  218. X   0     # number of input SHIFT sequences, only one set of input characters
  219. X
  220. X   0     # number of output SHIFT sequences, only one set of output characters
  221. X  
  222. X# conversion table
  223. X# inp_set_numb  inp_seq        out_set_numb  out_seq
  224. X      0          "\0xF0"           0         "\0xB3"
  225. X      0          "\0xF1"           0         "\0xA3"   #small yo
  226. X      0          "\0xB0"           0         "\0xE1"   #capital  A
  227. X      0          "\0xB1"           0         "\0xE2"   #capital  Be
  228. X      0          "\0xB2"           0         "\0xF7"   #capital  Ve
  229. X      0          "\0xB3"           0         "\0xE7"   #capital  Ghe
  230. X      0          "\0xB4"           0         "\0xE4"   #capital  De
  231. X      0          "\0xB5"           0         "\0xE5"   #capital  Ie
  232. X      0          "\0xB6"           0         "\0xF6"   #capital  Zhe
  233. X      0          "\0xB7"           0         "\0xFA"   #capital  Ze
  234. X      0          "\0xB8"           0         "\0xE9"   #capital  I
  235. X      0          "\0xB9"           0         "\0xEA"   #capital  short I
  236. X      0          "\0xBA"           0         "\0xEB"   #capital  Ka
  237. X      0          "\0xBB"           0         "\0xEC"   #capital  El
  238. X      0          "\0xBC"           0         "\0xED"   #capital  Em
  239. X      0          "\0xBD"           0         "\0xEE"   #capital  En
  240. X      0          "\0xBE"           0         "\0xEF"   #capital  O
  241. X      0          "\0xBF"           0         "\0xF0"   #capital  Pe
  242. X      0          "\0xC0"           0         "\0xF2"   #capital  Er
  243. X      0          "\0xC1"           0         "\0xF3"   #capital  Es
  244. X      0          "\0xC2"           0         "\0xF4"   #capital  Te
  245. X      0          "\0xC3"           0         "\0xF5"   #capital  U
  246. X      0          "\0xC4"           0         "\0xE6"   #capital  Ef
  247. X      0          "\0xC5"           0         "\0xE8"   #capital  Kha
  248. X      0          "\0xC6"           0         "\0xE3"   #capital  Tse
  249. X      0          "\0xC7"           0         "\0xFE"   #capital  Che
  250. X      0          "\0xC8"           0         "\0xFB"   #capital  Sha
  251. X      0          "\0xC9"           0         "\0xFD"   #capital  Shcha
  252. X      0          "\0xCA"           0         "\0xFF"   #capital hard sign (Ier)
  253. X      0          "\0xCB"           0         "\0xF9"   #capital  Y (Iery)
  254. X      0          "\0xCC"           0         "\0xF8"   #capit soft sign(Ierik)
  255. X      0          "\0xCD"           0         "\0xFC"   #capit reverse rounded E
  256. X      0          "\0xCE"           0         "\0xE0"   #capital  Yu
  257. X      0          "\0xCF"           0         "\0xF1"   #capital  Ya
  258. X      0          "\0xD0"           0         "\0xC1"   #small  a
  259. X      0          "\0xD1"           0         "\0xC2"   #small  be
  260. X      0          "\0xD2"           0         "\0xD7"   #small  ve
  261. X      0          "\0xD3"           0         "\0xC7"   #small  ghe
  262. X      0          "\0xD4"           0         "\0xC4"   #small  de
  263. X      0          "\0xD5"           0         "\0xC5"   #small  ie
  264. X      0          "\0xD6"           0         "\0xD6"   #small  zhe
  265. X      0          "\0xD7"           0         "\0xDA"   #small  z
  266. X      0          "\0xD8"           0         "\0xC9"   #small  i
  267. X      0          "\0xD9"           0         "\0xCA"   #small  short i
  268. X      0          "\0xDA"           0         "\0xCB"   #small  ka
  269. X      0          "\0xDB"           0         "\0xCC"   #small  el
  270. X      0          "\0xDC"           0         "\0xCD"   #small  em
  271. X      0          "\0xDD"           0         "\0xCE"   #small  en
  272. X      0          "\0xDE"           0         "\0xCF"   #small  o
  273. X      0          "\0xDF"           0         "\0xD0"   #small  pe
  274. X      0          "\0xE0"           0         "\0xD2"   #small  er
  275. X      0          "\0xE1"           0         "\0xD3"   #small  es
  276. X      0          "\0xE2"           0         "\0xD4"   #small  te
  277. X      0          "\0xE3"           0         "\0xD5"   #small  u
  278. X      0          "\0xE4"           0         "\0xC6"   #small  ef
  279. X      0          "\0xE5"           0         "\0xC8"   #small  kha
  280. X      0          "\0xE6"           0         "\0xC3"   #small  tse
  281. X      0          "\0xE7"           0         "\0xDE"   #small  che
  282. X      0          "\0xE8"           0         "\0xDB"   #small  sha
  283. X      0          "\0xE9"           0         "\0xDD"   #small  shcha
  284. X      0          "\0xEA"           0         "\0xDF"   #small hard sign (ier)
  285. X      0          "\0xEB"           0         "\0xD9"   #small  y (iery)
  286. X      0          "\0xEC"           0         "\0xD8"   #small soft sign (ierik)
  287. X      0          "\0xED"           0         "\0xDC"   #small  rev rounded e
  288. X      0          "\0xEE"           0         "\0xC0"   #small  yu
  289. X      0          "\0xEF"           0         "\0xD1"   #small  ya
  290. END_OF_FILE
  291.   if test 5211 -ne `wc -c <'gos-koi8.rus'`; then
  292.     echo shar: \"'gos-koi8.rus'\" unpacked with wrong size!
  293.   fi
  294.   # end of 'gos-koi8.rus'
  295. fi
  296. if test -f 'koi8-alt.rus' -a "${1}" != "-c" ; then 
  297.   echo shar: Will not clobber existing file \"'koi8-alt.rus'\"
  298. else
  299.   echo shar: Extracting \"'koi8-alt.rus'\" \(5096 characters\)
  300.   sed "s/^X//" >'koi8-alt.rus' <<'END_OF_FILE'
  301. X# Jan Labanowski, jkl@osc.edu, Dec. 30, 1992
  302. X# File koi8-alt.rus
  303. X
  304. X# This is a transliteration data file for converting from KOI8
  305. X# KOI8 is meant to be GOST 19768-74, to ALT (Bryabrins alternativnyj variant)
  306. X# To be used with translit.c program by Jan Labanowski
  307. X
  308. X   1            file version number
  309. X
  310. X   "    "      # string delimiters
  311. X   [    ]     # list delimiters
  312. X   {    }      # regular expression delimiters
  313. X
  314. X
  315. X#starting sequence
  316. X""
  317. X
  318. X
  319. X#ending sequence
  320. X""
  321. X
  322. X   0     # number of input SHIFT sequences, only one set of input characters
  323. X
  324. X   0     # number of output SHIFT sequences, only one set of output characters
  325. X  
  326. X# conversion table
  327. X# inp_set_numb  inp_seq        out_set_numb  out_seq
  328. X     0          "\0xB3"             0       "\0xf0"  # capital Yo
  329. X     0          "\0xA3"             0       "\0xf1"  # small yo
  330. X     0          "\0xE1"             0       "\0x80"  # capital A
  331. X     0          "\0xE2"             0       "\0x81"  # capital Be
  332. X     0          "\0xF7"             0       "\0x82"  # capital Ve
  333. X     0          "\0xE7"             0       "\0x83"  # capital Ghe
  334. X     0          "\0xE4"             0       "\0x84"  # capital De
  335. X     0          "\0xE5"             0       "\0x85"  # capital Ie
  336. X     0          "\0xF6"             0       "\0x86"  # capital Zhe
  337. X     0          "\0xFA"             0       "\0x87"  # capital Ze
  338. X     0          "\0xE9"             0       "\0x88"  # capital I
  339. X     0          "\0xEA"             0       "\0x89"  # capital short I
  340. X     0          "\0xEB"             0       "\0x8a"  # capital Ka
  341. X     0          "\0xEC"             0       "\0x8b"  # capital El
  342. X     0          "\0xED"             0       "\0x8c"  # capital Em
  343. X     0          "\0xEE"             0       "\0x8d"  # capital En
  344. X     0          "\0xEF"             0       "\0x8e"  # capital O
  345. X     0          "\0xF0"             0       "\0x8f"  # capital Pe
  346. X     0          "\0xF2"             0       "\0x90"  # capital Er
  347. X     0          "\0xF3"             0       "\0x91"  # capital Es
  348. X     0          "\0xF4"             0       "\0x92"  # capital Te
  349. X     0          "\0xF5"             0       "\0x93"  # capital U
  350. X     0          "\0xE6"             0       "\0x94"  # capital Ef
  351. X     0          "\0xE8"             0       "\0x95"  # capital Kha
  352. X     0          "\0xE3"             0       "\0x96"  # capital Tse
  353. X     0          "\0xFE"             0       "\0x97"  # capital Che
  354. X     0          "\0xFB"             0       "\0x98"  # capital Sha
  355. X     0          "\0xFD"             0       "\0x99"  # capital Shcha
  356. X     0          "\0xFF"             0       "\0x9a"  # capital hard sign (Ier)
  357. X     0          "\0xF9"             0       "\0x9b"  # capital Y (Iery)
  358. X     0          "\0xF8"             0       "\0x9c"  # capital soft sign Ierik
  359. X     0          "\0xFC"             0       "\0x9d"  # capital reverse round E
  360. X     0          "\0xE0"             0       "\0x9e"  # capital Yu
  361. X     0          "\0xF1"             0       "\0x9f"  # capital Ya
  362. X     0          "\0xC1"             0       "\0xa0"  # small a
  363. X     0          "\0xC2"             0       "\0xa1"  # small be
  364. X     0          "\0xD7"             0       "\0xa2"  # small ve
  365. X     0          "\0xC7"             0       "\0xa3"  # small ghe
  366. X     0          "\0xC4"             0       "\0xa4"  # small de
  367. X     0          "\0xC5"             0       "\0xa5"  # small ie
  368. X     0          "\0xD6"             0       "\0xa6"  # small zhe
  369. X     0          "\0xDA"             0       "\0xa7"  # small z
  370. X     0          "\0xC9"             0       "\0xa8"  # small i
  371. X     0          "\0xCA"             0       "\0xa9"  # small short i
  372. X     0          "\0xCB"             0       "\0xaa"  # small ka
  373. X     0          "\0xCC"             0       "\0xab"  # small el
  374. X     0          "\0xCD"             0       "\0xac"  # small em
  375. X     0          "\0xCE"             0       "\0xad"  # small en
  376. X     0          "\0xCF"             0       "\0xae"  # small o
  377. X     0          "\0xD0"             0       "\0xaf"  # small pe
  378. X     0          "\0xD2"             0       "\0xe0"  # small er
  379. X     0          "\0xD3"             0       "\0xe1"  # small es
  380. X     0          "\0xD4"             0       "\0xe2"  # small te
  381. X     0          "\0xD5"             0       "\0xe3"  # small u
  382. X     0          "\0xC6"             0       "\0xe4"  # small ef
  383. X     0          "\0xC8"             0       "\0xe5"  # small kha
  384. X     0          "\0xC3"             0       "\0xe6"  # small tse
  385. X     0          "\0xDE"             0       "\0xe7"  # small che
  386. X     0          "\0xDB"             0       "\0xe8"  # small sha
  387. X     0          "\0xDD"             0       "\0xe9"  # small shcha
  388. X     0          "\0xDF"             0       "\0xea"  # small hard sign (ier)
  389. X     0          "\0xD9"             0       "\0xeb"  # small y (iery)
  390. X     0          "\0xD8"             0       "\0xec"  # small soft sign (ierik)
  391. X     0          "\0xDC"             0       "\0xed"  # small reverse rounded e
  392. X     0          "\0xC0"             0       "\0xee"  # small yu
  393. X     0          "\0xD1"             0       "\0xef"  # small ya
  394. END_OF_FILE
  395.   if test 5096 -ne `wc -c <'koi8-alt.rus'`; then
  396.     echo shar: \"'koi8-alt.rus'\" unpacked with wrong size!
  397.   fi
  398.   # end of 'koi8-alt.rus'
  399. fi
  400. if test -f 'koi8-gos.rus' -a "${1}" != "-c" ; then 
  401.   echo shar: Will not clobber existing file \"'koi8-gos.rus'\"
  402. else
  403.   echo shar: Extracting \"'koi8-gos.rus'\" \(5220 characters\)
  404.   sed "s/^X//" >'koi8-gos.rus' <<'END_OF_FILE'
  405. X# Jan Labanowski, jkl@osc.edu, Dec. 30, 1992
  406. X# File koi8-gos.rus
  407. X
  408. X# This is a transliteration data file for converting from KOI8 (Relcom)
  409. X# KOI8 is meant to be GOST 19768-74, to GOSTSCII 84 (approx. ISO-8859-5)
  410. X# To be used with translit.c program by Jan Labanowski
  411. X
  412. X   1            file version number
  413. X
  414. X   "    "      # string delimiters
  415. X   [    ]     # list delimiters
  416. X   {    }      # regular expression delimiters
  417. X
  418. X
  419. X#starting sequence
  420. X""
  421. X
  422. X
  423. X#ending sequence
  424. X""
  425. X
  426. X   0     # number of input SHIFT sequences, only one set of input characters
  427. X
  428. X   0     # number of output SHIFT sequences, only one set of output characters
  429. X  
  430. X# conversion table
  431. X# inp_set_numb  inp_seq        out_set_numb  out_seq
  432. X      0          "\0xB3"           0          "\0xF0"  #capital Yo
  433. X      0          "\0xA3"           0          "\0xF1"  #small yo
  434. X      0          "\0xE1"           0          "\0xB0"  #capital  A
  435. X      0          "\0xE2"           0          "\0xB1"  #capital  Be
  436. X      0          "\0xF7"           0          "\0xB2"  #capital  Ve
  437. X      0          "\0xE7"           0          "\0xB3"  #capital  Ghe
  438. X      0          "\0xE4"           0          "\0xB4"  #capital  De
  439. X      0          "\0xE5"           0          "\0xB5"  #capital  Ie
  440. X      0          "\0xF6"           0          "\0xB6"  #capital  Zhe
  441. X      0          "\0xFA"           0          "\0xB7"  #capital  Ze
  442. X      0          "\0xE9"           0          "\0xB8"  #capital  I
  443. X      0          "\0xEA"           0          "\0xB9"  #capital  short I
  444. X      0          "\0xEB"           0          "\0xBA"  #capital  Ka
  445. X      0          "\0xEC"           0          "\0xBB"  #capital  El
  446. X      0          "\0xED"           0          "\0xBC"  #capital  Em
  447. X      0          "\0xEE"           0          "\0xBD"  #capital  En
  448. X      0          "\0xEF"           0          "\0xBE"  #capital  O
  449. X      0          "\0xF0"           0          "\0xBF"  #capital  Pe
  450. X      0          "\0xF2"           0          "\0xC0"  #capital  Er
  451. X      0          "\0xF3"           0          "\0xC1"  #capital  Es
  452. X      0          "\0xF4"           0          "\0xC2"  #capital  Te
  453. X      0          "\0xF5"           0          "\0xC3"  #capital  U
  454. X      0          "\0xE6"           0          "\0xC4"  #capital  Ef
  455. X      0          "\0xE8"           0          "\0xC5"  #capital  Kha
  456. X      0          "\0xE3"           0          "\0xC6"  #capital  Tse
  457. X      0          "\0xFE"           0          "\0xC7"  #capital  Che
  458. X      0          "\0xFB"           0          "\0xC8"  #capital  Sha
  459. X      0          "\0xFD"           0          "\0xC9"  #capital  Shcha
  460. X      0          "\0xFF"           0          "\0xCA"  #capital hard sign (Ier)
  461. X      0          "\0xF9"           0          "\0xCB"  #capital  Y (Iery)
  462. X      0          "\0xF8"           0          "\0xCC"  #capit soft sign(Ierik)
  463. X      0          "\0xFC"           0          "\0xCD"  #capit reverse rounded E
  464. X      0          "\0xE0"           0          "\0xCE"  #capital  Yu
  465. X      0          "\0xF1"           0          "\0xCF"  #capital  Ya
  466. X      0          "\0xC1"           0          "\0xD0"  #small  a
  467. X      0          "\0xC2"           0          "\0xD1"  #small  be
  468. X      0          "\0xD7"           0          "\0xD2"  #small  ve
  469. X      0          "\0xC7"           0          "\0xD3"  #small  ghe
  470. X      0          "\0xC4"           0          "\0xD4"  #small  de
  471. X      0          "\0xC5"           0          "\0xD5"  #small  ie
  472. X      0          "\0xD6"           0          "\0xD6"  #small  zhe
  473. X      0          "\0xDA"           0          "\0xD7"  #small  z
  474. X      0          "\0xC9"           0          "\0xD8"  #small  i
  475. X      0          "\0xCA"           0          "\0xD9"  #small  short i
  476. X      0          "\0xCB"           0          "\0xDA"  #small  ka
  477. X      0          "\0xCC"           0          "\0xDB"  #small  el
  478. X      0          "\0xCD"           0          "\0xDC"  #small  em
  479. X      0          "\0xCE"           0          "\0xDD"  #small  en
  480. X      0          "\0xCF"           0          "\0xDE"  #small  o
  481. X      0          "\0xD0"           0          "\0xDF"  #small  pe
  482. X      0          "\0xD2"           0          "\0xE0"  #small  er
  483. X      0          "\0xD3"           0          "\0xE1"  #small  es
  484. X      0          "\0xD4"           0          "\0xE2"  #small  te
  485. X      0          "\0xD5"           0          "\0xE3"  #small  u
  486. X      0          "\0xC6"           0          "\0xE4"  #small  ef
  487. X      0          "\0xC8"           0          "\0xE5"  #small  kha
  488. X      0          "\0xC3"           0          "\0xE6"  #small  tse
  489. X      0          "\0xDE"           0          "\0xE7"  #small  che
  490. X      0          "\0xDB"           0          "\0xE8"  #small  sha
  491. X      0          "\0xDD"           0          "\0xE9"  #small  shcha
  492. X      0          "\0xDF"           0          "\0xEA"  #small hard sign (ier)
  493. X      0          "\0xD9"           0          "\0xEB"  #small  y (iery)
  494. X      0          "\0xD8"           0          "\0xEC"  #small soft sign (ierik)
  495. X      0          "\0xDC"           0          "\0xED"  #small  rev rounded e
  496. X      0          "\0xC0"           0          "\0xEE"  #small  yu
  497. X      0          "\0xD1"           0          "\0xEF"  #small  ya
  498. END_OF_FILE
  499.   if test 5220 -ne `wc -c <'koi8-gos.rus'`; then
  500.     echo shar: \"'koi8-gos.rus'\" unpacked with wrong size!
  501.   fi
  502.   # end of 'koi8-gos.rus'
  503. fi
  504. if test -f 'paths.h' -a "${1}" != "-c" ; then 
  505.   echo shar: Will not clobber existing file \"'paths.h'\"
  506. else
  507.   echo shar: Extracting \"'paths.h'\" \(2971 characters\)
  508.   sed "s/^X//" >'paths.h' <<'END_OF_FILE'
  509. X/* Include file for translit.c program
  510. X * Copyright (c) 1993 Jan Labanowski and JKL Enterprises, Inc.
  511. X *   Jan Labanowski, jkl@osc.edu, JKL@OHSTPY.BITNET Jan. 5, 1993
  512. X * You must modify this file before you try to compile the program
  513. X */
  514. X
  515. X
  516. X/* these are "standard" include files. Some may have different names on
  517. X   your system. If program complains here, you need to check it */
  518. X
  519. X#include <stdio.h>
  520. X#include <string.h>     /* some older machines have <strings.h> !!! */
  521. X#include <stdlib.h>     /* some machines use <unix.h> here or some/no-thing */
  522. X#include <ctype.h>
  523. X
  524. X
  525. X/* These are some defines which relate to the system and compiler
  526. X * you are running:
  527. X *     1 (one) means YES, TRUE,
  528. X *     0 (zero) means NO, FALSE
  529. X */
  530. X#define GETOPT  1   /* does your C compiler have getopt routine? Most compilers
  531. X                       do, but for example VAX C does not. Some PCs do not,
  532. X                       UN*X usually has.  Enter 1 if you have
  533. X                       getopt and 0 if you do not. */
  534. X
  535. X#define GETENV  1   /* does your C compiler and system have getenv routine?
  536. X                       To my knowledge all UN*X, VAX-VMS and MS-DOS have.
  537. X                       Enter 1 if you have it, and 0 if you do not. If you do
  538. X                       not have GETENV, you do not have environment. */
  539. X
  540. X#define STRCHR  1   /* the routine finding a position of a character in 
  541. X                       a string is called strchr. If you do not have this
  542. X                       routine, say 0, if you have it, say 1 */
  543. X
  544. X#define STRCSPN 1   /* some compiler libraries do not have a strcspn routine.
  545. X                       If you have it, enter 1, if you do not, enter 0 */
  546. X
  547. X#define STATICFUN   1   /* if your compiler supports declarations of 
  548. X                           static functions:
  549. X                                static int boo(foo)
  550. X                           enter 1. If it chokes on it, change to 0.  */
  551. X
  552. X
  553. X/* if transliteration table file is not found in the current directory
  554. X * program looks for this file in directory pointed by TPATH. For UNIX
  555. X * it may be something like "/usr/local/lib/", and for MS-DOS it may be
  556. X * something like: "C:\\INCLUDE\\". Remember to put a slash(backslash)
  557. X * after last subdirectory name. For DOS remember that backslashes have
  558. X * to be quoted, i.e., you enter the backslash twice. I did not check it
  559. X * for the VAX.
  560. X */
  561. X                 /* search path for transliteration rules files */
  562. X#define TPATH    "/usr/local/lib/translit/"
  563. X
  564. X/* DEFCONVNAME - default file name for conversion table (no path, just
  565. X * file name).
  566. X */
  567. X#define DEFCONVNAME "koi8-tex.rus"
  568. X
  569. X
  570. X/* if environment variables TRANSP and TRANSF are defined, the
  571. X   TPATH and DEFCONVNAME are taken from them, not from the above defs.
  572. X   If these environment variables are taken, you need to put here
  573. X   something else. */
  574. X
  575. X/* name of environment variable with TPATH */
  576. X#define TRANSPATH "TRANSP"
  577. X
  578. X/* name of environment variable with DEFCONVNAME */
  579. X#define DEFNAME   "TRANSF"
  580. X
  581. END_OF_FILE
  582.   if test 2971 -ne `wc -c <'paths.h'`; then
  583.     echo shar: \"'paths.h'\" unpacked with wrong size!
  584.   fi
  585.   # end of 'paths.h'
  586. fi
  587. echo shar: End of archive 10 \(of 10\).
  588. cp /dev/null ark10isdone
  589. MISSING=""
  590. for I in 1 2 3 4 5 6 7 8 9 10 ; do
  591.     if test ! -f ark${I}isdone ; then
  592.     MISSING="${MISSING} ${I}"
  593.     fi
  594. done
  595. if test "${MISSING}" = "" ; then
  596.     echo You have unpacked all 10 archives.
  597.     rm -f ark[1-9]isdone ark[1-9][0-9]isdone
  598. else
  599.     echo You still must unpack the following archives:
  600.     echo "        " ${MISSING}
  601. fi
  602. exit 0
  603. exit 0 # Just in case...
  604.