# 1 "Camomile/internal/charmap.ml"
(** Character mapping table *)

(* Copyright (C) 2002, 2011 Yamagata Yoriyuki *)

(* This library is free software; you can redistribute it and/or *)
(* modify it under the terms of the GNU Lesser General Public License *)
(* as published by the Free Software Foundation; either version 2 of *)
(* the License, or (at your option) any later version. *)

(* As a special exception to the GNU Library General Public License, you *)
(* may link, statically or dynamically, a "work that uses this library" *)
(* with a publicly distributed version of this library to produce an *)
(* executable file containing portions of this library, and distribute *)
(* that executable file under terms of your choice, without any of the *)
(* additional requirements listed in clause 6 of the GNU Library General *)
(* Public License. By "a publicly distributed version of this library", *)
(* we mean either the unmodified Library as distributed by the authors, *)
(* or a modified version of this library that is distributed under the *)
(* conditions defined in clause 3 of the GNU Library General Public *)
(* License. This exception does not however invalidate any other reasons *)
(* why the executable file might be covered by the GNU Library General *)
(* Public License . *)

(* This library is distributed in the hope that it will be useful, *)
(* but WITHOUT ANY WARRANTY; without even the implied warranty of *)
(* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU *)
(* Lesser General Public License for more details.
*)

(* You should have received a copy of the GNU Lesser General Public *)
(* License along with this library; if not, write to the Free Software *)
(* Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 *)
(* USA *)

(* You can contact the author by sending email to *)
(* yoriyuki.y@gmail.com *)

(** Signature of the character-map module produced by {!Configure}. *)
module type Interface = sig
  (** Abstract table used to go from an encoding to UCS code points. *)
  type enc_to_ucs

  (** [make_enc_to_ucs no_char vs] builds a table from the association
      list [vs]; [no_char] is the integer recorded as the table's
      no-character value. *)
  val make_enc_to_ucs : int -> (string * int) list -> enc_to_ucs

  (** [no_char_of tbl] is the [no_char] value [tbl] was built with. *)
  val no_char_of : enc_to_ucs -> int

  (** Cursor used to walk an {!enc_to_ucs} table one step at a time. *)
  type probe_state

  (** [start_probe tbl] is the initial cursor for [tbl]. *)
  val start_probe : enc_to_ucs -> probe_state

  (** [look_probe state i] looks up the leaf reached from [state] with [i]. *)
  val look_probe : probe_state -> int -> int

  (** [next_probe state i] is the cursor reached from [state] with [i],
      if there is one. *)
  val next_probe : probe_state -> int -> probe_state option

  (** A loaded character map. *)
  type t = {
    name : string;
    ucs_to_enc : string Tbl31.t;
    enc_to_ucs : enc_to_ucs;
  }

  (** What a stored entry holds: another entry's name, or a full map. *)
  type data =
    | Alias of string
    | CMap of t

  (** [of_name name] is the character map stored under [name].
      Raises [Not_found] when an alias leads to another alias. *)
  val of_name : string -> t
end

(* Implementation of [Interface]; [Config.charmapdir] tells [of_name]
   where to read stored maps from. *)
module Configure (Config : ConfigInt.Type) = struct

  (* The byte-labeled DAG plus the no-character value it was built with. *)
  type enc_to_ucs = {
    enc_to_ucs_no_char : int;
    enc_to_ucs_tbl : Byte_labeled_dag.bytes;
  }

  (* Build the DAG from [vs] and remember [no_char] next to it. *)
  let make_enc_to_ucs no_char vs =
    let tbl = Byte_labeled_dag.make_bytes no_char vs in
    { enc_to_ucs_no_char = no_char; enc_to_ucs_tbl = tbl }

  let no_char_of enc_to_ucs = enc_to_ucs.enc_to_ucs_no_char

  (* A probe is simply a (sub-)DAG. *)
  type probe_state = Byte_labeled_dag.bytes

  let start_probe enc_to_ucs = enc_to_ucs.enc_to_ucs_tbl

  (* Thin wrappers over the DAG's leaf and branch lookups. *)
  let look_probe state i =
    Byte_labeled_dag.look_leaf_bytes state i

  let next_probe state i =
    Byte_labeled_dag.look_branch_bytes state i

  type t = {
    name : string;
    ucs_to_enc : string Tbl31.t;
    enc_to_ucs : enc_to_ucs;
  }

  type data =
    | Alias of string
    | CMap of t

  (* Cache of already-loaded maps, keyed by the requested name.  Each
     value is a one-slot weak array, so the cache itself does not keep a
     map alive. *)
  let loaded = Hashtbl.create 0

  (* Return the map stored under [name], reading it through
     [Database.read] on a cache miss.  An alias is followed once; an
     alias that resolves to another alias raises [Not_found]. *)
  let of_name name =
    (* Cache probe.  A slot whose weak pointer has been cleared is
       dropped from the table and reported as a miss via [Not_found]. *)
    let from_cache () =
      let cell = Hashtbl.find loaded name in
      match Weak.get cell 0 with
      | Some cmap -> cmap
      | None ->
        Hashtbl.remove loaded name;
        raise Not_found
    in
    try from_cache ()
    with Not_found ->
      (* [hops] is 0 for the requested name and 1 after one alias hop. *)
      let rec resolve hops key =
        let entry : data =
          Database.read Config.charmapdir "mar" input_value key
        in
        match entry with
        | CMap cmap -> cmap
        | Alias target ->
          if hops = 1 then raise Not_found
          else resolve 1 target
      in
      let cmap = resolve 0 name in
      (* Register under the requested name (not the alias target). *)
      let cell = Weak.create 1 in
      Weak.set cell 0 (Some cmap);
      Hashtbl.add loaded name cell;
      cmap
end