00001 /* -*- c-basic-offset: 4; indent-tabs-mode: nil -*- */ 00002 /* ==================================================================== 00003 * Copyright (c) 1999-2004 Carnegie Mellon University. All rights 00004 * reserved. 00005 * 00006 * Redistribution and use in source and binary forms, with or without 00007 * modification, are permitted provided that the following conditions 00008 * are met: 00009 * 00010 * 1. Redistributions of source code must retain the above copyright 00011 * notice, this list of conditions and the following disclaimer. 00012 * 00013 * 2. Redistributions in binary form must reproduce the above copyright 00014 * notice, this list of conditions and the following disclaimer in 00015 * the documentation and/or other materials provided with the 00016 * distribution. 00017 * 00018 * This work was supported in part by funding from the Defense Advanced 00019 * Research Projects Agency and the National Science Foundation of the 00020 * United States of America, and the CMU Sphinx Speech Consortium. 00021 * 00022 * THIS SOFTWARE IS PROVIDED BY CARNEGIE MELLON UNIVERSITY ``AS IS'' AND 00023 * ANY EXPRESSED OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, 00024 * THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 00025 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL CARNEGIE MELLON UNIVERSITY 00026 * NOR ITS EMPLOYEES BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 00027 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 00028 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 00029 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 00030 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 00031 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 00032 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 00033 * 00034 * ==================================================================== 00035 * 00036 */ 00037 /* 00038 * encoding.h -- Take care of text encoding issue 00039 * 00040 * ********************************************** 00041 * CMU ARPA Speech Project 00042 * 00043 * Copyright (c) 2005 Carnegie Mellon University. 00044 * ALL RIGHTS RESERVED. 00045 * ********************************************** 00046 * 00047 * HISTORY 00048 * $Log$ 00049 * Revision 1.1 2006/04/05 20:27:30 dhdfu 00050 * A Great Reorganzation of header files and executables 00051 * 00052 * Revision 1.2 2006/02/22 18:45:02 arthchan2003 00053 * Merged from SPHINX3_5_2_RCI_IRII_BRANCH: Added encoding.[ch]. This is 00054 * a simple interface to convert text from one format to another. 00055 * Currently, it only support iso8859-1, gb2312 and gb2312-hex. 00056 * 00057 * Revision 1.1.2.1 2005/11/17 06:08:39 arthchan2003 00058 * Added a simple interface for text encoding conversion. 00059 * 00060 */ 00061 00062 #ifndef ENCODING 00063 #define ENCODING 00064 00065 #include <stdlib.h> 00066 #include <s3types.h> 00067 00068 00069 #ifdef __cplusplus 00070 extern "C" { 00071 #endif 00072 #if 0 00073 /* Fool Emacs. */ 00074 } 00075 #endif 00076 00077 #define IND_ISO88591 0 00078 #define ISO88591 "iso8859-1" 00079 #define IND_GB2312HEX 1 00080 #define GB2312HEX "gb2312-hex" 00081 #define IND_GB2312 2 00082 #define GB2312 "gb2312" 00083 00084 #define IND_BADENCODING -1 00085 #define BADENCODING "BAD_ENCODING" 00086 00092 int encoding_str2ind(const char *enc 00093 ); 00094 00099 S3DECODER_EXPORT 00100 int encoding_resolve(const char* inputenc, 00101 const char *outputenc 00102 ); 00103 00107 void hextocode(char* src 00109 ); 00110 00111 int ishex(const char* str); 00112 00113 #ifdef __cplusplus 00114 } 00115 #endif 00116 00117 00118 #endif