ICU-266 c++-ify UConverter (UConverterImpl resembles a vtable)

X-SVN-Rev: 723
2000-02-07 17:35:21 +00:00 · 2000-02-07 17:35:21 +00:00 · 20baeae401
commit 20baeae401
parent 7b6b7df37a
7 changed files with 176 additions and 152 deletions
--- a/icu4c/source/common/Makefile.in
+++ b/icu4c/source/common/Makefile.in
@ -75,7 +75,7 @@ uchar.o uchriter.o ucmp8.o ucmp16.o ucmp32.o ucnv.o ucnv_bld.o		\
 ucnv_cnv.o ucnv_err.o ucnv_io.o uhash.o uloc.o unicode.o unistr.o	\
 ures.o ustring.o rbread.o rbdata.o ubidi.o ubidiln.o \
 bidi.o uvector.o udata.o unames.o utf_impl.o \
-ucnv_2022.o ucnv_utf.o ucnv_sbcs.o ucnv_mbcs.o
+ucnv2022.o ucnvlat1.o ucnv_utf.o ucnvsbcs.o ucnvmbcs.o

 DEPS = $(OBJECTS:.o=.d)

--- a/icu4c/source/common/common.dsp
+++ b/icu4c/source/common/common.dsp
@ -211,7 +211,7 @@ SOURCE=.\ucnv.c
 # End Source File
 # Begin Source File

-SOURCE=.\ucnv_2022.c
+SOURCE=.\ucnv2022.c
 # End Source File
 # Begin Source File

@ -231,18 +231,22 @@ SOURCE=.\ucnv_io.c
 # End Source File
 # Begin Source File

-SOURCE=.\ucnv_mbcs.c
-# End Source File
-# Begin Source File
-
-SOURCE=.\ucnv_sbcs.c
-# End Source File
-# Begin Source File
-
 SOURCE=.\ucnv_utf.c
 # End Source File
 # Begin Source File

+SOURCE=.\ucnvlat1.c
+# End Source File
+# Begin Source File
+
+SOURCE=.\ucnvmbcs.c
+# End Source File
+# Begin Source File
+
+SOURCE=.\ucnvsbcs.c
+# End Source File
+# Begin Source File
+
 SOURCE=.\udata.c
 # ADD CPP /Ze
 # End Source File
--- a/icu4c/source/common/ucnv_2022.c
+++ b/icu4c/source/common/ucnv_2022.c
@ -3,7 +3,7 @@
 *   Copyright (C) 2000, International Business Machines
 *   Corporation and others.  All Rights Reserved.
 **********************************************************************
-*   file name:  ucnv_2022.cpp
+*   file name:  ucnv2022.cpp
 *   encoding:   US-ASCII
 *   tab size:   8 (not used)
 *   indentation:4
--- a/icu4c/source/common/ucnv_utf.c
+++ b/icu4c/source/common/ucnv_utf.c
@ -19,145 +19,6 @@
 #include "unicode/ucnv.h"
 #include "ucnv_cnv.h"

-/* ISO 8859-1 --------------------------------------------------------------- */
-
-void  T_UConverter_toUnicode_LATIN_1 (UConverter * _this,
-                                      UChar ** target,
-                                      const UChar * targetLimit,
-                                      const char **source,
-                                      const char *sourceLimit,
-                                      int32_t *offsets,
-                                      bool_t flush,
-                                      UErrorCode * err)
-{
-  unsigned char *mySource = (unsigned char *) *source;
-  UChar *myTarget = *target;
-  int32_t sourceLength = sourceLimit - (char *) mySource;
-  int32_t readLen = 0;
-  int32_t i = 0;
-
-  /*Since there is no risk of encountering illegal Chars
-   *we need to pad our latin1 chars to create Unicode codepoints
-   *we need to go as far a min(targetLen, sourceLen)
-   *in case we don't have enough buffer space
-   *we set the error flag accordingly
-   */
-  if ((targetLimit - *target) < sourceLength)
-    {
-      readLen = targetLimit - *target;
-      *err = U_INDEX_OUTOFBOUNDS_ERROR;
-    }
-  else
-    {
-      readLen = sourceLimit - (char *) mySource;
-    }
-
-  for (i = 0; i < readLen; i++) myTarget[i] = (UChar) mySource[i];
-
-  *target += i;
-  *source += i;
-  return;
-}
-
-void   T_UConverter_fromUnicode_LATIN_1 (UConverter * _this,
-                                         char **target,
-                                         const char *targetLimit,
-                                         const UChar ** source,
-                                         const UChar * sourceLimit,
-                                         int32_t *offsets,
-                                         bool_t flush,
-                                         UErrorCode * err)
-{
-  const UChar *mySource = *source;
-  unsigned char *myTarget = (unsigned char *) *target;
-  int32_t mySourceIndex = 0;
-  int32_t myTargetIndex = 0;
-  int32_t targetLength = targetLimit - (char *) myTarget;
-  int32_t sourceLength = sourceLimit - mySource;
-
-  /*writing the char to the output stream */
-  while (mySourceIndex < sourceLength)
-    {
-
-      if (myTargetIndex < targetLength)
-        {
-          if (mySource[mySourceIndex] < 0x0100)
-            {
-              /*writes the char to the output stream */
-              myTarget[myTargetIndex++] = (char) mySource[mySourceIndex++];
-            }
-          else
-            {
-              *err = U_INVALID_CHAR_FOUND;
-              _this->invalidUCharBuffer[0] = (UChar) mySource[mySourceIndex++];
-              _this->invalidUCharLength = 1;
-
-/* Needed explicit cast for myTarget on MVS to make compiler happy - JJD */
-              FromU_CALLBACK_MACRO(_this,
-                                   (char *)myTarget, 
-                                   myTargetIndex,
-                                   targetLimit, 
-                                   mySource,
-                                   mySourceIndex, 
-                                   sourceLimit,
-                                   offsets, 
-                                   flush, 
-                                   err);
-
-              if (U_FAILURE (*err)) break;
-              _this->invalidUCharLength = 0;
-            }
-        }
-      else
-        {
-          *err = U_INDEX_OUTOFBOUNDS_ERROR;
-          break;
-        }
-    }
-
-  *target += myTargetIndex;
-  *source += mySourceIndex;;
-
-  return;
-}
-
-UChar T_UConverter_getNextUChar_LATIN_1(UConverter* converter,
-                                                  const char** source,
-                                                  const char* sourceLimit,
-                                                  UErrorCode* err)
-{
-  
-  /* Empties the internal buffers if need be
-   * In this case since ErrorFunctors are never called 
-   * (LATIN_1 is a subset of Unicode)
-   */
-  
-  if ((*source)+1 > sourceLimit) 
-    {
-      *err = U_INDEX_OUTOFBOUNDS_ERROR;
-      return 0xFFFD;
-    }
-  
-  return  (UChar)*((*source)++);
-}
-
-static UConverterImpl _Latin1Impl={
-    UCNV_LATIN_1,
-
-    T_UConverter_toUnicode_LATIN_1,
-    NULL,
-    T_UConverter_fromUnicode_LATIN_1,
-    NULL,
-    T_UConverter_getNextUChar_LATIN_1
-};
-
-extern UConverterSharedData _Latin1Data={
-    sizeof(UConverterSharedData), ~0,
-    NULL, NULL, &_Latin1Impl, "LATIN_1",
-    819, UCNV_IBM, UCNV_LATIN_1, 1, 1,
-    { 0, 1, 0x1a, 0, 0, 0 }
-};
-
 /* UTF-8 -------------------------------------------------------------------- */

 /* UTF-8 Conversion DATA
--- a/icu4c/source/common/ucnvlat1.c
+++ b/icu4c/source/common/ucnvlat1.c
@ -0,0 +1,159 @@
+/*  
+**********************************************************************
+*   Copyright (C) 2000, International Business Machines
+*   Corporation and others.  All Rights Reserved.
+**********************************************************************
+*   file name:  ucnvlat1.cpp
+*   encoding:   US-ASCII
+*   tab size:   8 (not used)
+*   indentation:4
+*
+*   created on: 2000feb07
+*   created by: Markus W. Scherer
+*/
+
+#include "unicode/utypes.h"
+#include "ucmp16.h"
+#include "ucmp8.h"
+#include "unicode/ucnv_bld.h"
+#include "unicode/ucnv.h"
+#include "ucnv_cnv.h"
+
+/* ISO 8859-1 --------------------------------------------------------------- */
+
+/* Converts LATIN_1 bytes to UChars by widening each byte to one UChar.
+ * Copies min(bytes in source, free UChars in target) units and advances
+ * *source and *target past them. If the target has less room than the
+ * source has bytes, *err is set to U_INDEX_OUTOFBOUNDS_ERROR.
+ * _this, offsets and flush are not used. */
+void  T_UConverter_toUnicode_LATIN_1 (UConverter * _this,
+                                      UChar ** target,
+                                      const UChar * targetLimit,
+                                      const char **source,
+                                      const char *sourceLimit,
+                                      int32_t *offsets,
+                                      bool_t flush,
+                                      UErrorCode * err)
+{
+  const unsigned char *bytes = (const unsigned char *) *source;
+  UChar *out = *target;
+  int32_t bytesLeft = sourceLimit - (const char *) bytes;
+  int32_t count = bytesLeft;
+  int32_t done = 0;
+
+  /* Every byte is copied to exactly one UChar, so only the target
+   * capacity can cut the conversion short. */
+  if ((targetLimit - out) < bytesLeft)
+    {
+      count = targetLimit - out;
+      *err = U_INDEX_OUTOFBOUNDS_ERROR;
+    }
+
+  while (done < count)
+    {
+      out[done] = (UChar) bytes[done];
+      done++;
+    }
+
+  *target += done;
+  *source += done;
+}
+
+void   T_UConverter_fromUnicode_LATIN_1 (UConverter * _this,
+                                         char **target,             /* in/out: advanced by myTargetIndex on exit */
+                                         const char *targetLimit,   /* end of the target buffer */
+                                         const UChar ** source,     /* in/out: advanced by mySourceIndex on exit */
+                                         const UChar * sourceLimit, /* end of the source buffer */
+                                         int32_t *offsets,          /* only forwarded to FromU_CALLBACK_MACRO */
+                                         bool_t flush,              /* only forwarded to FromU_CALLBACK_MACRO */
+                                         UErrorCode * err)          /* set here to U_INVALID_CHAR_FOUND or U_INDEX_OUTOFBOUNDS_ERROR */
+{
+  const UChar *mySource = *source;
+  unsigned char *myTarget = (unsigned char *) *target;
+  int32_t mySourceIndex = 0;
+  int32_t myTargetIndex = 0;
+  int32_t targetLength = targetLimit - (char *) myTarget;
+  int32_t sourceLength = sourceLimit - mySource;
+  /* Converts UChars below 0x0100 to single bytes; any other UChar is flagged
+   * as U_INVALID_CHAR_FOUND and handed to FromU_CALLBACK_MACRO. */
+  while (mySourceIndex < sourceLength)
+    {
+      /* room left in the target? otherwise the else branch reports the overflow */
+      if (myTargetIndex < targetLength)
+        {
+          if (mySource[mySourceIndex] < 0x0100)
+            {
+              /* values below 0x0100 are stored as one byte with the same value */
+              myTarget[myTargetIndex++] = (char) mySource[mySourceIndex++];
+            }
+          else
+            {
+              *err = U_INVALID_CHAR_FOUND;
+              _this->invalidUCharBuffer[0] = (UChar) mySource[mySourceIndex++];
+              _this->invalidUCharLength = 1;
+              /* NOTE(review): FromU_CALLBACK_MACRO is defined outside this file; presumably it runs the from-Unicode error callback and may update the indices and *err - confirm */
+/* Needed explicit cast for myTarget on MVS to make compiler happy - JJD */
+              FromU_CALLBACK_MACRO(_this,
+                                   (char *)myTarget, 
+                                   myTargetIndex,
+                                   targetLimit, 
+                                   mySource,
+                                   mySourceIndex, 
+                                   sourceLimit,
+                                   offsets, 
+                                   flush, 
+                                   err);
+              /* stop if *err still signals failure after the macro; otherwise clear the invalid-char state */
+              if (U_FAILURE (*err)) break;
+              _this->invalidUCharLength = 0;
+            }
+        }
+      else
+        {
+          *err = U_INDEX_OUTOFBOUNDS_ERROR;
+          break;
+        }
+    }
+  /* publish the progress made to the caller's pointers */
+  *target += myTargetIndex;
+  *source += mySourceIndex;;
+
+  return;
+}
+
+/* Returns the next LATIN_1 byte from *source as a UChar and advances *source
+ * by one byte. When no byte is left before sourceLimit, *err is set to
+ * U_INDEX_OUTOFBOUNDS_ERROR, 0xFFFD is returned and *source is not moved.
+ * The converter argument is not used. */
+UChar T_UConverter_getNextUChar_LATIN_1(UConverter* converter,
+                                                  const char** source,
+                                                  const char* sourceLimit,
+                                                  UErrorCode* err)
+{
+  if (*source >= sourceLimit)
+    {
+      *err = U_INDEX_OUTOFBOUNDS_ERROR;
+      return 0xFFFD;
+    }
+
+  /* Read the byte as unsigned: where plain char is signed, 0x80..0xFF would
+   * otherwise be converted from a negative value instead of 0x80..0xFF. */
+  return (UChar) (unsigned char) *((*source)++);
+}
+
+static UConverterImpl _Latin1Impl={   /* function table for the LATIN_1 converter; referenced by _Latin1Data */
+    UCNV_LATIN_1,                      /* NOTE(review): presumably the converter type field - confirm against UConverterImpl */
+
+    T_UConverter_toUnicode_LATIN_1,    /* bytes -> UChars */
+    NULL,                              /* NOTE(review): presumably the offsets-aware toUnicode slot, left unset - confirm */
+    T_UConverter_fromUnicode_LATIN_1,  /* UChars -> bytes */
+    NULL,                              /* NOTE(review): presumably the offsets-aware fromUnicode slot, left unset - confirm */
+    T_UConverter_getNextUChar_LATIN_1  /* reads one character from a byte source */
+};
+
+extern UConverterSharedData _Latin1Data={   /* shared data record for LATIN_1; NOTE(review): 'extern' on an initialized definition makes some compilers warn */
+    sizeof(UConverterSharedData), ~0,         /* the struct's own size, then all bits set; NOTE(review): purpose of the ~0 field is not visible here */
+    NULL, NULL, &_Latin1Impl, "LATIN_1",      /* two unset pointers, the LATIN_1 function table, the converter name string */
+    819, UCNV_IBM, UCNV_LATIN_1, 1, 1,        /* NOTE(review): presumably code page 819, platform, converter type, min/max bytes per char - confirm */
+    { 0, 1, 0x1a, 0, 0, 0 }                   /* NOTE(review): presumably substitution-character data (0x1a) - confirm against UConverterSharedData */
+};
--- a/icu4c/source/common/ucnv_mbcs.c
+++ b/icu4c/source/common/ucnv_mbcs.c
@ -3,7 +3,7 @@
 *   Copyright (C) 2000, International Business Machines
 *   Corporation and others.  All Rights Reserved.
 **********************************************************************
-*   file name:  ucnv_mbcs.cpp
+*   file name:  ucnvmbcs.cpp
 *   encoding:   US-ASCII
 *   tab size:   8 (not used)
 *   indentation:4
--- a/icu4c/source/common/ucnv_sbcs.c
+++ b/icu4c/source/common/ucnv_sbcs.c
@ -3,7 +3,7 @@
 *   Copyright (C) 2000, International Business Machines
 *   Corporation and others.  All Rights Reserved.
 **********************************************************************
-*   file name:  ucnv_sbcs.cpp
+*   file name:  ucnvsbcs.cpp
 *   encoding:   US-ASCII
 *   tab size:   8 (not used)
 *   indentation:4