Added option to read from and write to files as well as console. This allows

transcode to process binary files properly - eg to Base64 an image.
2025-01-17 18:12:04 +01:00 · 2003-10-27 15:44:32 +00:00 · 2003-10-27 15:44:32 +00:00 · bf2c892506
commit bf2c892506
parent e99734c401
1 changed files with 131 additions and 75 deletions
--- a/examples/Utils/transcode.cpp
+++ b/examples/Utils/transcode.cpp
@ -15,10 +15,14 @@
 #include <Utils/utf16beucs2codecvt.h>
 #include <Utils/utf16leucs2codecvt.h>
-using namespace Arabica::convert;
+#include <fstream>
 std::ifstream inputFile;
 std::ofstream outputFile;
 using namespace Arabica::convert;
 iconvert_adaptor<char> iByteConvertor(std::cin);
 oconvert_adaptor<char> oByteConvertor(std::cout);
 bool needWCharIntermediary = false;
 #ifndef ARABICA_NO_WCHAR_T
 typedef iconvert_adaptor<wchar_t, std::char_traits<wchar_t>, char, std::char_traits<char> > Widener;
@ -28,21 +32,37 @@ Widener iCharAdaptor(iByteConvertor);
 Narrower oCharAdaptor(oByteConvertor);
 #endif 
-void transcode();
+void wchar_transcode();
-void imbueCodecvts(int argc, const char* argv[]);
+void byte_transcode();
 bool processArgs(int argc, const char* argv[]);
 bool imbueInput(int& argn, int argc, const char* argv[]);
 bool imbueOutput(int& argn, int argc, const char* argv[]);
 int main(int argc, const char* argv[])
 {
-  imbueCodecvts(argc, argv);
+  if(!processArgs(argc, argv))
  {
    std::cerr << argv[0] << "\n"
              << "  [(-ie|--input-encoding) input-encoding]\n" 
              << "  [(-oe|--output-encoding) output-encoding]\n" 
              << "  [(-i|--input) input-filename]\n"
              << "  [(-o|--output) output-filename]"
              << std::endl;
    return 0;
  }
-  transcode();
+  if(needWCharIntermediary)
    wchar_transcode();
  else
    byte_transcode();
  return 0;
 } // main
-#ifndef ARABICA_NO_WCHAR_T
+void wchar_transcode()
 void transcode()
 {
 #ifndef ARABICA_NO_WCHAR_T
  int count = 0;
  wchar_t c = iCharAdaptor.get();
  while(!iCharAdaptor.eof())
@ -60,9 +80,10 @@ void transcode()
  }
  oCharAdaptor.flush();
  oByteConvertor.flush(); 
-} // transcode
+#endif
-#else
+} // wchar_transcode
-void transcode()
+
 void byte_transcode()
 {
  int count = 0;
  char c = iByteConvertor.get();
@ -80,78 +101,113 @@ void transcode()
  } // while
  oByteConvertor.flush();
-} // transcode
+} // byte_transcode
 #endif
-void imbueCodecvts(int argc, const char* argv[])
+bool processArgs(int argc, const char* argv[])
 {
 #ifndef ARABICA_NO_WCHAR_T
  oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf16beucs2codecvt()));
 #endif
  for(int i = 1; i < argc; ++i)
  {
    std::string io(argv[i]);
-    bool input = true;
+    if(io == "-ie" || io == "--input-encoding") 
    if(io == "-i" || io == "--input")
      input = true;
    else if(io == "-o" || io == "--output")
      input = false;
    else
    {
-      std::cerr << argv[0] << " [(-i|--input) input-encoding] [(-o|--output) output-encoding] " << std::endl;
+      if(!(imbueInput(i, argc, argv)))
-      std::exit(0);
+        return false;
    } // 
    ++i;
    if(i >= argc)
    {
      std::cerr << argv[0] << " [(-i|--input) input-encoding] [(-o|--output) output-encoding] " << std::endl;
      std::exit(0);
    } // 
    std::string cvt(argv[i]);
    if(input)
    {
      if(cvt == "rot13")
        iByteConvertor.imbue(std::locale(iByteConvertor.getloc(), new rot13codecvt()));
      else if(cvt == "base64")
        iByteConvertor.imbue(std::locale(iByteConvertor.getloc(), new base64codecvt()));
 #ifndef ARABICA_NO_WCHAR_T
      else if(cvt == "utf8")
        iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf8ucs2codecvt()));
      else if(cvt == "utf16be")
        iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf16beucs2codecvt()));
      else if(cvt == "utf16le")
        iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf16leucs2codecvt()));
 #endif
      else
      {
        std::cerr << cvt << " is not a valid input encoding." << std::endl;
        std::exit(0);
      }
    }
-    else
+    else if(io == "-oe" || io == "--output-encoding") 
    {
-      if(cvt == "rot13")
+      if(!(imbueOutput(i, argc, argv)))
-        oByteConvertor.imbue(std::locale(oByteConvertor.getloc(), new rot13codecvt()));
+        return false;
-      else if(cvt == "base64")
+    }
-        oByteConvertor.imbue(std::locale(oByteConvertor.getloc(), new base64codecvt()));
+    else if(io == "-i" || io == "--input")
-#ifndef ARABICA_NO_WCHAR_T
+    {
-      else if(cvt == "utf8")
+      ++i;
-        oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf8ucs2codecvt()));
+      if(i >= argc)
-      else if(cvt == "utf16be")
+        return false;
-        oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf16beucs2codecvt()));
+      inputFile.open(argv[i], std::ios_base::in | std::ios_base::binary);
-      else if(cvt == "utf16le")
+      iByteConvertor.set_stream(inputFile);
-        oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf16leucs2codecvt()));
+    }  
-#endif
+    else if(io == "-o" || io == "--output")
-      else 
+    {
-      {
+      ++i;
-        std::cerr << cvt << " is not a valid output encoding." << std::endl;
+      if(i >= argc)
-        std::exit(0);
+        return false;
-      }
+      outputFile.open(argv[i], std::ios_base::out | std::ios_base::trunc | std::ios_base::binary);
-    } 
+      oByteConvertor.set_stream(outputFile);
-  } // for ...
+    }  
-} // imbueCodeCvts
+    else
      return false;
  }
  return true;
 } // processArgs
 bool imbueInput(int& argn, int argc, const char* argv[])
 {
  ++argn;
  if(argn >= argc)
    return false;
  std::string cvt(argv[argn]);
  if(cvt == "rot13")
    iByteConvertor.imbue(std::locale(iByteConvertor.getloc(), new rot13codecvt()));
  else if(cvt == "base64")
    iByteConvertor.imbue(std::locale(iByteConvertor.getloc(), new base64codecvt()));
 #ifndef ARABICA_NO_WCHAR_T
  else if(cvt == "utf8")
    iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf8ucs2codecvt()));
  else if(cvt == "utf16be")
    iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf16beucs2codecvt()));
  else if(cvt == "utf16le")
    iCharAdaptor.imbue(std::locale(iCharAdaptor.getloc(), new utf16leucs2codecvt()));
 #endif
  else
  {
    std::cerr << cvt << " is not a valid input encoding." << std::endl;
    return false;
  }
 #ifndef ARABICA_NO_WCHAR_T
  if((cvt == "utf8") || 
      (cvt == "utf16be") || 
      (cvt == "utf16le"))
    needWCharIntermediary = true;
 #endif
  return true;
 } // imbueInput
 bool imbueOutput(int& argn, int argc, const char* argv[])
 {
  ++argn;
  if(argn >= argc)
    return false;
  std::string cvt(argv[argn]);
  if(cvt == "rot13")
    oByteConvertor.imbue(std::locale(oByteConvertor.getloc(), new rot13codecvt()));
  else if(cvt == "base64")
    oByteConvertor.imbue(std::locale(oByteConvertor.getloc(), new base64codecvt()));
 #ifndef ARABICA_NO_WCHAR_T
  else if(cvt == "utf8")
    oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf8ucs2codecvt()));
  else if(cvt == "utf16be")
    oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf16beucs2codecvt()));
  else if(cvt == "utf16le")
    oCharAdaptor.imbue(std::locale(oCharAdaptor.getloc(), new utf16leucs2codecvt()));
 #endif
  else 
  {
    std::cerr << cvt << " is not a valid output encoding." << std::endl;
    return false;
  }
 #ifndef ARABICA_NO_WCHAR_T
    if((cvt == "utf8") || 
       (cvt == "utf16be") || 
       (cvt == "utf16le"))
      needWCharIntermediary = true;
 #endif
  return true;
 } // imbueOutputs