/*========================================================================= Program: Visualization Toolkit Module: vtkUTF8TextCodec.cxx Copyright (c) All rights reserved. See Copyright.txt or http://www.kitware.com/Copyright.htm for details. This software is distributed WITHOUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the above copyright notice for more information. =========================================================================*/ /*------------------------------------------------------------------------- Copyright 2010 Sandia Corporation. Under the terms of Contract DE-AC04-94AL85000 with Sandia Corporation, the U.S. Government retains certain rights in this software. -------------------------------------------------------------------------*/ #include "vtkUTF8TextCodec.h" #include "vtkObjectFactory.h" #include "vtkTextCodecFactory.h" #include vtkStandardNewMacro(vtkUTF8TextCodec); bool vtkUTF8TextCodec::CanHandle(const char* testStr) { if (0 == strcmp(testStr, "UTF-8")) { return true; } else { return false; } } namespace { // iterator to use in testing validity - throws all input away. class testIterator : public vtkTextCodec::OutputIterator { public: testIterator& operator++(int) override {return *this;} testIterator& operator*() override {return *this;} testIterator& operator=(const vtkUnicodeString::value_type) override {return *this;} testIterator() {} ~testIterator() override {} private: testIterator(const testIterator&) = delete; const testIterator& operator=(const testIterator&) = delete; }; } // end anonymous namespace bool vtkUTF8TextCodec::IsValid(istream& InputStream) { bool returnBool = true; // get the position of the stream so we can restore it when we are done istream::pos_type StreamPos = InputStream.tellg(); try { testIterator junk; this->ToUnicode(InputStream, junk); } catch(...) { returnBool = false; } // reset the stream InputStream.clear(); InputStream.seekg(StreamPos); return returnBool; } void vtkUTF8TextCodec::ToUnicode(istream& InputStream, vtkTextCodec::OutputIterator& Output) { try { while (!InputStream.eof()) { vtkUnicodeString::value_type CodePoint = this->NextUnicode(InputStream); *Output++ = CodePoint; } } catch (std::string& ef) { if (ef == "End of Input") { return; // we just completed the sequence... } else { throw; } } } vtkUnicodeString::value_type vtkUTF8TextCodec::NextUnicode(istream& InputStream) { istream::char_type c[5]; c[4] = '\0'; unsigned int getSize = 0; c[getSize] = InputStream.get(); if (InputStream.fail()) { throw(std::string("End of Input")); } getSize = vtk_utf8::internal::sequence_length(c); if (0 == getSize) throw(std::string("Not enough space")); for (unsigned int i = 1; i < getSize; ++i) { c[i] = InputStream.get(); if (InputStream.fail()) throw(std::string("Not enough space")); } istream::char_type* c1 = c; const vtkTypeUInt32 code_point = vtk_utf8::next(c1, &c[getSize]); return code_point; } vtkUTF8TextCodec::vtkUTF8TextCodec() : vtkTextCodec() { } vtkUTF8TextCodec::~vtkUTF8TextCodec() { } void vtkUTF8TextCodec::PrintSelf(ostream& os, vtkIndent indent) { os << indent << "vtkUTF8TextCodec (" << this << ") \n"; indent = indent.GetNextIndent(); this->Superclass::PrintSelf(os, indent.GetNextIndent()); }