Aegisub/aegisub/src/text_file_reader.cpp
Thomas Goyne 5a38d69921 Open files as binary in TextFileReader
Text mode does undesirable things like stopping when it hits an EOF
byte, which can be a valid part of a UTF-16 character, and line_iterator
handles stripping \r anyway.

Originally committed to SVN as r6958.
2012-08-19 14:11:29 -07:00

90 lines
2.9 KiB
C++

// Copyright (c) 2010, Thomas Goyne
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// * Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
// * Neither the name of the Aegisub Group nor the names of its contributors
// may be used to endorse or promote products derived from this software
// without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// Aegisub Project http://www.aegisub.org/
//
// $Id$
/// @file text_file_reader.cpp
/// @brief Read plain text files line by line
/// @ingroup utility
///
#include "config.h"
#ifndef AGI_PRE
#include <assert.h>
#include <errno.h>
#include <algorithm>
#include <string>
#include <wx/string.h>
#endif
#include <libaegisub/io.h>
#include <libaegisub/log.h>
#include "charset_detect.h"
#include "compat.h"
#include "text_file_reader.h"
TextFileReader::TextFileReader(wxString const& filename, wxString encoding, bool trim)
: trim(trim)
{
if (encoding.empty()) encoding = CharSetDetect::GetEncoding(filename);
file.reset(agi::io::Open(STD_STR(filename), true));
iter = agi::line_iterator<wxString>(*file, STD_STR(encoding));
}
TextFileReader::~TextFileReader() {
}
wxString TextFileReader::ReadLineFromFile() {
wxString str = *iter;
++iter;
if (trim) str.Trim(true).Trim(false);
if (str.StartsWith(L"\uFEFF")) str = str.Mid(1);
return str;
}
namespace agi {
#ifdef _WIN32
template<> void line_iterator<wxString>::init() {
conv.reset(new agi::charset::IconvWrapper(encoding.c_str(), "utf-16le"));
}
template<> bool line_iterator<wxString>::convert(std::string &str) {
value = wxString(str.c_str(), wxMBConvUTF16LE(), str.size());
return true;
}
#else
template<> bool line_iterator<wxString>::convert(std::string &str) {
value = str;
return true;
}
#endif
}