// Copyright (c) 2010, Amar Takhar
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are met:
//
// * Redistributions of source code must retain the above copyright notice,
// this list of conditions and the following disclaimer.
// * Redistributions in binary form must reproduce the above copyright notice,
// this list of conditions and the following disclaimer in the documentation
// and/or other materials provided with the distribution.
// * Neither the name of the Aegisub Group nor the names of its contributors
// may be used to endorse or promote products derived from this software
// without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
// POSSIBILITY OF SUCH DAMAGE.
//
// Aegisub Project http://www.aegisub.org/
//
// $Id$
/// @file charset_detect.cpp
/// @brief Wrapper around text encoding detection library
/// @ingroup utility
///
2009-01-04 07:31:48 +01:00
# include "config.h"
2009-09-10 15:06:40 +02:00
# ifndef AGI_PRE
2009-09-11 03:07:38 +02:00
# include <fstream>
2009-09-10 07:25:25 +02:00
# include <list>
2009-09-10 15:06:40 +02:00
2009-09-11 04:30:10 +02:00
# include <wx/arrstr.h>
2009-09-10 07:25:25 +02:00
# include <wx/choicdlg.h>
2009-09-10 15:06:40 +02:00
# include <wx/intl.h>
# endif
2009-09-10 07:25:25 +02:00
2010-05-29 04:25:19 +02:00
# include <libaegisub/charset.h>
2010-06-01 10:21:30 +02:00
# include <libaegisub/log.h>
2010-05-29 04:25:19 +02:00
2009-09-10 15:06:40 +02:00
# include "charset_detect.h"
2010-05-29 04:25:19 +02:00
# include "compat.h"
2009-09-10 07:25:25 +02:00
2010-06-03 22:31:43 +02:00
namespace CharSetDetect {
2007-04-08 08:01:41 +02:00
2010-06-03 22:31:43 +02:00
wxString GetEncoding ( wxString const & filename ) {
2010-05-29 04:25:19 +02:00
bool unknown = 0 ;
2007-04-08 08:01:41 +02:00
2010-05-29 04:25:19 +02:00
agi : : charset : : CharsetListDetected list ;
agi : : charset : : CharsetListDetected : : const_iterator i_lst ;
2007-04-08 08:01:41 +02:00
2010-05-29 04:25:19 +02:00
try {
agi : : charset : : DetectAll ( STD_STR ( filename ) , list ) ;
2010-06-03 22:31:43 +02:00
} catch ( const agi : : charset : : UnknownCharset & ) {
2010-05-29 04:25:19 +02:00
unknown = 1 ;
2008-01-17 19:35:06 +01:00
}
2010-05-29 04:25:19 +02:00
/// @todo If the charset is unknown we need to display a complete list of character sets.
if ( list . size ( ) > 1 ) {
2008-01-17 19:35:06 +01:00
// Get choice from user
wxArrayString choices ;
2010-05-29 04:25:19 +02:00
2010-06-27 22:03:38 +02:00
std : : string log_choice ;
2010-05-29 04:25:19 +02:00
for ( i_lst = list . begin ( ) ; i_lst ! = list . end ( ) ; + + i_lst ) {
choices . Add ( lagi_wxString ( i_lst - > second ) ) ;
2010-06-27 22:03:38 +02:00
log_choice . append ( " " + i_lst - > second ) ;
2008-01-17 19:35:06 +01:00
}
2010-05-29 04:25:19 +02:00
2010-06-27 22:03:38 +02:00
LOG_I ( " charset/file " ) < < filename < < " ( " < < log_choice < < " ) " ;
2008-01-17 19:35:06 +01:00
int choice = wxGetSingleChoiceIndex ( _ ( " Aegisub could not narrow down the character set to a single one. \n Please pick one below: " ) , _ ( " Choose character set " ) , choices ) ;
if ( choice = = - 1 ) throw _T ( " Canceled " ) ;
2010-05-29 04:25:19 +02:00
return choices . Item ( choice ) ;
2008-01-17 19:35:06 +01:00
}
2008-01-20 08:24:04 +01:00
2010-05-29 04:25:19 +02:00
i_lst = list . begin ( ) ;
2010-06-27 22:03:38 +02:00
LOG_I ( " charset/file " ) < < filename < < " ( " < < i_lst - > second < < " ) " ;
2010-05-29 04:25:19 +02:00
return i_lst - > second ;
2008-01-20 08:24:04 +01:00
}
2010-06-03 22:31:43 +02:00
}