2010-05-29 04:25:19 +02:00
|
|
|
// Copyright (c) 2010, Amar Takhar
|
2007-04-08 08:01:41 +02:00
|
|
|
// All rights reserved.
|
|
|
|
//
|
|
|
|
// Redistribution and use in source and binary forms, with or without
|
|
|
|
// modification, are permitted provided that the following conditions are met:
|
|
|
|
//
|
|
|
|
// * Redistributions of source code must retain the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer.
|
|
|
|
// * Redistributions in binary form must reproduce the above copyright notice,
|
|
|
|
// this list of conditions and the following disclaimer in the documentation
|
|
|
|
// and/or other materials provided with the distribution.
|
|
|
|
// * Neither the name of the Aegisub Group nor the names of its contributors
|
|
|
|
// may be used to endorse or promote products derived from this software
|
|
|
|
// without specific prior written permission.
|
|
|
|
//
|
|
|
|
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
|
|
|
|
// AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
|
|
// IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
|
|
|
|
// ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
|
|
|
|
// LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
|
|
|
|
// CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
|
|
|
|
// SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
|
|
|
|
// INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
|
|
|
|
// CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
|
|
|
|
// ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
|
|
|
|
// POSSIBILITY OF SUCH DAMAGE.
|
|
|
|
//
|
2009-07-29 07:43:02 +02:00
|
|
|
// Aegisub Project http://www.aegisub.org/
|
|
|
|
|
|
|
|
/// @file charset_detect.cpp
|
|
|
|
/// @brief Wrapper around text encoding detection library
|
|
|
|
/// @ingroup utility
|
|
|
|
///
|
2007-04-08 08:01:41 +02:00
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
#include "charset_detect.h"
|
2009-09-10 15:06:40 +02:00
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
#include "compat.h"
|
2009-09-10 07:25:25 +02:00
|
|
|
|
2010-05-29 04:25:19 +02:00
|
|
|
#include <libaegisub/charset.h>
|
2013-02-05 04:17:04 +01:00
|
|
|
#include <libaegisub/charset_conv.h>
|
2010-06-01 10:21:30 +02:00
|
|
|
#include <libaegisub/log.h>
|
2010-05-29 04:25:19 +02:00
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
#include <boost/filesystem/path.hpp>
|
|
|
|
|
|
|
|
#include <wx/arrstr.h>
|
|
|
|
#include <wx/choicdlg.h>
|
|
|
|
#include <wx/intl.h>
|
2009-09-10 07:25:25 +02:00
|
|
|
|
2010-06-03 22:31:43 +02:00
|
|
|
namespace CharSetDetect {
|
2007-04-08 08:01:41 +02:00
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
std::string GetEncoding(agi::fs::path const& filename) {
|
2010-05-29 04:25:19 +02:00
|
|
|
agi::charset::CharsetListDetected list;
|
2007-04-08 08:01:41 +02:00
|
|
|
|
2010-05-29 04:25:19 +02:00
|
|
|
try {
|
2013-01-04 16:01:50 +01:00
|
|
|
list = agi::charset::DetectAll(filename);
|
2010-06-03 22:31:43 +02:00
|
|
|
} catch (const agi::charset::UnknownCharset&) {
|
2013-02-05 04:17:04 +01:00
|
|
|
// will be set to the full list of charsets below
|
2008-01-17 19:35:06 +01:00
|
|
|
}
|
|
|
|
|
2012-11-04 04:53:03 +01:00
|
|
|
if (list.size() == 1) {
|
|
|
|
auto charset = list.begin();
|
|
|
|
LOG_I("charset/file") << filename << " (" << charset->second << ")";
|
2013-01-04 16:01:50 +01:00
|
|
|
return charset->second;
|
2012-11-04 04:53:03 +01:00
|
|
|
}
|
2010-05-29 04:25:19 +02:00
|
|
|
|
2012-11-04 04:53:03 +01:00
|
|
|
wxArrayString choices;
|
|
|
|
std::string log_choice;
|
2010-06-27 22:03:38 +02:00
|
|
|
|
2012-11-04 04:53:03 +01:00
|
|
|
for (auto const& charset : list) {
|
|
|
|
choices.push_back(to_wx(charset.second));
|
|
|
|
log_choice.append(" " + charset.second);
|
2008-01-17 19:35:06 +01:00
|
|
|
}
|
2008-01-20 08:24:04 +01:00
|
|
|
|
2012-11-04 04:53:03 +01:00
|
|
|
LOG_I("charset/file") << filename << " (" << log_choice << ")";
|
|
|
|
|
2013-02-05 04:17:04 +01:00
|
|
|
if (choices.empty())
|
|
|
|
choices = agi::charset::GetEncodingsList<wxArrayString>();
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
int choice = wxGetSingleChoiceIndex(
|
|
|
|
_("Aegisub could not narrow down the character set to a single one.\nPlease pick one below:"),
|
|
|
|
_("Choose character set"),
|
|
|
|
choices);
|
|
|
|
if (choice == -1) throw agi::UserCancelException("Cancelled encoding selection");
|
2013-02-05 04:17:04 +01:00
|
|
|
if (list.empty())
|
|
|
|
return agi::charset::GetEncodingsList<std::vector<std::string>>()[choice];
|
2013-01-04 16:01:50 +01:00
|
|
|
return list[choice].second;
|
2008-01-20 08:24:04 +01:00
|
|
|
}
|
|
|
|
|
2010-06-03 22:31:43 +02:00
|
|
|
}
|