2012-10-12 04:12:42 +02:00
|
|
|
// Copyright (c) 2012, Thomas Goyne <plorkyeran@aegisub.org>
|
|
|
|
//
|
|
|
|
// Permission to use, copy, modify, and distribute this software for any
|
|
|
|
// purpose with or without fee is hereby granted, provided that the above
|
|
|
|
// copyright notice and this permission notice appear in all copies.
|
|
|
|
//
|
|
|
|
// THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
|
|
|
// WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
|
|
|
// MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR
|
|
|
|
// ANY SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
|
|
|
// WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN
|
|
|
|
// ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF
|
|
|
|
// OR IN CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE.
|
|
|
|
|
|
|
|
#include "ass_parser.h"
|
|
|
|
|
|
|
|
#include "ass_attachment.h"
|
|
|
|
#include "ass_dialogue.h"
|
|
|
|
#include "ass_file.h"
|
2012-12-08 03:51:09 +01:00
|
|
|
#include "ass_info.h"
|
2012-10-12 04:12:42 +02:00
|
|
|
#include "ass_style.h"
|
2014-04-22 19:21:00 +02:00
|
|
|
#include "string_codec.h"
|
2012-10-25 15:45:06 +02:00
|
|
|
#include "subtitle_format.h"
|
2012-10-12 04:12:42 +02:00
|
|
|
|
2014-04-25 16:04:08 +02:00
|
|
|
#include <libaegisub/ass/uuencode.h>
|
2014-04-23 22:53:24 +02:00
|
|
|
#include <libaegisub/make_unique.h>
|
2014-05-22 03:32:42 +02:00
|
|
|
#include <libaegisub/util.h>
|
2014-04-23 01:34:18 +02:00
|
|
|
|
2012-11-25 01:08:29 +01:00
|
|
|
#include <algorithm>
|
2013-01-04 16:01:50 +01:00
|
|
|
#include <boost/algorithm/string/case_conv.hpp>
|
|
|
|
#include <boost/algorithm/string/predicate.hpp>
|
|
|
|
#include <boost/algorithm/string/trim.hpp>
|
2014-04-22 19:21:00 +02:00
|
|
|
#include <boost/lexical_cast.hpp>
|
|
|
|
#include <boost/regex.hpp>
|
2014-05-22 03:32:42 +02:00
|
|
|
#include <boost/variant.hpp>
|
|
|
|
#include <unordered_map>
|
|
|
|
|
|
|
|
/// Routes "Key: Value" header lines to the matching ProjectProperties member.
///
/// Every known header name is associated with a pointer-to-member of
/// ProjectProperties. The variant records whether that member is a
/// std::string, an int or a double so that the textual value can either be
/// stored directly or parsed first.
class AssParser::HeaderToProperty {
	using field = boost::variant<
		std::string ProjectProperties::*,
		int ProjectProperties::*,
		double ProjectProperties::*
	>;

	/// Header name -> member of ProjectProperties it populates. Several names
	/// may refer to the same member (e.g. both "Audio URI" and "Audio File"
	/// set audio_file).
	std::unordered_map<std::string, field> fields;

public:
	HeaderToProperty()
	: fields({
		{"Automation Scripts", &ProjectProperties::automation_scripts},
		{"Export Filters", &ProjectProperties::export_filters},
		{"Export Encoding", &ProjectProperties::export_encoding},
		{"Last Style Storage", &ProjectProperties::style_storage},
		{"Audio URI", &ProjectProperties::audio_file},
		{"Audio File", &ProjectProperties::audio_file},
		{"Video File", &ProjectProperties::video_file},
		{"Timecodes File", &ProjectProperties::timecodes_file},
		{"Keyframes File", &ProjectProperties::keyframes_file},
		{"Video Zoom Percent", &ProjectProperties::video_zoom},
		{"Scroll Position", &ProjectProperties::scroll_position},
		{"Active Line", &ProjectProperties::active_row},
		{"Video Position", &ProjectProperties::video_position},
		{"Video AR Mode", &ProjectProperties::ar_mode},
		{"Video AR Value", &ProjectProperties::ar_value},
		{"Aegisub Video Zoom Percent", &ProjectProperties::video_zoom},
		{"Aegisub Scroll Position", &ProjectProperties::scroll_position},
		{"Aegisub Active Line", &ProjectProperties::active_row},
		{"Aegisub Video Position", &ProjectProperties::video_position}
	})
	{
	}

	/// Store a header value in the project properties of a file.
	/// @param target File whose Properties member is updated
	/// @param key    Header name, i.e. the text before the colon
	/// @param value  Header value
	/// @return true if the key was recognised and consumed, false if the
	///         caller still has to deal with the line
	bool ProcessProperty(AssFile *target, std::string const& key, std::string const& value) {
		auto it = fields.find(key);
		if (it != end(fields)) {
			using namespace agi::util;

			// Visitor picking the assignment that matches the member's type.
			// The result of try_parse is ignored; presumably the field is
			// left untouched when the value does not parse (confirm against
			// agi::util::try_parse).
			struct {
				using result_type = void;
				ProjectProperties &obj;
				std::string const& value;
				void operator()(std::string ProjectProperties::*f) const { obj.*f = value; }
				void operator()(int ProjectProperties::*f) const { try_parse(value, &(obj.*f)); }
				void operator()(double ProjectProperties::*f) const { try_parse(value, &(obj.*f)); }
			} visitor {target->Properties, value};
			boost::apply_visitor(visitor, it->second);
			return true;
		}

		// "Automation Settings <name>" lines are stored under <name>. The
		// same prefix, including its trailing space, is used for both the
		// match and the strip so the stored name does not begin with the
		// separator.
		static const std::string automation_prefix("Automation Settings ");
		if (boost::starts_with(key, automation_prefix)) {
			target->Properties.automation_settings[key.substr(automation_prefix.size())] = value;
			return true;
		}

		return false;
	}
};
|
2012-10-19 17:57:56 +02:00
|
|
|
|
2012-10-12 04:12:42 +02:00
|
|
|
/// Create a parser which fills in the given file.
/// @param target  File receiving the parsed data
/// @param version Initial style format version (0 and 1 are the values this
///                file assigns for "v4.00" and "v4.00+" respectively)
///
/// Lines are handed to ParseScriptInfoLine until a section header selects a
/// different handler.
AssParser::AssParser(AssFile *target, int version)
	: property_handler(agi::make_unique<HeaderToProperty>()),
	  target(target),
	  version(version),
	  state(&AssParser::ParseScriptInfoLine)
{}
|
|
|
|
|
|
|
|
/// Nothing to release by hand. The destructor is defined in this file, where
/// HeaderToProperty is a complete type (presumably so that the owning
/// property_handler pointer can destroy it).
AssParser::~AssParser() = default;
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseAttachmentLine(std::string const& data) {
|
|
|
|
bool is_filename = boost::starts_with(data, "fontname: ") || boost::starts_with(data, "filename: ");
|
2012-10-12 04:12:42 +02:00
|
|
|
|
2012-10-12 04:57:53 +02:00
|
|
|
bool valid_data = data.size() > 0 && data.size() <= 80;
|
2012-11-04 04:53:03 +01:00
|
|
|
for (auto byte : data) {
|
|
|
|
if (byte < 33 || byte >= 97) {
|
2012-10-12 04:57:53 +02:00
|
|
|
valid_data = false;
|
|
|
|
break;
|
2012-10-12 04:12:42 +02:00
|
|
|
}
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// Data is over, add attachment to the file
|
|
|
|
if (!valid_data || is_filename) {
|
2014-03-07 18:02:24 +01:00
|
|
|
target->Attachments.push_back(*attach.release());
|
2012-10-12 04:57:53 +02:00
|
|
|
AddLine(data);
|
|
|
|
}
|
|
|
|
else {
|
|
|
|
attach->AddData(data);
|
2012-10-12 04:12:42 +02:00
|
|
|
|
2012-10-12 04:57:53 +02:00
|
|
|
// Done building
|
2013-02-07 18:56:07 +01:00
|
|
|
if (data.size() < 80)
|
2014-03-07 18:02:24 +01:00
|
|
|
target->Attachments.push_back(*attach.release());
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseScriptInfoLine(std::string const& data) {
|
|
|
|
if (boost::starts_with(data, ";")) {
|
2012-10-12 04:57:53 +02:00
|
|
|
// Skip stupid comments added by other programs
|
|
|
|
// Of course, we'll add our own in place later... ;)
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
if (boost::starts_with(data, "ScriptType:")) {
|
|
|
|
std::string version_str = data.substr(11);
|
|
|
|
boost::trim(version_str);
|
|
|
|
boost::to_lower(version_str);
|
|
|
|
if (version_str == "v4.00")
|
|
|
|
version = 0;
|
|
|
|
else if (version_str == "v4.00+")
|
|
|
|
version = 1;
|
2012-10-12 04:57:53 +02:00
|
|
|
else
|
2014-05-29 14:57:27 +02:00
|
|
|
throw SubtitleFormatParseError("Unknown SSA file format version");
|
2012-10-12 04:12:42 +02:00
|
|
|
}
|
|
|
|
|
2013-03-30 15:18:34 +01:00
|
|
|
// Nothing actually supports the Collisions property and malformed values
|
|
|
|
// crash VSFilter, so just remove it entirely
|
|
|
|
if (boost::starts_with(data, "Collisions:"))
|
|
|
|
return;
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
size_t pos = data.find(':');
|
|
|
|
if (pos == data.npos) return;
|
|
|
|
|
2014-05-22 03:32:42 +02:00
|
|
|
auto key = data.substr(0, pos);
|
|
|
|
auto value = data.substr(pos + 1);
|
|
|
|
boost::trim_left(value);
|
|
|
|
|
|
|
|
if (!property_handler->ProcessProperty(target, key, value))
|
|
|
|
target->Info.push_back(*new AssInfo(std::move(key), std::move(value)));
|
|
|
|
}
|
|
|
|
|
|
|
|
/// Handle a line from the project metadata section.
///
/// "Key: Value" lines are passed to the property handler. Lines without a
/// colon, and keys the handler does not recognise, are silently dropped.
/// @param data Line to process
void AssParser::ParseMetadataLine(std::string const& data) {
	const size_t colon = data.find(':');
	if (colon != std::string::npos) {
		const std::string key = data.substr(0, colon);
		const std::string value = boost::trim_left_copy(data.substr(colon + 1));
		property_handler->ProcessProperty(target, key, value);
	}
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseEventLine(std::string const& data) {
|
|
|
|
if (boost::starts_with(data, "Dialogue:") || boost::starts_with(data, "Comment:"))
|
2014-03-07 18:02:24 +01:00
|
|
|
target->Events.push_back(*new AssDialogue(data));
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseStyleLine(std::string const& data) {
|
|
|
|
if (boost::starts_with(data, "Style:"))
|
2014-03-07 18:02:24 +01:00
|
|
|
target->Styles.push_back(*new AssStyle(data, version));
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseFontLine(std::string const& data) {
|
|
|
|
if (boost::starts_with(data, "fontname: "))
|
2014-04-23 22:53:24 +02:00
|
|
|
attach = agi::make_unique<AssAttachment>(data, AssEntryGroup::FONT);
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::ParseGraphicsLine(std::string const& data) {
|
|
|
|
if (boost::starts_with(data, "filename: "))
|
2014-04-23 22:53:24 +02:00
|
|
|
attach = agi::make_unique<AssAttachment>(data, AssEntryGroup::GRAPHIC);
|
2012-10-12 04:57:53 +02:00
|
|
|
}
|
|
|
|
|
2014-04-22 19:21:00 +02:00
|
|
|
void AssParser::ParseExtradataLine(std::string const &data) {
|
2014-04-25 16:04:08 +02:00
|
|
|
static const boost::regex matcher("Data:[[:space:]]*(\\d+),([^,]+),(.)(.*)");
|
2014-04-22 19:21:00 +02:00
|
|
|
boost::match_results<std::string::const_iterator> mr;
|
|
|
|
|
|
|
|
if (boost::regex_match(data, mr, matcher)) {
|
|
|
|
auto id = boost::lexical_cast<uint32_t>(mr.str(1));
|
|
|
|
auto key = inline_string_decode(mr.str(2));
|
2014-04-25 16:04:08 +02:00
|
|
|
auto valuetype = mr.str(3);
|
|
|
|
auto value = mr.str(4);
|
|
|
|
if (valuetype == "e") {
|
|
|
|
// escaped/inline_string encoded
|
|
|
|
value = inline_string_decode(value);
|
|
|
|
} else if (valuetype == "u") {
|
|
|
|
// ass uuencoded
|
|
|
|
auto valuedata = agi::ass::UUDecode(value);
|
|
|
|
value = std::string(valuedata.begin(), valuedata.end());
|
|
|
|
} else {
|
|
|
|
// unknown, error?
|
|
|
|
value = "";
|
|
|
|
}
|
2014-04-22 19:21:00 +02:00
|
|
|
|
|
|
|
// ensure next_extradata_id is always at least 1 more than the largest existing id
|
|
|
|
target->next_extradata_id = std::max(id+1, target->next_extradata_id);
|
2014-09-06 18:16:44 +02:00
|
|
|
target->Extradata.push_back(ExtradataEntry{id, std::move(key), std::move(value)});
|
2014-04-22 19:21:00 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2013-01-04 16:01:50 +01:00
|
|
|
void AssParser::AddLine(std::string const& data) {
|
2012-10-12 04:57:53 +02:00
|
|
|
// Special-case for attachments since a line could theoretically be both a
|
|
|
|
// valid attachment data line and a valid section header, and if an
|
|
|
|
// attachment is in progress it needs to be treated as that
|
|
|
|
if (attach.get()) {
|
|
|
|
ParseAttachmentLine(data);
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2012-10-12 04:12:42 +02:00
|
|
|
if (data.empty()) return;
|
|
|
|
|
|
|
|
// Section header
|
2013-01-04 16:01:50 +01:00
|
|
|
if (data[0] == '[' && data.back() == ']') {
|
2012-10-12 04:12:42 +02:00
|
|
|
// Ugly hacks to allow intermixed v4 and v4+ style sections
|
2013-01-04 16:01:50 +01:00
|
|
|
const std::string low = boost::to_lower_copy(data);
|
2012-10-12 04:12:42 +02:00
|
|
|
if (low == "[v4 styles]") {
|
|
|
|
version = 0;
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseStyleLine;
|
2012-10-12 04:12:42 +02:00
|
|
|
}
|
|
|
|
else if (low == "[v4+ styles]") {
|
|
|
|
version = 1;
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseStyleLine;
|
2012-10-12 04:12:42 +02:00
|
|
|
}
|
2012-11-22 17:14:34 +01:00
|
|
|
else if (low == "[events]")
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseEventLine;
|
2012-11-22 17:14:34 +01:00
|
|
|
else if (low == "[script info]")
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseScriptInfoLine;
|
2014-05-22 03:32:42 +02:00
|
|
|
else if (low == "[aegisub project garbage]")
|
|
|
|
state = &AssParser::ParseMetadataLine;
|
|
|
|
else if (low == "[aegisub extradata]")
|
|
|
|
state = &AssParser::ParseExtradataLine;
|
2012-11-22 17:14:34 +01:00
|
|
|
else if (low == "[graphics]")
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseGraphicsLine;
|
2012-11-22 17:14:34 +01:00
|
|
|
else if (low == "[fonts]")
|
2012-10-12 04:57:53 +02:00
|
|
|
state = &AssParser::ParseFontLine;
|
2012-11-22 17:14:34 +01:00
|
|
|
else
|
2012-11-24 22:58:24 +01:00
|
|
|
state = &AssParser::UnknownLine;
|
2012-10-12 04:12:42 +02:00
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
2012-10-12 04:57:53 +02:00
|
|
|
(this->*state)(data);
|
2012-10-12 04:12:42 +02:00
|
|
|
}
|