shaka-packager/packager/media/formats/webvtt/webvtt_utils.cc

353 lines
9.8 KiB
C++

// Copyright 2017 Google LLC. All rights reserved.
//
// Use of this source code is governed by a BSD-style
// license that can be found in the LICENSE file or at
// https://developers.google.com/open-source/licenses/bsd
#include <packager/media/formats/webvtt/webvtt_utils.h>
#include <algorithm>
#include <cctype>
#include <cinttypes>
#include <unordered_set>
#include <absl/strings/numbers.h>
#include <absl/strings/str_format.h>
#include <glog/logging.h>
namespace shaka {
namespace media {
namespace {
bool GetTotalMilliseconds(uint64_t hours,
uint64_t minutes,
uint64_t seconds,
uint64_t ms,
int64_t* out) {
DCHECK(out);
if (minutes > 59 || seconds > 59 || ms > 999) {
VLOG(1) << "Hours:" << hours << " Minutes:" << minutes
<< " Seconds:" << seconds << " MS:" << ms
<< " shoud have never made it to GetTotalMilliseconds";
return false;
}
*out = 60 * 60 * 1000 * hours + 60 * 1000 * minutes + 1000 * seconds + ms;
return true;
}
enum class StyleTagKind {
kUnderline,
kBold,
kItalic,
};
std::string GetOpenTag(StyleTagKind tag) {
switch (tag) {
case StyleTagKind::kUnderline:
return "<u>";
case StyleTagKind::kBold:
return "<b>";
case StyleTagKind::kItalic:
return "<i>";
}
return ""; // Not reached, but Windows doesn't like NOTIMPLEMENTED.
}
std::string GetCloseTag(StyleTagKind tag) {
switch (tag) {
case StyleTagKind::kUnderline:
return "</u>";
case StyleTagKind::kBold:
return "</b>";
case StyleTagKind::kItalic:
return "</i>";
}
return ""; // Not reached, but Windows doesn't like NOTIMPLEMENTED.
}
bool IsWhitespace(char c) {
return c == '\t' || c == '\r' || c == '\n' || c == ' ';
}
// Replace consecutive whitespaces with a single whitespace.
std::string CollapseWhitespace(const std::string& data) {
std::string output;
output.resize(data.size());
size_t chars_written = 0;
bool in_whitespace = false;
for (char c : data) {
if (IsWhitespace(c)) {
if (!in_whitespace) {
in_whitespace = true;
output[chars_written++] = ' ';
}
} else {
in_whitespace = false;
output[chars_written++] = c;
}
}
output.resize(chars_written);
return output;
}
std::string WriteFragment(const TextFragment& fragment,
std::list<StyleTagKind>* tags) {
std::string ret;
size_t local_tag_count = 0;
auto has = [tags](StyleTagKind tag) {
return std::find(tags->begin(), tags->end(), tag) != tags->end();
};
auto push_tag = [tags, &local_tag_count, &has](StyleTagKind tag) {
if (has(tag)) {
return std::string();
}
tags->push_back(tag);
local_tag_count++;
return GetOpenTag(tag);
};
if ((fragment.style.underline == false && has(StyleTagKind::kUnderline)) ||
(fragment.style.bold == false && has(StyleTagKind::kBold)) ||
(fragment.style.italic == false && has(StyleTagKind::kItalic))) {
LOG(WARNING) << "WebVTT output doesn't support disabling "
"underline/bold/italic within a cue";
}
if (fragment.newline) {
// Newlines represent separate WebVTT cues. So close the existing tags to
// be nice and re-open them on the new line.
for (auto it = tags->rbegin(); it != tags->rend(); it++) {
ret += GetCloseTag(*it);
}
ret += "\n";
for (const auto tag : *tags) {
ret += GetOpenTag(tag);
}
} else {
if (fragment.style.underline == true) {
ret += push_tag(StyleTagKind::kUnderline);
}
if (fragment.style.bold == true) {
ret += push_tag(StyleTagKind::kBold);
}
if (fragment.style.italic == true) {
ret += push_tag(StyleTagKind::kItalic);
}
if (!fragment.body.empty()) {
// Replace newlines and consecutive whitespace with a single space. If
// the user wanted an explicit newline, they should use the "newline"
// field.
ret += CollapseWhitespace(fragment.body);
} else {
for (const auto& frag : fragment.sub_fragments) {
ret += WriteFragment(frag, tags);
}
}
// Pop all the local tags we pushed.
while (local_tag_count > 0) {
ret += GetCloseTag(tags->back());
tags->pop_back();
local_tag_count--;
}
}
return ret;
}
} // namespace
bool WebVttTimestampToMs(const std::string_view& source, int64_t* out) {
DCHECK(out);
if (source.length() < 9) {
LOG(WARNING) << "Timestamp '" << source << "' is mal-formed";
return false;
}
const size_t minutes_begin = source.length() - 9;
const size_t seconds_begin = source.length() - 6;
const size_t milliseconds_begin = source.length() - 3;
uint64_t hours = 0;
uint64_t minutes = 0;
uint64_t seconds = 0;
uint64_t ms = 0;
const bool has_hours =
minutes_begin >= 3 && source[minutes_begin - 1] == ':' &&
absl::SimpleAtoi(source.substr(0, minutes_begin - 1), &hours);
if ((minutes_begin == 0 || has_hours) && source[seconds_begin - 1] == ':' &&
source[milliseconds_begin - 1] == '.' &&
absl::SimpleAtoi(source.substr(minutes_begin, 2), &minutes) &&
absl::SimpleAtoi(source.substr(seconds_begin, 2), &seconds) &&
absl::SimpleAtoi(source.substr(milliseconds_begin, 3), &ms)) {
return GetTotalMilliseconds(hours, minutes, seconds, ms, out);
}
LOG(WARNING) << "Timestamp '" << source << "' is mal-formed";
return false;
}
std::string MsToWebVttTimestamp(uint64_t ms) {
uint64_t remaining = ms;
uint64_t only_ms = remaining % 1000;
remaining /= 1000;
uint64_t only_seconds = remaining % 60;
remaining /= 60;
uint64_t only_minutes = remaining % 60;
remaining /= 60;
uint64_t only_hours = remaining;
return absl::StrFormat("%02" PRIu64 ":%02" PRIu64 ":%02" PRIu64 ".%03" PRIu64,
only_hours, only_minutes, only_seconds, only_ms);
}
std::string FloatToString(double number) {
// Keep up to microsecond accuracy but trim trailing 0s
std::string formatted = absl::StrFormat("%.6g", number);
size_t decimalPos = formatted.find('.');
if (decimalPos != std::string::npos) {
size_t lastNonZeroPos = formatted.find_last_not_of('0');
if (lastNonZeroPos >= decimalPos) {
formatted.erase(lastNonZeroPos + 1);
}
if (formatted.back() == '.') {
formatted.pop_back();
}
}
return formatted;
}
std::string WebVttSettingsToString(const TextSettings& settings) {
std::string ret;
if (!settings.region.empty()) {
ret += " region:";
ret += settings.region;
}
if (settings.line) {
switch (settings.line->type) {
case TextUnitType::kPercent:
ret += " line:";
ret += FloatToString(settings.line->value);
ret += "%";
break;
case TextUnitType::kLines:
ret += " line:";
ret += FloatToString(settings.line->value);
break;
case TextUnitType::kPixels:
LOG(WARNING) << "WebVTT doesn't support pixel line settings";
break;
}
}
if (settings.position) {
if (settings.position->type == TextUnitType::kPercent) {
ret += " position:";
ret += FloatToString(settings.position->value);
ret += "%";
} else {
LOG(WARNING) << "WebVTT only supports percent position settings";
}
}
if (settings.width) {
if (settings.width->type == TextUnitType::kPercent) {
ret += " size:";
ret += FloatToString(settings.width->value);
ret += "%";
} else {
LOG(WARNING) << "WebVTT only supports percent width settings";
}
}
if (settings.height) {
LOG(WARNING) << "WebVTT doesn't support cue heights";
}
if (settings.writing_direction != WritingDirection::kHorizontal) {
ret += " direction:";
if (settings.writing_direction == WritingDirection::kVerticalGrowingLeft) {
ret += "rl";
} else {
ret += "lr";
}
}
switch (settings.text_alignment) {
case TextAlignment::kStart:
ret += " align:start";
break;
case TextAlignment::kEnd:
ret += " align:end";
break;
case TextAlignment::kLeft:
ret += " align:left";
break;
case TextAlignment::kRight:
ret += " align:right";
break;
case TextAlignment::kCenter:
ret += " align:center";
break;
}
if (!ret.empty()) {
DCHECK_EQ(ret[0], ' ');
ret.erase(0, 1);
}
return ret;
}
std::string WebVttFragmentToString(const TextFragment& fragment) {
std::list<StyleTagKind> tags;
return WriteFragment(fragment, &tags);
}
std::string WebVttGetPreamble(const TextStreamInfo& stream_info) {
std::string ret;
for (const auto& pair : stream_info.regions()) {
if (!ret.empty()) {
ret += "\n\n";
}
if (pair.second.width.type != TextUnitType::kPercent ||
pair.second.height.type != TextUnitType::kLines ||
pair.second.window_anchor_x.type != TextUnitType::kPercent ||
pair.second.window_anchor_y.type != TextUnitType::kPercent ||
pair.second.region_anchor_x.type != TextUnitType::kPercent ||
pair.second.region_anchor_y.type != TextUnitType::kPercent) {
LOG(WARNING) << "Unsupported unit type in WebVTT region";
continue;
}
absl::StrAppendFormat(
&ret,
"REGION\n"
"id:%s\n"
"width:%f%%\n"
"lines:%d\n"
"viewportanchor:%f%%,%f%%\n"
"regionanchor:%f%%,%f%%",
pair.first.c_str(), pair.second.width.value,
static_cast<int>(pair.second.height.value),
pair.second.window_anchor_x.value, pair.second.window_anchor_y.value,
pair.second.region_anchor_x.value, pair.second.region_anchor_y.value);
if (pair.second.scroll) {
ret += "\nscroll:up";
}
}
if (!stream_info.css_styles().empty()) {
if (!ret.empty()) {
ret += "\n\n";
}
ret += "STYLE\n" + stream_info.css_styles();
}
return ret;
}
} // namespace media
} // namespace shaka