SubtitleEdit/libse/SubtitleFormats/TimelineAscii.cs
2016-02-17 20:55:24 +01:00

206 lines
7.1 KiB
C#

using System;
using System.Collections.Generic;
using System.IO;
using System.Text;
using System.Text.RegularExpressions;
namespace Nikse.SubtitleEdit.Core.SubtitleFormats
{
/// <summary>
/// Timeline Ascii export - THE MOVIE TITRE EDITOR - http://www.pld.ttu.ee/~priidu/timeline/ by priidu@pld.ttu.ee
///
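/// Sample (each text line starts with one language byte, shown here as rendered in Windows-1252: ± = 177, ³ = 179):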
/// 1.
/// 00:00:43.02
/// 00:00:47.03
/// ±NE/SEVÎ
/// ³ÂÍÅ/ÑÅÁß
///
/// 2.
/// 00:01:36.00
/// 00:01:37.00
/// ±Viòð ir klât.
/// ³Îí ïðèøåë.
/// </summary>
public class TimeLineAscii : SubtitleFormat
{
// Matches a whole line that is exactly a time code written as four two-digit groups: "dd:dd:dd.dd".
// Lines that match are split on ':' and '.' and handed to DecodeTimeCodeFramesFourParts.
private static readonly Regex RegexTimeCode = new Regex(@"^\d\d:\d\d:\d\d\.\d\d$", RegexOptions.Compiled);
/// <summary>
/// State of the line parser in LoadSubtitle: which kind of line is expected next.
/// </summary>
private enum ExpectingLine
{
    /// <summary>Initial state, also entered again after a time code fails to decode.</summary>
    Number = 0,

    /// <summary>A number line was read; the start time code is expected.</summary>
    TimeStart = 1,

    /// <summary>The start time was read; the end time code is expected.</summary>
    TimeEnd = 2,

    /// <summary>Both time codes were read; following lines are subtitle text.</summary>
    Text = 3
}
/// <summary>
/// File extension of this format, including the leading dot.
/// </summary>
public override string Extension
{
    get
    {
        return ".asc";
    }
}
/// <summary>
/// Name of this subtitle format.
/// </summary>
public override string Name
{
    get
    {
        return "Timeline ascii";
    }
}
/// <summary>
/// Always true: this format reports itself as time based.
/// </summary>
public override bool IsTimeBased
{
    get
    {
        return true;
    }
}
/// <summary>
/// Decides whether the given file is in this format by trying to load it.
/// </summary>
/// <param name="lines">Decoded text lines; passed on to LoadSubtitle, which reads the file bytes itself.</param>
/// <param name="fileName">Path of the file; must end with the format extension and exist on disk.</param>
/// <returns>
/// True when loading yields more paragraphs than errors; false when the name is null,
/// has another extension, or does not point to an existing file.
/// </returns>
public override bool IsMine(List<string> lines, string fileName)
{
    if (fileName == null || !fileName.EndsWith(Extension, StringComparison.OrdinalIgnoreCase))
        return false;

    // LoadSubtitle reads the raw bytes from disk, so a missing file would throw from
    // File.ReadAllBytes. A file that is not there cannot be in this format.
    if (!File.Exists(fileName))
        return false;

    var subtitle = new Subtitle();
    LoadSubtitle(subtitle, lines, fileName);
    return subtitle.Paragraphs.Count > _errorCount;
}
/// <summary>
/// Produces no output for this format: the result is always an empty string,
/// whatever subtitle and title are passed in.
/// </summary>
public override string ToText(Subtitle subtitle, string title)
{
    return "";
}
/// <summary>
/// Reads the file at <paramref name="fileName"/> as raw bytes and fills
/// <paramref name="subtitle"/> with the paragraphs found in it.
/// The <paramref name="lines"/> argument is not used; every text line is decoded from its
/// bytes with the encoding selected by the line's first byte.
/// Resets the error count, then increments it for time codes that fail to decode and for
/// text lines whose first byte differs from the one seen earlier at the same line position.
/// </summary>
public override void LoadSubtitle(Subtitle subtitle, List<string> lines, string fileName)
{
    Paragraph current = null;
    var state = ExpectingLine.Number;
    _errorCount = 0;
    byte firstLineCode = 0;
    byte secondLineCode = 0;
    subtitle.Paragraphs.Clear();

    foreach (byte[] rawLine in SplitBytesToLines(File.ReadAllBytes(fileName)))
    {
        string asciiLine = Encoding.ASCII.GetString(rawLine);

        // "<integer>." starts a new paragraph regardless of the current state.
        if (asciiLine.EndsWith('.') && Utilities.IsInteger(asciiLine.TrimEnd('.')))
        {
            if (current != null && !string.IsNullOrEmpty(current.Text))
                subtitle.Paragraphs.Add(current);
            current = new Paragraph();
            state = ExpectingLine.TimeStart;
            continue;
        }

        // Everything below needs a paragraph to work on.
        if (current == null)
            continue;

        switch (state)
        {
            case ExpectingLine.TimeStart:
            case ExpectingLine.TimeEnd:
            {
                if (!RegexTimeCode.IsMatch(asciiLine))
                    break;

                string[] parts = asciiLine.Split(new[] { ':', '.' }, StringSplitOptions.RemoveEmptyEntries);
                if (parts.Length != 4)
                    break;

                try
                {
                    var timeCode = DecodeTimeCodeFramesFourParts(parts);
                    if (state == ExpectingLine.TimeStart)
                    {
                        current.StartTime = timeCode;
                        state = ExpectingLine.TimeEnd;
                    }
                    else
                    {
                        current.EndTime = timeCode;
                        state = ExpectingLine.Text;
                    }
                }
                catch
                {
                    // A time code that cannot be decoded counts as an error and
                    // sends the parser back to waiting for the next number line.
                    _errorCount++;
                    state = ExpectingLine.Number;
                }
                break;
            }

            case ExpectingLine.Text:
            {
                if (rawLine.Length <= 1)
                    break;

                // The first byte selects the encoding; the rest is the text.
                byte languageCode = rawLine[0];
                Encoding textEncoding = GetEncodingFromLanguage(languageCode);
                string decoded = textEncoding.GetString(rawLine, 1, rawLine.Length - 1).Trim();

                // A leading '#' marks italic text.
                if (decoded.StartsWith('#'))
                    decoded = "<i>" + decoded.Remove(0, 1) + "</i>";

                current.Text = (current.Text + Environment.NewLine + decoded).Trim();

                // Give up on implausibly long paragraphs and flag the load as failed.
                if (current.Text.Length > 2000)
                {
                    _errorCount += 100;
                    return;
                }

                // Remember the language byte seen for first and for following lines;
                // a later line with a different byte at the same position is an error.
                bool hasSeveralLines = current.Text.Contains(Environment.NewLine);
                if (hasSeveralLines)
                {
                    if (secondLineCode == 0)
                        secondLineCode = languageCode;
                    if (secondLineCode != languageCode)
                        _errorCount++;
                }
                else
                {
                    if (firstLineCode == 0)
                        firstLineCode = languageCode;
                    if (firstLineCode != languageCode)
                        _errorCount++;
                }
                break;
            }
        }
    }

    if (current != null && !string.IsNullOrEmpty(current.Text))
        subtitle.Paragraphs.Add(current);
    subtitle.Renumber();
}
/// <summary>
/// Splits a raw byte buffer into lines without decoding it.
/// CR LF, a lone CR and a lone LF each end a line. A final line that has no
/// terminator is returned as well instead of being dropped.
/// </summary>
/// <param name="bytes">Raw file content; null is treated like an empty buffer.</param>
/// <returns>
/// One byte array per line with the terminator removed. Blank lines are kept as empty arrays.
/// </returns>
private static IEnumerable<byte[]> SplitBytesToLines(byte[] bytes)
{
    const byte carriageReturn = 13;
    const byte lineFeed = 10;

    var lines = new List<byte[]>();
    if (bytes == null)
        return lines;

    int start = 0;
    int index = 0;
    while (index < bytes.Length)
    {
        byte current = bytes[index];
        if (current != carriageReturn && current != lineFeed)
        {
            index++;
            continue;
        }

        lines.Add(CopyRange(bytes, start, index - start));

        // Only swallow the byte after CR when it really is LF, so that a CR-only
        // file does not lose the first byte of the next line.
        if (current == carriageReturn && index + 1 < bytes.Length && bytes[index + 1] == lineFeed)
            index++;
        index++;
        start = index;
    }

    // Data after the last terminator is the final, unterminated line.
    if (start < bytes.Length)
        lines.Add(CopyRange(bytes, start, bytes.Length - start));

    return lines;
}

/// <summary>Copies <paramref name="length"/> bytes of <paramref name="source"/>, starting at <paramref name="offset"/>, into a new array.</summary>
private static byte[] CopyRange(byte[] source, int offset, int length)
{
    var copy = new byte[length];
    Array.Copy(source, offset, copy, 0, length);
    return copy;
}
/// <summary>
/// Maps the language byte found at the start of a text line to the encoding used for that line.
/// </summary>
/// <param name="language">Language byte: 179 for Russian, 177 for Baltic.</param>
/// <returns>Code page 1251 for 179, 1257 for 177, and 1252 for any other value.</returns>
private Encoding GetEncodingFromLanguage(byte language)
{
    int codePage;
    switch (language)
    {
        case 179: // Russian
            codePage = 1251;
            break;
        case 177: // Baltic
            codePage = 1257;
            break;
        default:
            codePage = 1252;
            break;
    }
    return Encoding.GetEncoding(codePage);
}
}
}