-
-
Notifications
You must be signed in to change notification settings - Fork 15
/
UsfmFileText.cs
57 lines (53 loc) · 1.87 KB
/
UsfmFileText.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
using System;
using System.IO;
using System.Text;
using SIL.Scripture;
namespace SIL.Machine.Corpora
{
/// <summary>
/// A USFM text whose content is read from a single file on disk.
/// </summary>
/// <remarks>
/// The identifier handed to the base class is resolved while the instance is being constructed,
/// so the file is opened and scanned once by the constructor.
/// </remarks>
public class UsfmFileText : UsfmTextBase
{
    // The "\id" marker followed by the single space that must separate it from the code.
    private const string IdMarkerPrefix = "\\id ";

    private readonly string _fileName;

    /// <summary>
    /// Creates a text backed by the USFM file at <paramref name="fileName"/>.
    /// </summary>
    /// <param name="stylesheet">Stylesheet forwarded unchanged to the base class.</param>
    /// <param name="encoding">
    /// Encoding used to read the file while resolving the identifier; also forwarded to the base class.
    /// </param>
    /// <param name="fileName">Path of the USFM file.</param>
    /// <param name="versification">Versification forwarded unchanged to the base class.</param>
    /// <param name="includeMarkers">Flag forwarded unchanged to the base class.</param>
    /// <param name="includeAllText">Flag forwarded unchanged to the base class.</param>
    /// <exception cref="InvalidOperationException">
    /// The file has no <c>\id</c> line and the file name is too short to derive an identifier from.
    /// </exception>
    public UsfmFileText(
        UsfmStylesheet stylesheet,
        Encoding encoding,
        string fileName,
        ScrVers versification = null,
        bool includeMarkers = false,
        bool includeAllText = false
    )
        : base(GetId(fileName, encoding), stylesheet, encoding, versification, includeMarkers, includeAllText)
    {
        _fileName = fileName;
    }

    /// <summary>
    /// Creates a stream container for the file this text was constructed with.
    /// </summary>
    /// <returns>A new <see cref="FileStreamContainer"/> for the file name.</returns>
    protected override IStreamContainer CreateStreamContainer()
    {
        return new FileStreamContainer(_fileName);
    }

    /// <summary>
    /// Resolves the identifier of a USFM file, preferring the file contents over the file name.
    /// </summary>
    /// <param name="fileName">Path of the USFM file.</param>
    /// <param name="encoding">Encoding used to read the file.</param>
    /// <returns>
    /// The first whitespace-delimited token after the first <c>\id</c> marker in the file; otherwise
    /// an identifier of the form <c>"BOOK - TAG"</c> built from the file name.
    /// </returns>
    /// <exception cref="InvalidOperationException">
    /// The file has no <c>\id</c> line and the file name (without extension) has fewer than six characters.
    /// </exception>
    private static string GetId(string fileName, Encoding encoding)
    {
        using (var reader = new StreamReader(fileName, encoding))
        {
            string line;
            while ((line = reader.ReadLine()) != null)
            {
                line = line.Trim();

                // Ordinal: the marker is a fixed token, so culture rules (which can ignore
                // characters and shift the match) must not take part in the comparison.
                if (!line.StartsWith(IdMarkerPrefix, StringComparison.Ordinal))
                {
                    continue;
                }

                // Skip any extra whitespace between the marker and the code; without this,
                // a line such as "\id  GEN" would produce an empty identifier.
                string id = line.Substring(IdMarkerPrefix.Length).TrimStart();

                // The code ends at the first whitespace character; anything after it is
                // free-form text that is not part of the identifier.
                int end = 0;
                while (end < id.Length && !char.IsWhiteSpace(id[end]))
                {
                    end++;
                }
                return id.Substring(0, end);
            }
        }

        // It's not in the file contents, let's just pull it from the filename.
        // NOTE(review): presumably expects names like "41MATxyz" (two leading characters,
        // a three-character book code, then a tag) - confirm against callers.
        string name = Path.GetFileNameWithoutExtension(fileName);
        if (name.Length < 6)
        {
            throw new InvalidOperationException("The USFM does not contain an 'id' marker.");
        }

        string book = name.Substring(2, 3);
        string tag = name.Substring(5);
        return $"{book} - {tag}";
    }
}
}