-
Notifications
You must be signed in to change notification settings - Fork 20
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
feat: RAS format 1.2, new DTD with annotations support
* updated attribute list for <s> to support annotations * feat: RAS format 1.2 * fix(docs): update version in the comment too * ci: verbose output when utf8 on win test fails * fix(test): cs-ref.readalong also needs the current dtd version * fix: more places where the current dtd 1.2 version is needed (#238) --------- Co-authored-by: David Huggins-Daines <[email protected]> Co-authored-by: Eric Joanis <[email protected]>
- Loading branch information
1 parent
aed50e2
commit d4b8a69
Showing
10 changed files
with
193 additions
and
10 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -1,3 +1,3 @@ | ||
# Package release version string.
VERSION = "1.1.0" | ||
|
||
# Version of the read-along file format. This hunk shows the old value ("1.1")
# followed by its replacement ("1.2").
# NOTE(review): presumably this must match the "VERSION" comment of the current
# DTD and the version attribute written to <read-along> documents; confirm.
READALONG_FILE_FORMAT_VERSION = "1.1" | ||
READALONG_FILE_FORMAT_VERSION = "1.2" |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,106 @@ | ||
<!-- VERSION: 1.2 --> | ||
<!--
  Document type definition for read-along documents, format version 1.2.

  Every attribute below is declared as CDATA, so a validating parser checks
  only that attributes are known and that #REQUIRED ones are present. It does
  not check value formats, and it does not enforce uniqueness of "id" values.

  Compared with the other sentence-level elements, <s> additionally accepts
  the "annotation-id" and "sentence-id" attributes.
-->
<!-- Root element: any number of the listed elements, in any order. -->
<!ELEMENT read-along (meta|text|body|div|span|anchor|silence|graphic|p|s|w)*> | ||
<!ATTLIST read-along | ||
use-assets-folder CDATA #IMPLIED | ||
href CDATA #IMPLIED | ||
audio CDATA #IMPLIED | ||
xml:lang CDATA #IMPLIED | ||
language CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
version CDATA #IMPLIED> | ||
|
||
<!-- Text container: element-only content (no character data allowed). -->
<!ELEMENT text (body|div|span|anchor|silence|graphic|p|s|w)*> | ||
<!ATTLIST text | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
fallback-langs CDATA #IMPLIED | ||
id CDATA #IMPLIED> | ||
|
||
<!-- Body container: element-only content (no character data allowed). -->
<!ELEMENT body (div|span|anchor|silence|graphic|p|s|w)*> | ||
<!ATTLIST body | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED> | ||
|
||
<!-- Empty marker element; "time" is mandatory. -->
<!ELEMENT anchor EMPTY> | ||
<!ATTLIST anchor time CDATA #REQUIRED> | ||
|
||
<!-- Empty marker element; "dur" is mandatory. -->
<!ELEMENT silence EMPTY> | ||
<!ATTLIST silence dur CDATA #REQUIRED> | ||
|
||
<!-- Empty element referencing an image; "url" is mandatory. -->
<!ELEMENT graphic EMPTY> | ||
<!ATTLIST graphic | ||
url CDATA #REQUIRED | ||
id CDATA #IMPLIED> | ||
|
||
<!-- Mixed content: character data interleaved with any block or inline element, including nested <div>. -->
<!ELEMENT div (#PCDATA|div|span|anchor|silence|graphic|p|s|w)*> | ||
<!ATTLIST div | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
type CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED> | ||
|
||
<!-- Same content model and attribute list as <div>. -->
<!ELEMENT span (#PCDATA|div|span|anchor|silence|graphic|p|s|w)*> | ||
<!ATTLIST span | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
type CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED> | ||
|
||
<!-- Paragraph: mixed content; may not directly contain <div>, <graphic> or another <p>. -->
<!ELEMENT p (#PCDATA|span|anchor|silence|s|w)*> | ||
<!ATTLIST p | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED> | ||
|
||
<!--
  Sentence: mixed content of text, <span>, <anchor>, <silence> and <w>.
  NOTE(review): "annotation-id" and "sentence-id" appear to mark an <s> as an
  annotation (e.g. a translation) of another sentence, with "sentence-id"
  holding the id of the annotated <s>. Both are plain CDATA, so the DTD does
  not verify that the referenced ids exist; confirm against the consumers.
-->
<!ELEMENT s (#PCDATA|span|anchor|silence|w)*> | ||
<!ATTLIST s | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED | ||
annotation-id CDATA #IMPLIED | ||
sentence-id CDATA #IMPLIED> | ||
|
||
<!-- Word: mixed content of text, <span> and <syl>. -->
<!ELEMENT w (#PCDATA|span|syl)*> | ||
<!ATTLIST w | ||
xml:lang CDATA #IMPLIED | ||
effective-g2p-lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
ARPABET CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED> | ||
|
||
<!-- Syllable inside a word: mixed content of text and <span>. -->
<!ELEMENT syl (#PCDATA|span)*> | ||
<!ATTLIST syl | ||
xml:lang CDATA #IMPLIED | ||
lang CDATA #IMPLIED | ||
id CDATA #IMPLIED | ||
class CDATA #IMPLIED | ||
do-not-align CDATA #IMPLIED | ||
ARPABET CDATA #IMPLIED | ||
time CDATA #IMPLIED | ||
dur CDATA #IMPLIED> | ||
|
||
<!-- Empty metadata element: a name/content pair, both mandatory. -->
<!ELEMENT meta EMPTY> | ||
<!ATTLIST meta name CDATA #REQUIRED | ||
content CDATA #REQUIRED | ||
id CDATA #IMPLIED> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,34 @@ | ||
<?xml version='1.0' encoding='utf-8'?> | ||
<!--
  Sample read-along document (format version 1.2) demonstrating sentence
  annotations. Each aligned sentence is followed by <s do-not-align="true">
  elements whose "annotation-id" is one of the ids listed in the
  "annotations-ids" meta and whose "sentence-id" is the id of the aligned <s>
  they annotate. Every element id in this document is unique, so each
  annotation can be addressed individually.
  NOTE(review): the annotations labelled "Algonquin" carry xml:lang="otw";
  ISO 639-3 lists Algonquin as "alq". Confirm the intended language code.
-->
<read-along version="1.2"> | ||
<meta name="generator" content="human made" id="meta0" /> | ||
<meta name="annotations-ids" content="translation1, translation2" id="meta1" /> | ||
<meta name="annotations-labels" content="Algonquin, English" id="meta2" /> | ||
<meta name="annotations-labels-eng" content="Algonquin, English" id="meta3" /> | ||
<meta name="annotations-labels-fra" content="algonquin, anglais" id="meta4" /> | ||
<text xml:lang="fra" id="t0"> | ||
<body id="t0b0"> | ||
<div type="page" id="t0b0d0" class="two-column-layout-page"> | ||
<graphic url="avatar.png" id="t0b0d0graphic0" /> | ||
<p id="t0b0d0p0"> | ||
<s id="t0b0d0p0s0"><w id="t0b0d0p0s0w0" time="0.455" dur="1.165">Bonjour</w>.</s> | ||
<s do-not-align="true" xml:lang="otw" id="t0b0d0p0s0an01" annotation-id="translation1" sentence-id="t0b0d0p0s0"> | ||
Kwei.</s> | ||
<s do-not-align="true" xml:lang="eng" id="t0b0d0p0s0an02" annotation-id="translation2" | ||
sentence-id="t0b0d0p0s0"> | ||
Hello.</s> | ||
<s id="t0b0d0p0s1"><w id="t0b0d0p0s1w0" time="1.620" dur="0.070">Je</w> <w | ||
id="t0b0d0p0s1w1" time="1.690" dur="0.070">m</w>'<w id="t0b0d0p0s1w2" time="1.760" | ||
dur="0.240">appelle</w> <w id="t0b0d0p0s1w3" time="2.000" dur="1.705">Éric</w> <w | ||
id="t0b0d0p0s1w4" time="3.705" dur="1.905">Joanis</w>.</s> | ||
<s do-not-align="true" xml:lang="otw" id="t0b0d0p0s1an01" annotation-id="translation1" | ||
sentence-id="t0b0d0p0s1">Éric | ||
Joanis nindijinikàz.</s> | ||
<s do-not-align="true" xml:lang="eng" id="t0b0d0p0s1an02" annotation-id="translation2" | ||
sentence-id="t0b0d0p0s1">My | ||
name is Éric Joanis.</s> | ||
</p> | ||
</div> | ||
|
||
</body> | ||
</text> | ||
</read-along> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,34 @@ | ||
<?xml version='1.0' encoding='utf-8'?> | ||
<!--
  Sample read-along document (format version 1.2) demonstrating sentence
  annotations. Each aligned sentence is followed by <s do-not-align="true">
  elements whose "annotation-id" is one of the ids listed in the
  "annotations-ids" meta and whose "sentence-id" is the id of the aligned <s>
  they annotate. Every element id in this document is unique, so each
  annotation can be addressed individually.
  NOTE(review): the annotations labelled "Algonquin" carry xml:lang="otw";
  ISO 639-3 lists Algonquin as "alq". Confirm the intended language code.
-->
<read-along version="1.2"> | ||
<meta name="generator" content="human made" id="meta0" /> | ||
<meta name="annotations-ids" content="translation1, translation2" id="meta1" /> | ||
<meta name="annotations-labels" content="Algonquin, English" id="meta2" /> | ||
<meta name="annotations-labels-eng" content="Algonquin, English" id="meta3" /> | ||
<meta name="annotations-labels-fra" content="algonquin, anglais" id="meta4" /> | ||
<text xml:lang="fra" id="t0"> | ||
<body id="t0b0"> | ||
<div type="page" id="t0b0d0" class="two-column-layout-page"> | ||
<graphic url="avatar.png" id="t0b0d0graphic0" /> | ||
<p id="t0b0d0p0"> | ||
<s id="t0b0d0p0s0"><w id="t0b0d0p0s0w0" time="0.455" dur="1.165">Bonjour</w>.</s> | ||
<s do-not-align="true" xml:lang="otw" id="t0b0d0p0s0an01" annotation-id="translation1" sentence-id="t0b0d0p0s0"> | ||
Kwei.</s> | ||
<s do-not-align="true" xml:lang="eng" id="t0b0d0p0s0an02" annotation-id="translation2" | ||
sentence-id="t0b0d0p0s0"> | ||
Hello.</s> | ||
<s id="t0b0d0p0s1"><w id="t0b0d0p0s1w0" time="1.620" dur="0.070">Je</w> <w | ||
id="t0b0d0p0s1w1" time="1.690" dur="0.070">m</w>'<w id="t0b0d0p0s1w2" time="1.760" | ||
dur="0.240">appelle</w> <w id="t0b0d0p0s1w3" time="2.000" dur="1.705">Éric</w> <w | ||
id="t0b0d0p0s1w4" time="3.705" dur="1.905">Joanis</w>.</s> | ||
<s do-not-align="true" xml:lang="otw" id="t0b0d0p0s1an01" annotation-id="translation1" | ||
sentence-id="t0b0d0p0s1">Éric | ||
Joanis nindijinikàz.</s> | ||
<s do-not-align="true" xml:lang="eng" id="t0b0d0p0s1an02" annotation-id="translation2" | ||
sentence-id="t0b0d0p0s1">My | ||
name is Éric Joanis.</s> | ||
</p> | ||
</div> | ||
|
||
</body> | ||
</text> | ||
</read-along> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters