1 | <?xml version="1.0" encoding="UTF-8"?>
|
---|
2 | <!--<xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" xmlns:java="http://xml.apache.org/xslt/java" xmlns:ss="urn:schemas-microsoft-com:office:spreadsheet">-->
|
---|
3 | <xsl:stylesheet version="1.0" xmlns:xsl="http://www.w3.org/1999/XSL/Transform" xmlns:java="http://xml.apache.org/xslt/java">
|
---|
4 | <!--On Translation Memory eXchange open-XML: http://www.opentag.com/tmx.htm and http://www.gala-global.org/oscarStandards/tmx/tmx14b.html
|
---|
5 | And for character entities: http://www.w3.org/MarkUp/html3/latin1.html
|
---|
6 | More information: http://xml.coverpages.org/tmxSpec971212.html#O-TMF-->
|
---|
7 |
|
---|
8 | <!-- HOW AND WHEN TO USE THIS FILE
|
---|
9 | A Translation Memory eXchange (TMX) file is an openXML file that contains translated strings that can serve as
|
---|
10 | a reference library for future translation work.
|
---|
11 |
|
---|
When users want to take all the up-to-date translated strings in Greenstone and use them in the Google Translator Toolkit
(GTT) as the basis for continuing their translation work on the remaining strings (yet to be translated), this XSLT file
can be used to generate a TMX from the already-translated strings. The user can then upload this into the GTT.
|
---|
15 | Further translation work that the translator does in the GTT will be added to its growing internal TMX file which
|
---|
16 | appears to be inaccessible.
|
---|
17 |
|
---|
18 | The process of generating a TMX file of Greenstone's up to date strings for a language is as follows:
|
---|
19 |
|
---|
20 | 1. Generate an xml file containing all the up to date chunks (those strings that don't require translation work).
|
---|
21 | GS2/bin/java>perl -S gti.pl get-uptodate-chunks mi coredm > ../../macros/maori/uptodatechunks_core.xml
|
---|
22 |
|
---|
23 | 2. Generate a TMX file from that XML file as follows:
|
---|
24 | GS2/bin/java>java -cp /research/ak19/gs2-svn/bin/java/ApplyXSLT.jar org.nzdl.gsdl.ApplyXSLT -x ../../macros/maori/uptodatechunks_core.xml -t ../script/gti-generate-tmx-xml.xsl -l mi > ../../maori/uptodatecore-mi.tmx
|
---|
25 |
|
---|
26 | GS2/bin/java>less ../../maori/uptodatecore-mi.tmx
|
---|
27 |
|
---|
28 | 3. Send this to the user and they can upload it into GTT.
|
---|
29 |
|
---|
30 |
|
---|
31 | (The DOCTYPE has only been commented out below in order to let a further XSLT process the output of this file into a spreadsheet .txt file.
|
---|
32 | Since a third XSLT file exists which operates on another XML file to obtain the spreadsheet .txt file, the DOCTYPE can be reinstated if required.)
|
---|
33 | -->
|
---|
34 |
|
---|
35 |
|
---|
<!-- Serialise the result tree as UTF-8 encoded XML. -->
<xsl:output method="xml" encoding="UTF-8"/>

<!-- sourcelang: language code of the source strings. It is written to the TMX header's
     srclang attribute and to xml:lang on every source <tuv>.
     Defaults to 'en' so that these attributes are not left empty when the caller omits
     the parameter; a value supplied by the caller always overrides the default.
     NOTE(review): 'en' is assumed from the hard-coded adminlang="en" in the header; confirm. -->
<xsl:param name="sourcelang" select="'en'"/>

<!-- targetlang: language code of the translated strings. It is written to xml:lang on
     every target <tuv>. No default is provided, so the caller must supply it. -->
<xsl:param name="targetlang"/>
|
---|
39 |
|
---|
<!-- Entry-point template for the GTIResponse root element.
     Emits a TMX 1.4 document: a <header> carrying tool metadata and the source language,
     followed by a <body> that is filled, in this order, by the templates for
     TranslationFile, Chunks, UptodateChunks, ChunksRequiringUpdating and
     ChunksRequiringTranslation. -->
<xsl:template match="GTIResponse">
  <!-- if applying this XSLT file results in an error mentioning ".../tmx14.dtd (No such file or directory)"
       then comment out the DOCTYPE declaration below -->
  <!--<xsl:text disable-output-escaping="yes">&#10;&lt;!DOCTYPE tmx PUBLIC "-//LISA OSCAR:1998//DTD for Translation Memory eXchange//EN" "tmx14.dtd" &gt;&#10;</xsl:text>-->

  <!-- Line breaks are written as &#10; character references. The content of xsl:text is
       copied to the output verbatim, so a literal space there would emit a space rather
       than the intended newline. -->
  <!-- The default namespace declared on <tmx> only applies to literal result elements
       written inside this template. -->
  <tmx version="1.4" xmlns="http://www.lisa.org/tmx14"><xsl:text>&#10;</xsl:text> <!--newline-->
    <header
        creationtool="Greenstone Translator Interface"
        creationtoolversion="Greenstone2.85"
        datatype="PlainText"
        segtype="sentence"
        adminlang="en"
        srclang="{$sourcelang}"
        o-tmf="GreenstoneTranslationFile">
    </header><xsl:text>&#10;</xsl:text> <!--newline-->
    <body>
      <xsl:text>&#10;&#10;</xsl:text> <!--2 newlines-->

      <!-- NOTE(review): the templates applied below write <prop> and <note> elements
           directly into <body>; the TMX 1.4b DTD appears to allow only <tu> there.
           Confirm whether consumers tolerate this before reinstating the DOCTYPE. -->
      <xsl:apply-templates select="TranslationFile"/>

      <xsl:apply-templates select="Chunks"/>

      <xsl:apply-templates select="UptodateChunks"/>

      <!-- control the order: first all the strings needing to be updated, then all those that need translating-->
      <xsl:apply-templates select="ChunksRequiringUpdating"/>
      <xsl:apply-templates select="ChunksRequiringTranslation"/>
    </body>
  </tmx>
</xsl:template>
|
---|
70 |
|
---|
71 |
|
---|
<!-- The input file contains information as follows:
       <TranslationFile key="coredm" target_file_path="macros/mongolian.dm" num_chunks_translated="353" num_chunks_requiring_translation="32" num_chunks_requiring_updating="18"/>
     We want this useful information to be present in the output TMX file too. Each attribute of a
     TranslationFile element becomes a separate <prop> element: the attribute name becomes the value
     of the prop's type attribute and the attribute value becomes the prop's content.
     Each <prop> is followed by a newline. -->
<xsl:template match="TranslationFile">
  <xsl:for-each select="@*">
    <!-- The TMX namespace is declared explicitly: without it this literal result element
         is in no namespace and is serialised with xmlns="" inside the namespaced <tmx>. -->
    <prop xmlns="http://www.lisa.org/tmx14" type="{name()}"><xsl:value-of select="."/></prop>
    <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
    <xsl:text>&#10;</xsl:text><!--newline-->
  </xsl:for-each>
</xsl:template>
|
---|
82 |
|
---|
<!-- Writes an "Uptodate chunks" heading note, then every child Chunk sorted by its key attribute. -->
<xsl:template match="UptodateChunks">
  <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <!-- xml:lang is placed on <note> so that it reaches the output (on xsl:text it has no
       effect). The TMX namespace is declared explicitly so that the note is not
       serialised with xmlns="" inside the namespaced <tmx>. -->
  <note xmlns="http://www.lisa.org/tmx14" xml:lang="en"><xsl:text>Uptodate chunks</xsl:text></note>
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <xsl:apply-templates select="Chunk">
    <xsl:sort select="@key"/>
  </xsl:apply-templates>
</xsl:template>
|
---|
90 |
|
---|
<!-- Writes a "Chunks requiring translating" heading note, then every child Chunk sorted by its key attribute. -->
<xsl:template match="ChunksRequiringTranslation">
  <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <!-- xml:lang is placed on <note> so that it reaches the output (on xsl:text it has no
       effect). The TMX namespace is declared explicitly so that the note is not
       serialised with xmlns="" inside the namespaced <tmx>. -->
  <note xmlns="http://www.lisa.org/tmx14" xml:lang="en"><xsl:text>Chunks requiring translating</xsl:text></note>
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <xsl:apply-templates select="Chunk">
    <xsl:sort select="@key"/>
  </xsl:apply-templates>
</xsl:template>
|
---|
98 |
|
---|
<!-- Writes a "Chunks requiring updating" heading note, then every child Chunk sorted by its key attribute. -->
<xsl:template match="ChunksRequiringUpdating">
  <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <!-- xml:lang is placed on <note> so that it reaches the output (on xsl:text it has no
       effect). The TMX namespace is declared explicitly so that the note is not
       serialised with xmlns="" inside the namespaced <tmx>. -->
  <note xmlns="http://www.lisa.org/tmx14" xml:lang="en"><xsl:text>Chunks requiring updating</xsl:text></note>
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <xsl:apply-templates select="Chunk">
    <xsl:sort select="@key"/>
  </xsl:apply-templates>
</xsl:template>
|
---|
106 |
|
---|
<!-- Writes an "All chunks" heading note, then every child Chunk sorted by its key attribute. -->
<xsl:template match="Chunks">
  <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <!-- xml:lang is placed on <note> so that it reaches the output (on xsl:text it has no
       effect). The TMX namespace is declared explicitly so that the note is not
       serialised with xmlns="" inside the namespaced <tmx>. -->
  <note xmlns="http://www.lisa.org/tmx14" xml:lang="en"><xsl:text>All chunks</xsl:text></note>
  <xsl:text>&#10;</xsl:text> <!--newline-->
  <xsl:apply-templates select="Chunk">
    <xsl:sort select="@key"/>
  </xsl:apply-templates>
</xsl:template>
|
---|
114 |
|
---|
115 |
|
---|
<!-- Converts one Chunk into a TMX translation unit (<tu>) holding two variants:
       * a source <tuv> (xml:lang = $sourcelang) whose <seg> comes from SourceFileText
       * a target <tuv> (xml:lang = $targetlang) whose <seg> comes from TargetFileText
     Both variants carry the chunk's key attribute in a <prop> (type "source" / "target").
     The TMX namespace is declared on <tu> so that the unit and its descendants are not
     serialised with xmlns="" inside the namespaced <tmx>. -->
<xsl:template match="Chunk">
  <!-- &#10; emits a real line break; a literal space in xsl:text would emit a space. -->
  <tu xmlns="http://www.lisa.org/tmx14"><xsl:text>&#10;</xsl:text> <!--newline-->
    <tuv xml:lang="{$sourcelang}">
      <prop type="source"><xsl:value-of select="@key"/></prop><xsl:text>&#10;</xsl:text> <!--newline-->
      <seg>
        <xsl:apply-templates select="SourceFileText" mode="escaped-segment"/>
      </seg><xsl:text>&#10;</xsl:text> <!--newline-->
    </tuv><xsl:text>&#10;</xsl:text> <!--newline-->
    <tuv xml:lang="{$targetlang}">
      <prop type="target"><xsl:value-of select="@key"/></prop><xsl:text>&#10;</xsl:text> <!--newline-->
      <seg>
        <xsl:apply-templates select="TargetFileText" mode="escaped-segment"/>
      </seg><xsl:text>&#10;</xsl:text> <!--newline-->
    </tuv><xsl:text>&#10;</xsl:text> <!--newline-->
  </tu><xsl:text>&#10;</xsl:text> <!--newline-->
</xsl:template>

<!-- Helper for the Chunk template: writes the text of one SourceFileText or TargetFileText
     element with its markup characters turned into entity references.
     The escaped string is written with disable-output-escaping="yes" so that the
     references inserted here reach the output file unchanged.
     Ampersands are escaped FIRST. Escaping them last would also rewrite the ampersands of
     the references inserted for newlines and angle brackets, producing double-escaped
     text such as "&amp;amp;lt;" in the output.
     Inside the select attributes the search and replacement strings are themselves
     XML-escaped, because a raw "<" or "&" is not allowed in an attribute value. -->
<xsl:template match="SourceFileText | TargetFileText" mode="escaped-segment">
  <!-- removes collection-specific attribute-like prefix in paperspast.dm -->
  <xsl:variable name="chunkText" select='java:org.nzdl.gsdl.ApplyXSLT.getChunkString(.)'/>
  <!-- ampersands -->
  <xsl:variable name="ampEscaped" select='java:org.nzdl.gsdl.ApplyXSLT.replaceAll($chunkText, "&amp;", "&amp;amp;")'/>
  <!-- each newline becomes the six characters: ampersand, "#10;", space -->
  <xsl:variable name="newlineEscaped" select='java:org.nzdl.gsdl.ApplyXSLT.replaceAll($ampEscaped, "\n", "&amp;#10; ")'/>
  <!-- angle brackets -->
  <xsl:variable name="ltEscaped" select='java:org.nzdl.gsdl.ApplyXSLT.replaceAll($newlineEscaped, "&lt;", "&amp;lt;")'/>
  <xsl:variable name="escapedText" select='java:org.nzdl.gsdl.ApplyXSLT.replaceAll($ltEscaped, "&gt;", "&amp;gt;")'/>
  <xsl:value-of select="$escapedText" disable-output-escaping="yes"/>
</xsl:template>
|
---|
146 |
|
---|
147 | <!--<xsl:template match="*">Do nothing for all other templates matched</xsl:template>-->
|
---|
148 |
|
---|
149 | </xsl:stylesheet>
|
---|