-
Notifications
You must be signed in to change notification settings - Fork 2
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Precompiled ARPA+ G2p and code fixes
- Loading branch information
Showing
23 changed files
with
3,235 additions
and
123 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,51 @@ | ||
using System; | ||
using System.Collections.Generic; | ||
using System.Linq; | ||
using Microsoft.ML.OnnxRuntime; | ||
using OpenUtau.Api; | ||
using ArpaPlusPhonemizer; | ||
|
||
namespace OpenUtau.Core.G2p {
    /// <summary>
    /// G2p pack for the ARPA+ phoneme set.
    /// The dictionary and the inference session are loaded once, on first
    /// construction, from the <c>g2p_arpabet_plus</c> resource and are then
    /// shared by every instance of this class.
    /// </summary>
    public class ArpabetPlusG2p : G2pPack {
        // Number of empty placeholder entries at the start of the grapheme
        // table. They are skipped when building the grapheme lookup, but
        // still occupy indexes 0..3 so real graphemes start at index 4.
        private const int LeadingPlaceholders = 4;

        private static readonly string[] graphemes = new string[] {
            "", "", "", "", "\'", "-", "a", "b", "c", "d", "e",
            "f", "g", "h", "i", "j", "k", "l", "m", "n", "o", "p",
            "q", "r", "s", "t", "u", "v", "w", "x", "y", "z",
        };

        private static readonly string[] phonemes = new string[] {
            "", "", "", "", "aa", "ae", "ah", "ao", "aw", "ax", "ay", "b", "ch",
            "d", "dh", "dr", "dx", "eh", "er", "ey", "f", "g", "hh", "ih", "iy", "jh",
            "k", "l", "m", "n", "ng", "ow", "oy", "p", "q", "r", "s", "sh", "t",
            "th", "tr", "uh", "uw", "v", "w", "y", "z", "zh",
        };

        // Guards the one-time initialisation of the static state below.
        // readonly so the lock target can never be swapped out.
        private static readonly object lockObj = new object();
        // Also serves as the "already initialised" flag: non-null means
        // dict and session have been loaded successfully.
        private static Dictionary<string, int> graphemeIndexes;
        private static IG2p dict;
        private static InferenceSession session;
        private static readonly Dictionary<string, string[]> predCache = new Dictionary<string, string[]>();

        /// <summary>
        /// Creates a G2p instance backed by the shared, lazily loaded pack.
        /// </summary>
        /// <remarks>
        /// If loading the pack throws, no static state is published, so the
        /// next construction attempts the load again instead of producing an
        /// instance with a null dictionary and session.
        /// </remarks>
        public ArpabetPlusG2p() {
            lock (lockObj) {
                if (graphemeIndexes == null) {
                    // Map each real grapheme to its position in the table.
                    // Add throws on a duplicate key, same as ToDictionary.
                    var indexes = new Dictionary<string, int>();
                    for (int i = LeadingPlaceholders; i < graphemes.Length; i++) {
                        indexes.Add(graphemes[i], i);
                    }

                    // NOTE(review): the two callbacks look like the grapheme
                    // and phoneme normalisers expected by LoadPack - confirm
                    // against G2pPack.
                    var tuple = LoadPack(
                        ArpaPlusPhonemizer.Resources.g2p_arpabet_plus,
                        s => s.ToLowerInvariant(),
                        s => RemoveTailDigits(s.ToLowerInvariant()));
                    dict = tuple.Item1;
                    session = tuple.Item2;

                    // Publish last: this field is the initialisation flag,
                    // so it must only become non-null once LoadPack succeeded.
                    graphemeIndexes = indexes;
                }
            }
            GraphemeIndexes = graphemeIndexes;
            Phonemes = phonemes;
            Dict = dict;
            Session = session;
            PredCache = predCache;
        }
    }
}
Large diffs are not rendered by default.
Oops, something went wrong.
Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,130 @@ | ||
<?xml version="1.0" encoding="utf-8"?> | ||
<root> | ||
<!-- | ||
Microsoft ResX Schema | ||
Version 2.0 | ||
The primary goal of this format is to allow a simple XML format | ||
that is mostly human readable. The generation and parsing of the | ||
various data types are done through the TypeConverter classes | ||
associated with the data types. | ||
Example: | ||
... ado.net/XML headers & schema ... | ||
<resheader name="resmimetype">text/microsoft-resx</resheader> | ||
<resheader name="version">2.0</resheader> | ||
<resheader name="reader">System.Resources.ResXResourceReader, System.Windows.Forms, ...</resheader> | ||
<resheader name="writer">System.Resources.ResXResourceWriter, System.Windows.Forms, ...</resheader> | ||
<data name="Name1"><value>this is my long string</value><comment>this is a comment</comment></data> | ||
<data name="Color1" type="System.Drawing.Color, System.Drawing">Blue</data> | ||
<data name="Bitmap1" mimetype="application/x-microsoft.net.object.binary.base64"> | ||
<value>[base64 mime encoded serialized .NET Framework object]</value> | ||
</data> | ||
<data name="Icon1" type="System.Drawing.Icon, System.Drawing" mimetype="application/x-microsoft.net.object.bytearray.base64"> | ||
<value>[base64 mime encoded string representing a byte array form of the .NET Framework object]</value> | ||
<comment>This is a comment</comment> | ||
</data> | ||
There are any number of "resheader" rows that contain simple | ||
name/value pairs. | ||
Each data row contains a name, and value. The row also contains a | ||
type or mimetype. Type corresponds to a .NET class that supports | ||
text/value conversion through the TypeConverter architecture. | ||
Classes that don't support this are serialized and stored with the | ||
mimetype set. | ||
The mimetype is used for serialized objects, and tells the | ||
ResXResourceReader how to depersist the object. This is currently not | ||
extensible. For a given mimetype the value must be set accordingly: | ||
Note - application/x-microsoft.net.object.binary.base64 is the format | ||
that the ResXResourceWriter will generate, however the reader can | ||
read any of the formats listed below. | ||
mimetype: application/x-microsoft.net.object.binary.base64 | ||
value : The object must be serialized with | ||
: System.Runtime.Serialization.Formatters.Binary.BinaryFormatter | ||
: and then encoded with base64 encoding. | ||
mimetype: application/x-microsoft.net.object.soap.base64 | ||
value : The object must be serialized with | ||
: System.Runtime.Serialization.Formatters.Soap.SoapFormatter | ||
: and then encoded with base64 encoding. | ||
mimetype: application/x-microsoft.net.object.bytearray.base64 | ||
value : The object must be serialized into a byte array | ||
: using a System.ComponentModel.TypeConverter | ||
: and then encoded with base64 encoding. | ||
--> | ||
<xsd:schema id="root" xmlns="" xmlns:xsd="http://www.w3.org/2001/XMLSchema" xmlns:msdata="urn:schemas-microsoft-com:xml-msdata"> | ||
<xsd:import namespace="http://www.w3.org/XML/1998/namespace" /> | ||
<xsd:element name="root" msdata:IsDataSet="true"> | ||
<xsd:complexType> | ||
<xsd:choice maxOccurs="unbounded"> | ||
<xsd:element name="metadata"> | ||
<xsd:complexType> | ||
<xsd:sequence> | ||
<xsd:element name="value" type="xsd:string" minOccurs="0" /> | ||
</xsd:sequence> | ||
<xsd:attribute name="name" use="required" type="xsd:string" /> | ||
<xsd:attribute name="type" type="xsd:string" /> | ||
<xsd:attribute name="mimetype" type="xsd:string" /> | ||
<xsd:attribute ref="xml:space" /> | ||
</xsd:complexType> | ||
</xsd:element> | ||
<xsd:element name="assembly"> | ||
<xsd:complexType> | ||
<xsd:attribute name="alias" type="xsd:string" /> | ||
<xsd:attribute name="name" type="xsd:string" /> | ||
</xsd:complexType> | ||
</xsd:element> | ||
<xsd:element name="data"> | ||
<xsd:complexType> | ||
<xsd:sequence> | ||
<xsd:element name="value" type="xsd:string" minOccurs="0" msdata:Ordinal="1" /> | ||
<xsd:element name="comment" type="xsd:string" minOccurs="0" msdata:Ordinal="2" /> | ||
</xsd:sequence> | ||
<xsd:attribute name="name" type="xsd:string" use="required" msdata:Ordinal="1" /> | ||
<xsd:attribute name="type" type="xsd:string" msdata:Ordinal="3" /> | ||
<xsd:attribute name="mimetype" type="xsd:string" msdata:Ordinal="4" /> | ||
<xsd:attribute ref="xml:space" /> | ||
</xsd:complexType> | ||
</xsd:element> | ||
<xsd:element name="resheader"> | ||
<xsd:complexType> | ||
<xsd:sequence> | ||
<xsd:element name="value" type="xsd:string" minOccurs="0" msdata:Ordinal="1" /> | ||
</xsd:sequence> | ||
<xsd:attribute name="name" type="xsd:string" use="required" /> | ||
</xsd:complexType> | ||
</xsd:element> | ||
</xsd:choice> | ||
</xsd:complexType> | ||
</xsd:element> | ||
</xsd:schema> | ||
<resheader name="resmimetype"> | ||
<value>text/microsoft-resx</value> | ||
</resheader> | ||
<resheader name="version"> | ||
<value>2.0</value> | ||
</resheader> | ||
<resheader name="reader"> | ||
<value>System.Resources.ResXResourceReader, System.Windows.Forms, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value> | ||
</resheader> | ||
<resheader name="writer"> | ||
<value>System.Resources.ResXResourceWriter, System.Windows.Forms, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value> | ||
</resheader> | ||
<assembly alias="System.Windows.Forms" name="System.Windows.Forms, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089" /> | ||
<data name="arpasing_template" type="System.Resources.ResXFileRef, System.Windows.Forms"> | ||
<value>arpasing.template.yaml;System.Byte[], mscorlib, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value> | ||
</data> | ||
<data name="envccv_template" type="System.Resources.ResXFileRef, System.Windows.Forms"> | ||
<value>envccv.template.yaml;System.Byte[], mscorlib, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value> | ||
</data> | ||
<data name="xsampa_template" type="System.Resources.ResXFileRef, System.Windows.Forms"> | ||
<value>xsampa.template.yaml;System.Byte[], mscorlib, Version=4.0.0.0, Culture=neutral, PublicKeyToken=b77a5c561934e089</value> | ||
</data> | ||
</root> |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,45 @@ | ||
%YAML 1.2 | ||
--- | ||
symbols: | ||
- {symbol: aa, type: vowel} | ||
- {symbol: ae, type: vowel} | ||
- {symbol: ah, type: vowel} | ||
- {symbol: ao, type: vowel} | ||
- {symbol: aw, type: vowel} | ||
- {symbol: ay, type: vowel} | ||
- {symbol: b, type: stop} | ||
- {symbol: ch, type: affricate} | ||
- {symbol: d, type: stop} | ||
- {symbol: dh, type: fricative} | ||
- {symbol: eh, type: vowel} | ||
- {symbol: er, type: vowel} | ||
- {symbol: ey, type: vowel} | ||
- {symbol: f, type: fricative} | ||
- {symbol: g, type: stop} | ||
- {symbol: hh, type: aspirate} | ||
- {symbol: ih, type: vowel} | ||
- {symbol: iy, type: vowel} | ||
- {symbol: jh, type: affricate} | ||
- {symbol: k, type: stop} | ||
- {symbol: l, type: liquid} | ||
- {symbol: m, type: nasal} | ||
- {symbol: n, type: nasal} | ||
- {symbol: ng, type: nasal} | ||
- {symbol: ow, type: vowel} | ||
- {symbol: oy, type: vowel} | ||
- {symbol: p, type: stop} | ||
- {symbol: r, type: liquid} | ||
- {symbol: s, type: fricative} | ||
- {symbol: sh, type: fricative} | ||
- {symbol: t, type: stop} | ||
- {symbol: th, type: fricative} | ||
- {symbol: uh, type: vowel} | ||
- {symbol: uw, type: vowel} | ||
- {symbol: v, type: fricative} | ||
- {symbol: w, type: semivowel} | ||
- {symbol: y, type: semivowel} | ||
- {symbol: z, type: fricative} | ||
- {symbol: zh, type: fricative} | ||
entries: | ||
- grapheme: openutau | ||
phonemes: [ow, p, eh, n, w, uw, t, ah, w, uw] |
Oops, something went wrong.