Compare commits
39 Commits
Author | SHA1 | Date | |
---|---|---|---|
|
c119aa6b0e | ||
|
9dde5726cd | ||
|
f2e9c85880 | ||
|
056f5a4c6f | ||
|
504e55b2d8 | ||
|
948a232ae2 | ||
|
b2920c7557 | ||
|
cf2d7e636a | ||
|
c5410fc550 | ||
|
4270e22fe0 | ||
|
29fa2dd405 | ||
|
a8abca0841 | ||
|
82f84c5853 | ||
|
67a9e35028 | ||
|
440e30c097 | ||
|
9c65ddadbf | ||
|
f252de4a8d | ||
|
d7d7ea7db1 | ||
|
b65186907f | ||
|
36a06634a3 | ||
|
b0f2d37d6f | ||
|
965f209665 | ||
|
ab8bd3e11c | ||
|
7cdb5b1ed9 | ||
|
617ce141d0 | ||
|
2d04fbe049 | ||
|
0ae425525d | ||
|
f7e816c014 | ||
|
2368fca0f1 | ||
|
719fedbd93 | ||
|
a1d2d4181b | ||
|
3eaa44b358 | ||
|
aee7fc502c | ||
|
9210a97d48 | ||
|
64fad81e10 | ||
|
7056241f37 | ||
|
065c8a6cdf | ||
|
636b7133a1 | ||
|
ed09fd3610 |
@ -19,7 +19,7 @@ tasks:
|
||||
- push
|
||||
- tag
|
||||
branches:
|
||||
- master
|
||||
- r0.9
|
||||
|
||||
scopes: [
|
||||
"queue:create-task:highest:proj-deepspeech/*",
|
||||
@ -32,7 +32,7 @@ tasks:
|
||||
|
||||
payload:
|
||||
maxRunTime: 600
|
||||
image: "ubuntu:16.04"
|
||||
image: "ubuntu:18.04"
|
||||
|
||||
features:
|
||||
taskclusterProxy: true
|
||||
@ -45,7 +45,7 @@ tasks:
|
||||
- "--login"
|
||||
- "-cxe"
|
||||
- >
|
||||
echo "deb http://archive.ubuntu.com/ubuntu/ xenial-updates main" > /etc/apt/sources.list.d/xenial-updates.list &&
|
||||
echo "deb http://archive.ubuntu.com/ubuntu/ bionic-updates main" > /etc/apt/sources.list.d/bionic-updates.list &&
|
||||
apt-get -qq update && apt-get -qq -y install git python3-pip curl sudo &&
|
||||
adduser --system --home /home/build-user build-user &&
|
||||
cd /home/build-user/ &&
|
||||
|
@ -15,11 +15,11 @@ Prerequisites for training a model
|
||||
Getting the training code
|
||||
^^^^^^^^^^^^^^^^^^^^^^^^^
|
||||
|
||||
Clone the latest released stable branch from Github (e.g. 0.9.2, check `here <https://github.com/mozilla/DeepSpeech/releases>`_):
|
||||
Clone the latest released stable branch from Github (e.g. 0.9.3, check `here <https://github.com/mozilla/DeepSpeech/releases>`_):
|
||||
|
||||
.. code-block:: bash
|
||||
|
||||
git clone --branch v0.9.2 https://github.com/mozilla/DeepSpeech
|
||||
git clone --branch v0.9.3 https://github.com/mozilla/DeepSpeech
|
||||
|
||||
If you plan on committing code or you want to report bugs, please use the master branch.
|
||||
|
||||
|
@ -37,8 +37,8 @@ If you want to use the pre-trained English model for performing speech-to-text,
|
||||
|
||||
.. code-block:: bash
|
||||
|
||||
wget https://github.com/mozilla/DeepSpeech/releases/download/v0.9.1/deepspeech-0.9.1-models.pbmm
|
||||
wget https://github.com/mozilla/DeepSpeech/releases/download/v0.9.1/deepspeech-0.9.1-models.scorer
|
||||
wget https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/deepspeech-0.9.3-models.pbmm
|
||||
wget https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/deepspeech-0.9.3-models.scorer
|
||||
|
||||
There are several pre-trained model files available in official releases. Files ending in ``.pbmm`` are compatible with clients and language bindings built against the standard TensorFlow runtime. Usually these packages are simply called ``deepspeech``. These files are also compatible with CUDA enabled clients and language bindings. These packages are usually called ``deepspeech-gpu``. Files ending in ``.tflite`` are compatible with clients and language bindings built against the `TensorFlow Lite runtime <https://www.tensorflow.org/lite/>`_. These models are optimized for size and performance in low power devices. On desktop platforms, the compatible packages are called ``deepspeech-tflite``. On Android and Raspberry Pi, we only publish TensorFlow Lite enabled packages, and they are simply called ``deepspeech``. You can see a full list of supported platforms and which TensorFlow runtime is supported at :ref:`supported-platforms-inference`.
|
||||
|
||||
@ -136,7 +136,7 @@ Note: the following command assumes you `downloaded the pre-trained model <#gett
|
||||
|
||||
.. code-block:: bash
|
||||
|
||||
deepspeech --model deepspeech-0.9.1-models.pbmm --scorer deepspeech-0.9.1-models.scorer --audio my_audio_file.wav
|
||||
deepspeech --model deepspeech-0.9.3-models.pbmm --scorer deepspeech-0.9.3-models.scorer --audio my_audio_file.wav
|
||||
|
||||
The ``--scorer`` argument is optional, and represents an external language model to be used when transcribing the audio.
|
||||
|
||||
@ -200,7 +200,7 @@ Note: the following command assumes you `downloaded the pre-trained model <#gett
|
||||
|
||||
.. code-block:: bash
|
||||
|
||||
./deepspeech --model deepspeech-0.9.1-models.pbmm --scorer deepspeech-0.9.1-models.scorer --audio audio_input.wav
|
||||
./deepspeech --model deepspeech-0.9.3-models.pbmm --scorer deepspeech-0.9.3-models.scorer --audio audio_input.wav
|
||||
|
||||
See the help output with ``./deepspeech -h`` for more details.
|
||||
|
||||
|
@ -1 +1 @@
|
||||
Subproject commit df643fca46b4d8ab654f547ef2e36132f1154412
|
||||
Subproject commit 2b6ca883c073a7def7766dbbbd5d0d28fb84e612
|
@ -20,15 +20,15 @@ To install and use DeepSpeech all you have to do is:
|
||||
pip3 install deepspeech
|
||||
|
||||
# Download pre-trained English model files
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.1/deepspeech-0.9.1-models.pbmm
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.1/deepspeech-0.9.1-models.scorer
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/deepspeech-0.9.3-models.pbmm
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/deepspeech-0.9.3-models.scorer
|
||||
|
||||
# Download example audio files
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.1/audio-0.9.1.tar.gz
|
||||
tar xvf audio-0.9.1.tar.gz
|
||||
curl -LO https://github.com/mozilla/DeepSpeech/releases/download/v0.9.3/audio-0.9.3.tar.gz
|
||||
tar xvf audio-0.9.3.tar.gz
|
||||
|
||||
# Transcribe an audio file
|
||||
deepspeech --model deepspeech-0.9.1-models.pbmm --scorer deepspeech-0.9.1-models.scorer --audio audio/2830-3980-0043.wav
|
||||
deepspeech --model deepspeech-0.9.3-models.pbmm --scorer deepspeech-0.9.3-models.scorer --audio audio/2830-3980-0043.wav
|
||||
|
||||
A pre-trained English model is available for use and can be downloaded following the instructions in :ref:`the usage docs <usage-docs>`. For the latest release, including pre-trained models and checkpoints, `see the GitHub releases page <https://github.com/mozilla/DeepSpeech/releases/latest>`_.
|
||||
|
||||
@ -44,7 +44,7 @@ Quicker inference can be performed using a supported NVIDIA GPU on Linux. See th
|
||||
pip3 install deepspeech-gpu
|
||||
|
||||
# Transcribe an audio file.
|
||||
deepspeech --model deepspeech-0.9.1-models.pbmm --scorer deepspeech-0.9.1-models.scorer --audio audio/2830-3980-0043.wav
|
||||
deepspeech --model deepspeech-0.9.3-models.pbmm --scorer deepspeech-0.9.3-models.scorer --audio audio/2830-3980-0043.wav
|
||||
|
||||
Please ensure you have the required :ref:`CUDA dependencies <cuda-inference-deps>`.
|
||||
|
||||
|
@ -26,8 +26,8 @@ class SpeechRecognitionImpl : NSObject, AVCaptureAudioDataOutputSampleBufferDele
|
||||
private var audioData = Data()
|
||||
|
||||
override init() {
|
||||
let modelPath = Bundle.main.path(forResource: "deepspeech-0.9.1-models", ofType: "tflite")!
|
||||
let scorerPath = Bundle.main.path(forResource: "deepspeech-0.9.1-models", ofType: "scorer")!
|
||||
let modelPath = Bundle.main.path(forResource: "deepspeech-0.9.2-models", ofType: "tflite")!
|
||||
let scorerPath = Bundle.main.path(forResource: "deepspeech-0.9.2-models", ofType: "scorer")!
|
||||
|
||||
model = try! DeepSpeechModel(modelPath: modelPath)
|
||||
try! model.enableExternalScorer(scorerPath: scorerPath)
|
||||
|
@ -26,7 +26,7 @@ then:
|
||||
DEEPSPEECH_AUDIO: "https://github.com/mozilla/DeepSpeech/releases/download/v0.4.1/audio-0.4.1.tar.gz"
|
||||
PIP_DEFAULT_TIMEOUT: "60"
|
||||
EXAMPLES_CLONE_URL: "https://github.com/mozilla/DeepSpeech-examples"
|
||||
EXAMPLES_CHECKOUT_TARGET: "master"
|
||||
EXAMPLES_CHECKOUT_TARGET: "r0.9"
|
||||
|
||||
command:
|
||||
- "/bin/bash"
|
||||
|
@ -12,4 +12,4 @@ taskcluster:
|
||||
- push
|
||||
- tag
|
||||
branches:
|
||||
- master
|
||||
- r0.9
|
||||
|
@ -34,7 +34,7 @@ payload:
|
||||
MSYS: 'winsymlinks:nativestrict'
|
||||
GIT_LFS_SKIP_SMUDGE: '1'
|
||||
EXAMPLES_CLONE_URL: "https://github.com/mozilla/DeepSpeech-examples"
|
||||
EXAMPLES_CHECKOUT_TARGET: "master"
|
||||
EXAMPLES_CHECKOUT_TARGET: "r0.9"
|
||||
|
||||
command:
|
||||
- >-
|
||||
|
@ -1 +1 @@
|
||||
0.9.0-alpha.10
|
||||
0.9.3
|
||||
|
Loading…
Reference in New Issue
Block a user