20240127在ubuntu20.04.6下配置whisper

20240131在ubuntu20.04.6下配置whisper

2024/1/31 15:48

1、首先你要有一张NVIDIA的显卡，比如我用的是在拼多多（PDD）上买的二手GTX1080显卡【并且极有可能是矿卡！】，价格800￥。

2、请正确安装好NVIDIA最新的驱动程序和CUDA（可选安装）。

3、配置whisper

rootroot@rootroot-X99-Turbo:~$ python -m pip install --upgrade pip
【可以不安装conda】
rootroot@rootroot-X99-Turbo:~$ wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh
rootroot@rootroot-X99-Turbo:~$ ffmpeg
rootroot@rootroot-X99-Turbo:~$ pip install -U openai-whisper
rootroot@rootroot-X99-Turbo:~$ pip install tiktoken
rootroot@rootroot-X99-Turbo:~$ pip install setuptools-rust
rootroot@rootroot-X99-Turbo:~$ whisper audio.mp3 --model medium --language Chinese
rootroot@rootroot-X99-Turbo:~$ whisper chi.mp4 --model medium --language Chinese
rootroot@rootroot-X99-Turbo:~$ sudo apt-get install ffmpeg
rootroot@rootroot-X99-Turbo:~$ time(whisper chs.mp4 --model medium --language Chinese)

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ python -m pip install --upgrade pip

Collecting pip

Downloading pip-23.3.2-py3-none-any.whl (2.1 MB)

|████████████████████████████████| 2.1 MB 690 kB/s

Installing collected packages: pip

Successfully installed pip-23.3.2

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ sudo mkdir /opt/tools

rootroot@rootroot-X99-Turbo:~$ cd /opt/tools/

rootroot@rootroot-X99-Turbo:/opt/tools$

rootroot@rootroot-X99-Turbo:/opt/tools$ ll

total 8

drwxr-xr-x 2 root root 4096 1月 26 12:21 ./

drwxr-xr-x 4 root root 4096 1月 26 12:21 ../

rootroot@rootroot-X99-Turbo:/opt/tools$

rootroot@rootroot-X99-Turbo:/opt/tools$ cd ~

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ wget https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh

--2024-01-26 12:22:28-- https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh

Resolving repo.anaconda.com (repo.anaconda.com)... 104.16.130.3, 104.16.131.3, 2606:4700::6810:8203, ...

Connecting to repo.anaconda.com (repo.anaconda.com)|104.16.130.3|:443... connected.

HTTP request sent, awaiting response... 200 OK

Length: 141613749 (135M) [application/octet-stream]

Saving to: 'Miniconda3-latest-Linux-x86_64.sh'

Miniconda3-latest-Linux-x86_64.sh 100%[=============================================================================================>] 135.05M 2.82MB/s in 51s

2024-01-26 12:23:20 (2.65 MB/s) - 'Miniconda3-latest-Linux-x86_64.sh' saved [141613749/141613749]

rootroot@rootroot-X99-Turbo:~$ ffmpeg

built with gcc 9 (Ubuntu 9.4.0-1ubuntu1~20.04.1)

configuration: --prefix=/usr --extra-version=0ubuntu0.1 --toolchain=hardened --libdir=/usr/lib/x86_64-linux-gnu --incdir=/usr/include/x86_64-linux-gnu --arch=amd64 --enable-gpl --disable-stripping --enable-avresample --disable-filter=resample --enable-avisynth --enable-gnutls --enable-ladspa --enable-libaom --enable-libass --enable-libbluray --enable-libbs2b --enable-libcaca --enable-libcdio --enable-libcodec2 --enable-libflite --enable-libfontconfig --enable-libfreetype --enable-libfribidi --enable-libgme --enable-libgsm --enable-libjack --enable-libmp3lame --enable-libmysofa --enable-libopenjpeg --enable-libopenmpt --enable-libopus --enable-libpulse --enable-librsvg --enable-librubberband --enable-libshine --enable-libsnappy --enable-libsoxr --enable-libspeex --enable-libssh --enable-libtheora --enable-libtwolame --enable-libvidstab --enable-libvorbis --enable-libvpx --enable-libwavpack --enable-libwebp --enable-libx265 --enable-libxml2 --enable-libxvid --enable-libzmq --enable-libzvbi --enable-lv2 --enable-omx --enable-openal --enable-opencl --enable-opengl --enable-sdl2 --enable-libdc1394 --enable-libdrm --enable-libiec61883 --enable-nvenc --enable-chromaprint --enable-frei0r --enable-libx264 --enable-shared

libavutil 56. 31.100 / 56. 31.100

libavcodec 58. 54.100 / 58. 54.100

libavformat 58. 29.100 / 58. 29.100

libavdevice 58. 8.100 / 58. 8.100

libavfilter 7. 57.100 / 7. 57.100

libavresample 4. 0. 0 / 4. 0. 0

libswscale 5. 5.100 / 5. 5.100

libswresample 3. 5.100 / 3. 5.100

libpostproc 55. 5.100 / 55. 5.100

Hyper fast Audio and Video encoder

usage: ffmpeg [options] [[infile options] -i infile]... {[outfile options] outfile}...

Use -h to get full help or, even better, run 'man ffmpeg'

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ pip install -U openai-whisper

Defaulting to user installation because normal site-packages is not writeable

Requirement already satisfied: openai-whisper in ./.local/lib/python3.8/site-packages (20231117)

Requirement already satisfied: triton<3,>=2.0.0 in ./.local/lib/python3.8/site-packages (from openai-whisper) (2.2.0)

Requirement already satisfied: numba in ./.local/lib/python3.8/site-packages (from openai-whisper) (0.58.1)

Requirement already satisfied: numpy in ./.local/lib/python3.8/site-packages (from openai-whisper) (1.24.4)

Requirement already satisfied: torch in ./.local/lib/python3.8/site-packages (from openai-whisper) (2.1.2)

Requirement already satisfied: tqdm in ./.local/lib/python3.8/site-packages (from openai-whisper) (4.66.1)

Requirement already satisfied: more-itertools in ./.local/lib/python3.8/site-packages (from openai-whisper) (10.2.0)

Requirement already satisfied: tiktoken in ./.local/lib/python3.8/site-packages (from openai-whisper) (0.5.2)

Requirement already satisfied: filelock in ./.local/lib/python3.8/site-packages (from triton<3,>=2.0.0->openai-whisper) (3.13.1)

Requirement already satisfied: llvmlite<0.42,>=0.41.0dev0 in ./.local/lib/python3.8/site-packages (from numba->openai-whisper) (0.41.1)

Requirement already satisfied: importlib-metadata in ./.local/lib/python3.8/site-packages (from numba->openai-whisper) (7.0.1)

Requirement already satisfied: regex>=2022.1.18 in ./.local/lib/python3.8/site-packages (from tiktoken->openai-whisper) (2023.12.25)

Requirement already satisfied: requests>=2.26.0 in ./.local/lib/python3.8/site-packages (from tiktoken->openai-whisper) (2.31.0)

Requirement already satisfied: typing-extensions in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (4.9.0)

Requirement already satisfied: sympy in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (1.12)

Requirement already satisfied: networkx in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (3.1)

Requirement already satisfied: jinja2 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (3.1.3)

Requirement already satisfied: fsspec in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (2023.12.2)

Requirement already satisfied: nvidia-cuda-nvrtc-cu12==12.1.105 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.105)

Requirement already satisfied: nvidia-cuda-runtime-cu12==12.1.105 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.105)

Requirement already satisfied: nvidia-cuda-cupti-cu12==12.1.105 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.105)

Requirement already satisfied: nvidia-cudnn-cu12==8.9.2.26 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (8.9.2.26)

Requirement already satisfied: nvidia-cublas-cu12==12.1.3.1 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.3.1)

Requirement already satisfied: nvidia-cufft-cu12==11.0.2.54 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (11.0.2.54)

Requirement already satisfied: nvidia-curand-cu12==10.3.2.106 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (10.3.2.106)

Requirement already satisfied: nvidia-cusolver-cu12==11.4.5.107 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (11.4.5.107)

Requirement already satisfied: nvidia-cusparse-cu12==12.1.0.106 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.0.106)

Requirement already satisfied: nvidia-nccl-cu12==2.18.1 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (2.18.1)

Requirement already satisfied: nvidia-nvtx-cu12==12.1.105 in ./.local/lib/python3.8/site-packages (from torch->openai-whisper) (12.1.105)

Collecting triton<3,>=2.0.0 (from openai-whisper)

Downloading triton-2.1.0-0-cp38-cp38-manylinux2014_x86_64.manylinux_2_17_x86_64.whl.metadata (1.3 kB)

Requirement already satisfied: nvidia-nvjitlink-cu12 in ./.local/lib/python3.8/site-packages (from nvidia-cusolver-cu12==11.4.5.107->torch->openai-whisper) (12.3.101)

Requirement already satisfied: charset-normalizer<4,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.26.0->tiktoken->openai-whisper) (3.3.2)

Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken->openai-whisper) (2.8)

Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken->openai-whisper) (1.25.8)

Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken->openai-whisper) (2019.11.28)

Requirement already satisfied: zipp>=0.5 in ./.local/lib/python3.8/site-packages (from importlib-metadata->numba->openai-whisper) (3.17.0)

Requirement already satisfied: MarkupSafe>=2.0 in ./.local/lib/python3.8/site-packages (from jinja2->torch->openai-whisper) (2.1.3)

Requirement already satisfied: mpmath>=0.19 in ./.local/lib/python3.8/site-packages (from sympy->torch->openai-whisper) (1.3.0)

Downloading triton-2.1.0-0-cp38-cp38-manylinux2014_x86_64.manylinux_2_17_x86_64.whl (89.2 MB)

━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━ 89.2/89.2 MB 25.9 MB/s eta 0:00:00

Installing collected packages: triton

Attempting uninstall: triton

Found existing installation: triton 2.2.0

Uninstalling triton-2.2.0:

Successfully uninstalled triton-2.2.0

Successfully installed triton-2.1.0

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ pip install tiktoken

Defaulting to user installation because normal site-packages is not writeable

Requirement already satisfied: tiktoken in ./.local/lib/python3.8/site-packages (0.5.2)

Requirement already satisfied: regex>=2022.1.18 in ./.local/lib/python3.8/site-packages (from tiktoken) (2023.12.25)

Requirement already satisfied: requests>=2.26.0 in ./.local/lib/python3.8/site-packages (from tiktoken) (2.31.0)

Requirement already satisfied: charset-normalizer<4,>=2 in ./.local/lib/python3.8/site-packages (from requests>=2.26.0->tiktoken) (3.3.2)

Requirement already satisfied: idna<4,>=2.5 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken) (2.8)

Requirement already satisfied: urllib3<3,>=1.21.1 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken) (1.25.8)

Requirement already satisfied: certifi>=2017.4.17 in /usr/lib/python3/dist-packages (from requests>=2.26.0->tiktoken) (2019.11.28)

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ pip install setuptools-rust

Defaulting to user installation because normal site-packages is not writeable

Requirement already satisfied: setuptools-rust in ./.local/lib/python3.8/site-packages (1.8.1)

Requirement already satisfied: setuptools>=62.4 in ./.local/lib/python3.8/site-packages (from setuptools-rust) (69.0.3)

Requirement already satisfied: semantic-version<3,>=2.8.2 in ./.local/lib/python3.8/site-packages (from setuptools-rust) (2.10.0)

Requirement already satisfied: tomli>=1.2.1 in ./.local/lib/python3.8/site-packages (from setuptools-rust) (2.0.1)

rootroot@rootroot-X99-Turbo:~$ sudo apt update && sudo apt install ffmpeg

Get:1 file:/var/cuda-repo-ubuntu2004-12-0-local InRelease [1,575 B]

Get:2 file:/var/cuda-repo-ubuntu2004-12-3-local InRelease [1,572 B]

Get:1 file:/var/cuda-repo-ubuntu2004-12-0-local InRelease [1,575 B]

Get:2 file:/var/cuda-repo-ubuntu2004-12-3-local InRelease [1,572 B]

Hit:3 http://mirrors.tuna.tsinghua.edu.cn/ubuntu focal InRelease

Hit:4 http://mirrors.tuna.tsinghua.edu.cn/ubuntu focal-updates InRelease

Hit:5 http://mirrors.tuna.tsinghua.edu.cn/ubuntu focal-backports InRelease

Hit:6 http://security.ubuntu.com/ubuntu focal-security InRelease

Hit:7 http://ppa.launchpad.net/graphics-drivers/ppa/ubuntu focal InRelease

Reading package lists... Done

Building dependency tree

Reading state information... Done

30 packages can be upgraded. Run 'apt list --upgradable' to see them.

Reading package lists... Done

Building dependency tree

Reading state information... Done

ffmpeg is already the newest version (7:4.2.7-0ubuntu0.1).

0 upgraded, 0 newly installed, 0 to remove and 30 not upgraded.

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ whisper audio.mp3 --model medium --language Chinese

100%|█████████████████████████████████████| 1.42G/1.42G [03:24<00:00, 7.48MiB/s]

Traceback (most recent call last):

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 58, in load_audio

out = run(cmd, capture_output=True, check=True).stdout

File "/usr/lib/python3.8/subprocess.py", line 516, in run

raise CalledProcessError(retcode, process.args,

subprocess.CalledProcessError: Command '['ffmpeg', '-nostdin', '-threads', '0', '-i', 'audio.mp3', '-f', 's16le', '-ac', '1', '-acodec', 'pcm_s16le', '-ar', '16000', '-']' returned non-zero exit status 1.

The above exception was the direct cause of the following exception:

Traceback (most recent call last):

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/transcribe.py", line 478, in cli

result = transcribe(model, audio_path, temperature=temperature, **args)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/transcribe.py", line 122, in transcribe

mel = log_mel_spectrogram(audio, model.dims.n_mels, padding=N_SAMPLES)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 140, in log_mel_spectrogram

audio = load_audio(audio)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 60, in load_audio

raise RuntimeError(f"Failed to load audio: {e.stderr.decode()}") from e

built with gcc 9 (Ubuntu 9.4.0-1ubuntu1~20.04.1)

libavutil 56. 31.100 / 56. 31.100

libavcodec 58. 54.100 / 58. 54.100

libavformat 58. 29.100 / 58. 29.100

libavdevice 58. 8.100 / 58. 8.100

libavfilter 7. 57.100 / 7. 57.100

libavresample 4. 0. 0 / 4. 0. 0

libswscale 5. 5.100 / 5. 5.100

libswresample 3. 5.100 / 3. 5.100

libpostproc 55. 5.100 / 55. 5.100

audio.mp3: No such file or directory

built with gcc 9 (Ubuntu 9.4.0-1ubuntu1~20.04.1)

libavutil 56. 31.100 / 56. 31.100

libavcodec 58. 54.100 / 58. 54.100

libavformat 58. 29.100 / 58. 29.100

libavdevice 58. 8.100 / 58. 8.100

libavfilter 7. 57.100 / 7. 57.100

libavresample 4. 0. 0 / 4. 0. 0

libswscale 5. 5.100 / 5. 5.100

libswresample 3. 5.100 / 3. 5.100

libpostproc 55. 5.100 / 55. 5.100

audio.mp3: No such file or directory

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ whisper chi.mp4 --model medium --language Chinese

Traceback (most recent call last):

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 58, in load_audio

out = run(cmd, capture_output=True, check=True).stdout

File "/usr/lib/python3.8/subprocess.py", line 516, in run

raise CalledProcessError(retcode, process.args,

subprocess.CalledProcessError: Command '['ffmpeg', '-nostdin', '-threads', '0', '-i', 'chi.mp4', '-f', 's16le', '-ac', '1', '-acodec', 'pcm_s16le', '-ar', '16000', '-']' returned non-zero exit status 1.

The above exception was the direct cause of the following exception:

Traceback (most recent call last):

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/transcribe.py", line 478, in cli

result = transcribe(model, audio_path, temperature=temperature, **args)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/transcribe.py", line 122, in transcribe

mel = log_mel_spectrogram(audio, model.dims.n_mels, padding=N_SAMPLES)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 140, in log_mel_spectrogram

audio = load_audio(audio)

File "/home/rootroot/.local/lib/python3.8/site-packages/whisper/audio.py", line 60, in load_audio

raise RuntimeError(f"Failed to load audio: {e.stderr.decode()}") from e

built with gcc 9 (Ubuntu 9.4.0-1ubuntu1~20.04.1)

libavutil 56. 31.100 / 56. 31.100

libavcodec 58. 54.100 / 58. 54.100

libavformat 58. 29.100 / 58. 29.100

libavdevice 58. 8.100 / 58. 8.100

libavfilter 7. 57.100 / 7. 57.100

libavresample 4. 0. 0 / 4. 0. 0

libswscale 5. 5.100 / 5. 5.100

libswresample 3. 5.100 / 3. 5.100

libpostproc 55. 5.100 / 55. 5.100

chi.mp4: No such file or directory

built with gcc 9 (Ubuntu 9.4.0-1ubuntu1~20.04.1)

libavutil 56. 31.100 / 56. 31.100

libavcodec 58. 54.100 / 58. 54.100

libavformat 58. 29.100 / 58. 29.100

libavdevice 58. 8.100 / 58. 8.100

libavfilter 7. 57.100 / 7. 57.100

libavresample 4. 0. 0 / 4. 0. 0

libswscale 5. 5.100 / 5. 5.100

libswresample 3. 5.100 / 3. 5.100

libpostproc 55. 5.100 / 55. 5.100

chi.mp4: No such file or directory

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ sudo apt-get install ffmpeg

Reading package lists... Done

Building dependency tree

Reading state information... Done

ffmpeg is already the newest version (7:4.2.7-0ubuntu0.1).

0 upgraded, 0 newly installed, 0 to remove and 30 not upgraded.

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ ll *.mp4

-rwx------ 1 rootroot rootroot 3465644 1月 12 01:28 chs.mp4*

rootroot@rootroot-X99-Turbo:~$

rootroot@rootroot-X99-Turbo:~$ whisper chs.mp4 --model medium --language Chinese