Deploying text-generation-webui

Hello everybody,

I would be really thankful if you could help.
I am trying to deploy oobabooga/text-generation-webui (from GitHub), a Gradio web UI for Large Language Models that supports transformers, GPTQ, AWQ, llama.cpp (GGUF), and Llama models.
Unfortunately, I always get an email saying that the free-builder crashed due to insufficient RAM, and the build fails with this error:

 => ERROR [builder 6/6] RUN . /build/venv/bin/activate &&     python3 setup_cuda.py bdist_wheel -d .                           580.7s
------
 > [builder 6/6] RUN . /build/venv/bin/activate &&     python3 setup_cuda.py bdist_wheel -d .:
#0 4.231 No CUDA runtime is found, using CUDA_HOME='/usr/local/cuda'
#0 4.269 running bdist_wheel
#0 4.328 running build
#0 4.328 running build_ext
#0 4.348 /build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py:424: UserWarning: There are no x86_64-linux-gnu-g++ version bounds defined for CUDA version 11.8
#0 4.348   warnings.warn(f'There are no {compiler_name} version bounds defined for CUDA version {cuda_str_version}')
#0 4.348 building 'quant_cuda' extension
#0 4.348 creating /build/build
#0 4.349 creating /build/build/temp.linux-x86_64-cpython-310
#0 4.390 Emitting ninja build file /build/build/temp.linux-x86_64-cpython-310/build.ninja...
#0 4.403 Compiling objects...
#0 4.403 Allowing ninja to set a default number of workers... (overridable by setting the environment variable MAX_JOBS=N)
#0 563.9 [1/2] /usr/local/cuda/bin/nvcc  -I/build/venv/lib/python3.10/site-packages/torch/include -I/build/venv/lib/python3.10/site-packages/torch/include/torch/csrc/api/include -I/build/venv/lib/python3.10/site-packages/torch/include/TH -I/build/venv/lib/python3.10/site-packages/torch/include/THC -I/usr/local/cuda/include -I/build/venv/include -I/usr/include/python3.10 -c -c /build/quant_cuda_kernel.cu -o /build/build/temp.linux-x86_64-cpython-310/quant_cuda_kernel.o -D__CUDA_NO_HALF_OPERATORS__ -D__CUDA_NO_HALF_CONVERSIONS__ -D__CUDA_NO_BFLOAT16_CONVERSIONS__ -D__CUDA_NO_HALF2_OPERATORS__ --expt-relaxed-constexpr --compiler-options ''"'"'-fPIC'"'"'' -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1011"' -DTORCH_EXTENSION_NAME=quant_cuda -D_GLIBCXX_USE_CXX11_ABI=0 -gencode=arch=compute_35,code=sm_35 -gencode=arch=compute_50,code=sm_50 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_61,code=sm_61 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_86,code=compute_86 -gencode=arch=compute_86,code=sm_86 -std=c++17
#0 563.9 FAILED: /build/build/temp.linux-x86_64-cpython-310/quant_cuda_kernel.o 
#0 563.9 /usr/local/cuda/bin/nvcc  -I/build/venv/lib/python3.10/site-packages/torch/include -I/build/venv/lib/python3.10/site-packages/torch/include/torch/csrc/api/include -I/build/venv/lib/python3.10/site-packages/torch/include/TH -I/build/venv/lib/python3.10/site-packages/torch/include/THC -I/usr/local/cuda/include -I/build/venv/include -I/usr/include/python3.10 -c -c /build/quant_cuda_kernel.cu -o /build/build/temp.linux-x86_64-cpython-310/quant_cuda_kernel.o -D__CUDA_NO_HALF_OPERATORS__ -D__CUDA_NO_HALF_CONVERSIONS__ -D__CUDA_NO_BFLOAT16_CONVERSIONS__ -D__CUDA_NO_HALF2_OPERATORS__ --expt-relaxed-constexpr --compiler-options ''"'"'-fPIC'"'"'' -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1011"' -DTORCH_EXTENSION_NAME=quant_cuda -D_GLIBCXX_USE_CXX11_ABI=0 -gencode=arch=compute_35,code=sm_35 -gencode=arch=compute_50,code=sm_50 -gencode=arch=compute_60,code=sm_60 -gencode=arch=compute_61,code=sm_61 -gencode=arch=compute_70,code=sm_70 -gencode=arch=compute_75,code=sm_75 -gencode=arch=compute_80,code=sm_80 -gencode=arch=compute_86,code=compute_86 -gencode=arch=compute_86,code=sm_86 -std=c++17
#0 563.9 nvcc warning : The 'compute_35', 'compute_37', 'sm_35', and 'sm_37' architectures are deprecated, and may be removed in a future release (Use -Wno-deprecated-gpu-targets to suppress warning).
#0 563.9 Killed
#0 579.6 [2/2] c++ -MMD -MF /build/build/temp.linux-x86_64-cpython-310/quant_cuda.o.d -Wno-unused-result -Wsign-compare -DNDEBUG -g -fwrapv -O2 -Wall -g -fstack-protector-strong -Wformat -Werror=format-security -g -fwrapv -O2 -fPIC -I/build/venv/lib/python3.10/site-packages/torch/include -I/build/venv/lib/python3.10/site-packages/torch/include/torch/csrc/api/include -I/build/venv/lib/python3.10/site-packages/torch/include/TH -I/build/venv/lib/python3.10/site-packages/torch/include/THC -I/usr/local/cuda/include -I/build/venv/include -I/usr/include/python3.10 -c -c /build/quant_cuda.cpp -o /build/build/temp.linux-x86_64-cpython-310/quant_cuda.o -DTORCH_API_INCLUDE_EXTENSION_H '-DPYBIND11_COMPILER_TYPE="_gcc"' '-DPYBIND11_STDLIB="_libstdcpp"' '-DPYBIND11_BUILD_ABI="_cxxabi1011"' -DTORCH_EXTENSION_NAME=quant_cuda -D_GLIBCXX_USE_CXX11_ABI=0 -std=c++17
#0 579.6 ninja: build stopped: subcommand failed.
#0 579.6 Traceback (most recent call last):
#0 579.6   File "/build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 2100, in _run_ninja_build
#0 579.6     subprocess.run(
#0 579.6   File "/usr/lib/python3.10/subprocess.py", line 526, in run
#0 579.6     raise CalledProcessError(retcode, process.args,
#0 579.6 subprocess.CalledProcessError: Command '['ninja', '-v']' returned non-zero exit status 1.
#0 579.6 
#0 579.6 The above exception was the direct cause of the following exception:
#0 579.6 
#0 579.6 Traceback (most recent call last):
#0 579.6   File "/build/setup_cuda.py", line 4, in <module>
#0 579.6     setup(
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/__init__.py", line 103, in setup
#0 579.6     return distutils.core.setup(**attrs)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/core.py", line 185, in setup
#0 579.6     return run_commands(dist)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/core.py", line 201, in run_commands
#0 579.6     dist.run_commands()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/dist.py", line 969, in run_commands
#0 579.6     self.run_command(cmd)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/dist.py", line 989, in run_command
#0 579.6     super().run_command(command)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/dist.py", line 988, in run_command
#0 579.6     cmd_obj.run()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/wheel/bdist_wheel.py", line 364, in run
#0 579.6     self.run_command("build")
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/cmd.py", line 318, in run_command
#0 579.6     self.distribution.run_command(command)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/dist.py", line 989, in run_command
#0 579.6     super().run_command(command)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/dist.py", line 988, in run_command
#0 579.6     cmd_obj.run()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/command/build.py", line 131, in run
#0 579.6     self.run_command(cmd_name)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/cmd.py", line 318, in run_command
#0 579.6     self.distribution.run_command(command)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/dist.py", line 989, in run_command
#0 579.6     super().run_command(command)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/dist.py", line 988, in run_command
#0 579.6     cmd_obj.run()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/command/build_ext.py", line 88, in run
#0 579.6     _build_ext.run(self)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/command/build_ext.py", line 345, in run
#0 579.6     self.build_extensions()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 873, in build_extensions
#0 579.6     build_ext.build_extensions(self)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/command/build_ext.py", line 467, in build_extensions
#0 579.6     self._build_extensions_serial()
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/command/build_ext.py", line 493, in _build_extensions_serial
#0 579.6     self.build_extension(ext)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/command/build_ext.py", line 249, in build_extension
#0 579.6     _build_ext.build_extension(self, ext)
#0 579.6   File "/build/venv/lib/python3.10/site-packages/setuptools/_distutils/command/build_ext.py", line 548, in build_extension
#0 579.6     objects = self.compiler.compile(
#0 579.6   File "/build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 686, in unix_wrap_ninja_compile
#0 579.6     _write_ninja_file_and_compile_objects(
#0 579.6   File "/build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 1774, in _write_ninja_file_and_compile_objects
#0 579.6     _run_ninja_build(
#0 579.6   File "/build/venv/lib/python3.10/site-packages/torch/utils/cpp_extension.py", line 2116, in _run_ninja_build
#0 579.6     raise RuntimeError(message) from e
#0 579.6 RuntimeError: Error compiling objects for extension
------
Error: failed to fetch an image or build from source: error building: failed to solve: executor failed running [/bin/sh -c . /build/venv/bin/activate &&     python3 setup_cuda.py bdist_wheel -d .]: exit code: 1