From b8df855b654cf28367535cef44549f7b737043b5 Mon Sep 17 00:00:00 2001 From: yumoqing Date: Mon, 20 Apr 2026 16:33:49 +0800 Subject: [PATCH] bugfix --- README.md | 511 ++++++++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 511 insertions(+) diff --git a/README.md b/README.md index e69de29..0b58a09 100644 --- a/README.md +++ b/README.md @@ -0,0 +1,511 @@ +# 在GPU上跑的服务 + +## clip.service +多媒体embedding服务,提供文本,图像,视频和音频的embedding服务 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +WorkingDirectory=/share/run/clip +ExecStart=/share/run/clip/start.sh +ExecStop=/share/run/clip/stop.sh +StandardOutput=append:/var/log/clip/clip.log +StandardError=append:/var/log/clip/clip.log +SyslogIdentifier=clip + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 使用的模型名:laion/CLIP-ViT-B-32-laion2B-s34B-b79K +* 模型路径 + +### 运行脚本 +``` +#!/bin/bash + +CUDA_VISIBLE_DEVICES=4 /share/vllm-0.8.5/bin/python -m llmengine +.mm_embedding -p 8882 +``` + +## entities.service +实体关系 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +WorkingDirectory=/share/run/entities +ExecStart=/share/run/entities/start.sh +ExecStop=/share/run/entities/stop.sh +StandardOutput=append:/var/log/entities/entities.log +StandardError=append:/var/log/entities/entities.log +SyslogIdentifier=entities + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +路径:/share/models/LTP/small + +### 运行脚本 +``` +#!/bin/bash + +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.entity -p 9990 /share/models/LTP/small +``` + +## f5tts.service +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=ymq +Group=ymq +WorkingDirectory=/share/ymq/run/f5tts +Type=forking +ExecStart=/share/ymq/run/f5tts/start.sh +ExecStop=/share/ymq/run/f5tts/stop.sh +StandardOutput=append:/var/log/f5tts/f5tts.log +StandardError=append:/var/log/f5tts/f5tts.log +SyslogIdentifier=f5tts + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 模型路径 +/share/models/SWivid/F5-TTS/F5TTS_v1_Base/model_1250000.safetensors + +### 软件仓库 +https://git.opencomputing.cn/yumoqing/f5tts + +### 执行脚本 +``` +#!/usr/bin/bash + +echo start 3 instances for f5tts engine +rundir=/share/ymq/run/f5tts +CUDA_VISIBLE_DEVICES=6 ${rundir}/f5tts.env/bin/python ${rundir}/app/f5tts.py -w ${rundir} -p 9995 & +CUDA_VISIBLE_DEVICES=6 ${rundir}/f5tts.env/bin/python ${rundir}/app/f5tts.py -w ${rundir} -p 9995 & +CUDA_VISIBLE_DEVICES=6 ${rundir}/f5tts.env/bin/python ${rundir}/app/f5tts.py -w ${rundir} -p 9995 & +CUDA_VISIBLE_DEVICES=6 ${rundir}/f5tts.env/bin/python ${rundir}/app/f5tts.py -w ${rundir} -p 9995 & +``` + +f5tts.service +## fastwhisper.service +ASR模型 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=ymq +Group=ymq +Type=forking +WorkingDirectory=/d/ymq/run/fastwhisper +ExecStart=/d/ymq/run/fastwhisper/start.sh +ExecStop=/d/ymq/run/fastwhisper/stop.sh +StandardOutput=append:/d/ymq/run/fastwhisper/logs/fastwhisper.log +StandardError=append:/d/ymq/run/fastwhisper/logs/fastwhisper.log +SyslogIdentifier=fastwhisper + +[Install] +WantedBy=multi-user.target +``` +### 模型 +* 路径 +/data/ymq/models/deepdml/faster-whisper-large-v3-turbo-ct2 + +### 软件仓库 +https://git.opencomputing.cn/yumoqing/fastwhisper + +### 执行脚本 +``` +cd /d/ymq/run/fastwhisper +/d/ymq/run/fastwhisper/py3/bin/python /d/ymq/run/fastwhisper/app/fastwhisper.py -w /d/ymq/run/fastwhisper & +exit 0 +``` + +## fvlm.service +fast vlm 模型服务 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=ymq +Group=ymq +Type=forking +WorkingDirectory=/share/ymq/run/fvlm +# ExecStart=/share/ymq/run/fvlm/fvlm.env/bin/python app/fastvlm.py -p 9994 +ExecStart=/share/ymq/run/fvlm/start.sh +ExecStop=/share/ymq/run/fvlm/stop.sh +StandardOutput=append:/var/log/fvlm/fvlm.log +StandardError=append:/var/log/fvlm/fvlm.log +SyslogIdentifier=fvlm + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 路径 +/share/models/apple/llava-fastvithd_0.5b_stage3 + +### 软件仓库 +https://git.kaiyuancloud.cn/yumoqing/fvlm + +### 脚本 +``` +#!/usr/bin/bash + +CUDA_VISIBLE_DEVICES=6 /share/ymq/run/fvlm/fvlm.env/bin/python app/fastvlm.py -p 9994 & +``` +## m2m.service +多语言翻译 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +WorkingDirectory=/share/run/m2m +ExecStart=/share/run/m2m/start.sh +ExecStop=/share/run/m2m/stop.sh +StandardOutput=append:/var/log/m2m/m2m.log +StandardError=append:/var/log/m2m/m2m.log +SyslogIdentifier=m2m + +[Install] +WantedBy=multi-user.target +``` +### 模型 +* 路径 +/share/models/facebook/m2m100_1.2B + +### 运行脚本 +#!/bin/bash +``` +/share/vllm-0.8.5/bin/python -m llmengine.m2m -p 8883 /share/models/facebook/m2m100_1.2B +``` +## neo4j.service +知识图谱数据库 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +Type=forking +WorkingDirectory=/share/run/neo4j +ExecStart=/share/run/neo4j/start.sh +ExecStop=/share/run/neo4j/stop.sh +StandardOutput=append:/var/log/neo4j/neo4j.log +StandardError=append:/var/log/neo4j/neo4j.log +SyslogIdentifier=/share/run/neo4j +TimeoutStartSec=300 + +[Install] +WantedBy=multi-user.target +``` + +### 模型路径 +* 路径 + +### 软件仓库 +https://git.kaiyuancloud.cn/yumoqing/llmengine +### 运行脚本 +``` +#!/bin/bash +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.neo4j -p 8885 Neo4j & +``` +## nvidia-asr.service +英伟达的ASR模型 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=ymq +Group=ymq +Type=forking +WorkingDirectory=/share/ymq/run/nvidia-asr +ExecStart=/share/ymq/run/nvidia-asr/start.sh +ExecStop=/share/ymq/run/nvidia-asr/stop.sh +StandardOutput=append:/var/log/asr/asr.log +StandardError=append:/var/log/asr/asr.log +SyslogIdentifier=asr +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 路径 +/share/models/nvidia/parakeet-tdt-0.6b-v2/parakeet-tdt-0.6b-v2.nemo +### 软件仓库 +https://git.opencomputing.cn/yumoqing/nvidia-asr.git + +### 执行脚本 +``` +#!/usr/bin/bash + +rundir=/share/ymq/run/nvidia-asr +cd $rundir +CUDA_VISIBLE_DEVICES=6 $rundir/nvidia-asr.env/bin/python app/asr.py -p 9992 & +# CUDA_VISIBLE_DEVICES=6 $rundir/nvidia-asr.env/bin/python app/asr.py -p 9992 & +``` + + +## ollama.service +``` +[Unit] +Description=Ollama Service +After=network-online.target + +[Service] +ExecStart=/d/ollama/start.sh +# CUDA_VISIBLE_DEVICES=2,3 /usr/local/bin/ollama serve +User=ollama +Group=ollama +Restart=always +RestartSec=3 +Environment="PATH=/d/ymq/.local/bin:/d/ymq/bin:/d/ymq/bin:/usr/l +ocal/cuda-12/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/b +in:/sbin:/bin:/usr/games:/usr/local/games:/snap/bin" + +[Install] +WantedBy=default.target +``` + +## qwen3.service +qwen3-0.6b模型 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +WorkingDirectory=/share/run/qwen3 +Type=forking +ExecStart=/share/run/qwen3/start.sh +ExecStop=/share/run/qwen3/stop.sh +StandardOutput=append:/var/log/qwen3/qwen3.log +StandardError=append:/var/log/qwen3/qwen3.log +SyslogIdentifier=qwen3 + +[Install] +``` +### 模型 +* 路径 +/d/models/Qwen/Qwen3-0.6B + +### 执行脚本 +``` +#!/usr/bin/bash + +rundir=/share/run/qwen3 +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.server -w ${rundir} -p 9089 /d/models/Qwen/Qwen3-0.6B & +exit 0 +``` + +## qwen3coder.service +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +WorkingDirectory=/share/run/qwen3coder +Type=forking +ExecStart=/share/run/qwen3coder/start.sh +ExecStop=/share/run/qwen3coder/stop.sh +StandardOutput=append:/var/log/qwen3coder/qwen3coder.log +StandardError=append:/var/log/qwen3coder/qwen3coder.log +SyslogIdentifier=qwen3coder + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 路径 +/d/models/Qwen/Qwen3-Coder-30B-A3B-Instruct + +### 执行脚本 +``` +#!/usr/bin/bash + +rundir=/share/run/qwen3coder +CUDA_VISIBLE_DEVICES=0 /share/vllm-0.8.5/bin/python -m llmengine.server -w ${rundir} -p 9088 /d/models/Qwen/Qwen3-Coder-30B-A3B-Instruct & +exit 0 +``` +## reranker.service +``` +[Unit] +Description=A Rerank Service using Qwen3-Reranker-0.6B +# After=network.target DeepSeek70B-kyyds671b-ray.service +# Requires=DeepSeek70B-kyyds671b-ray.service +StartLimitIntervalSec=60 +StartLimitBurst=5 + +[Service] +# 核心启动参数(保持原有配置) +WorkingDirectory=/share/run/reranker +#定义环境变量,所有节点的启动脚本与服务需一致 +#Environment="NCCL_SOCKET_IFNAME=enp196s0f0np0" +#ExecStartPre=/data/kyyds671b/ray_check.sh +ExecStart=/share/run/reranker/start.sh +ExecStop=/share/run/reranker/stop.sh + +# 超时与停止控制(新增部分) +# 启动超时延长至 120 秒 +# TimeoutStartSec=120 +# 停止等待时间 30 秒 +# TimeoutStopSec=30 +# 优先发送 SIGINT 信号(更适合 Python 程序) +# KillSignal=SIGINT +# 最终强制终止信号 +# RestartKillSignal=SIGKILL +# 混合终止模式 +# KillMode=mixed +# 重启策略 +# Restart=on-failure +# RestartSec=10s +# 服务管理(保持原有配置+增强) +#Restart=always +#RestartSec=10 # 重启间隔从 5 秒调整为 10 秒 +#append 是继续写入相当于>> file是从新写入 相当于> +StandardOutput=append:/var/log/rerank/rerank.log +StandardError=append:/var/log/rerank/error.log +SyslogIdentifier=rerank +# 资源限制(保持可选配置) +#LimitNOFILE=65536 +#LimitNPROC=65536 +# GPU 支持 +#Environment=CUDA_VISIBLE_DEVICES=0,1 + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 路径 +/share/models/BAAI/bge-reranker-v2-m3 +### 脚本 +``` +#!/bin/bash + +# CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.rerank -p 9997 /d/ymq/models/Qwen/Qwen3-Reranker-0___6B +CUDA_VISIBLE_DEVICES=4 /share/vllm-0.8.5/bin/python -m llmengine.rerank -p 9997 /share/models/BAAI/bge-reranker-v2-m3 +``` + +## subtitler.service +歌曲歌词对齐服务 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=ymq +Group=ymq +Type=forking +WorkingDirectory=/d/ymq/py/subtitle +ExecStart=/d/ymq/py/subtitle/start.sh +ExecStop=/d/ymq/py/subtitle/stop.sh +StandardOutput=append:/var/log/subtitler/subtitler.log +StandardError=append:/var/log/subtitler/subtitler.log +SyslogIdentifier=subtitler + +[Install] +WantedBy=multi-user.target +``` +### 模型 +* 路径 +1 /data/ymq/models/MahmoudAshraf/mms-300m-1130-forced-aligner +对齐模型 +2 /data/ymq/models/mdx_models/UVR-MDX-NET-Voc_FT.onnx 分割人声和伴奏 + +### 仓库 +https://git.opencomputing.cn/yumoqing/subtitle +### 脚本 +``` +#!/usr/bin/bash +cd /d/ymq/py/subtitle +/d/ymq/py/subtitle/py3/bin/python /d/ymq/py/subtitle/app/subtitler.py -p 9901 -w /d/ymq/py/subtitle & +exit 0 +``` +## triples.service +获取三元组 +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +Type=forking +WorkingDirectory=/share/run/triples +ExecStart=/share/run/triples/start.sh +ExecStop=/share/run/triples/stop.sh +StandardOutput=append:/var/log/triples/triples.log +StandardError=append:/var/log/triples/triples.log +SyslogIdentifier=/share/run/triples + +[Install] +WantedBy=multi-user.target +``` + +### 模型 +* 路径 +/share/models/Babelscape/mrebel-large + +### 脚本 +``` +#!/bin/bash + +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.triple -p 9991 /share/models/Babelscape/mrebel-large & +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.triple -p 9991 /share/models/Babelscape/mrebel-large & +CUDA_VISIBLE_DEVICES=7 /share/vllm-0.8.5/bin/python -m llmengine.triple -p 9991 /share/models/Babelscape/mrebel-large & +``` + +## vdb.service +milvus向量数据库 + +``` +[Unit] +Wants=systemd-networkd.service + +[Service] +User=wangmeihua +Group=wangmeihua +Type=forking +WorkingDirectory=/d/wangmeihua/vdbtest/vdb +ExecStart=/d/wangmeihua/vdbtest/vdb/start.sh +ExecStop=/d/wangmeihua/vdbtest/vdb/stop.sh +StandardOutput=append:/var/log/vdb/vdb.log +StandardError=append:/var/log/vdb/vdb.log +SyslogIdentifier=vdb + +[Install] +WantedBy=multi-user.target +``` +### 仓库 +https://git.opencomputing.cn/yumoqing/vdb +### 脚本 +``` +#!/usr/bin/bash + +# 检查是否有 vdb 进程正在运行 +PID=$(ps aux | grep "vdbapp.py" | grep -v grep | awk '{print $2}' | head -1) + +if [ -n "$PID" ]; then + echo "错误:VDB 服务已在运行 (PID: $PID)" + echo "请先停止现有服务:kill $PID" + exit 1 +fi + +cd /share/wangmeihua/vdbtest/vdb +/share/wangmeihua/vdbtest/vdb/vdbvenv/bin/python /d/wangmeihua/vdbtest/vdb/app/vdbapp.py -p 8887 -w /d/wangmeihua/vdbtest/vdb & +echo "VDB 服务已启动 (PID: $!)" +exit 0 +```