Merge branch 'master' of https://github.com/colourfulspring/DiffSinger

colourfulspring · colourfulspring · commit 9a3391c68d70 · 2022-08-18T16:45:00.000+08:00
diff --git a/.github/workflows/main.yml b/.github/workflows/main.yml
@@ -0,0 +1,44 @@
+# Manually triggered workflow: bundles the repository together with a portable
+# WinPython interpreter into a zip and publishes it as a build artifact.
+on:
+  workflow_dispatch:
+    inputs:
+      version:
+        description: '版本号'
+        default: '0.0.0'
+        required: true
+        type: string
+
+jobs:
+  pack-windows:
+    runs-on: ${{ matrix.os }}
+
+    strategy:
+      matrix:
+        os: [ 'windows-latest' ]
+
+    steps:
+    - uses: actions/checkout@v1
+
+    - name: Download Winpython
+      uses: carlosperate/download-file-action@v1.0.3
+      with:
+        file-url: https://github.com/winpython/winpython/releases/download/4.3.20210620/Winpython64-3.8.10.0dot.exe
+        file-name: Winpython64-3.8.10.0dot.exe
+        location: ${{ github.workspace }}
+
+    # The WinPython installer is a self-extracting archive, so 7z can unpack it
+    # directly into the workspace.
+    - name: Extract Winpython
+      run: 7z x -o"${{ github.workspace }}" "${{ github.workspace }}/Winpython64-3.8.10.0dot.exe"
+
+    - name: Install python packages
+      run: .\build.bat
+
+    # Drop the installer so it is not included in the packed zip.
+    - name: remove Winpython installer
+      run: del "${{ github.workspace }}/Winpython64-3.8.10.0dot.exe"
+
+    - name: pack
+      run: 7z a .\diffsinger-server.zip .\*
+
+    # upload-artifact v1 has been retired by GitHub and no longer runs;
+    # v4 accepts the same `name` / `path` inputs.
+    - name: upload
+      uses: actions/upload-artifact@v4
+      with:
+        name: diffsinger-server-cpu-${{ inputs.version }}.zip
+        path: ${{ github.workspace }}\diffsinger-server.zip
diff --git a/.gitignore b/.gitignore
@@ -8,4 +8,8 @@ local_tools/
 *.wav
 infer_out/
 config.yaml
-*.onnx
+*.onnx
+
+.vscode
+WPy64-38100
+Winpython64-3.8.10.0dot.exe
diff --git a/build.bat b/build.bat
@@ -0,0 +1,5 @@
+REM Install the CPU-only PyTorch wheels and the project requirements into the
+REM bundled WinPython interpreter. "%%2B" becomes a literal "%2B" (the
+REM URL-encoded "+") once cmd.exe collapses the doubled percent sign.
+setlocal
+set "PY=WPy64-38100\python-3.8.10.amd64\python"
+REM Stop at the first failed install so the caller sees a non-zero exit code
+REM instead of the status of whichever command happened to run last.
+%PY% -m pip install "https://download.pytorch.org/whl/cpu/torch-1.6.0%%2Bcpu-cp38-cp38-win_amd64.whl" || exit /b 1
+%PY% -m pip install https://download.pytorch.org/whl/torchaudio-0.6.0-cp38-none-win_amd64.whl || exit /b 1
+%PY% -m pip install "https://download.pytorch.org/whl/cpu/torchvision-0.7.0%%2Bcpu-cp38-cp38-win_amd64.whl" || exit /b 1
+%PY% -m pip install -r requirements_2080.txt || exit /b 1
+%PY% -m pip install -r requirements_server.txt || exit /b 1
diff --git a/requirements_server.txt b/requirements_server.txt
@@ -0,0 +1 @@
+pyzmq==23.2.0
diff --git a/run.bat b/run.bat
@@ -0,0 +1 @@
+REM Start server.py with the bundled WinPython interpreter. Both paths are
+REM relative, so this must be run from the directory that contains them.
+WPy64-38100\python-3.8.10.amd64\python.exe server.py
diff --git a/server.py b/server.py
@@ -0,0 +1,145 @@
+# coding=utf8
+print('Starting diffsinger server...')
+import json
+import os
+import sys
+import traceback
+import zmq
+
+from inference.svs.ds_e2e import DiffSingerE2EInfer
+
+notedict={
+    0:"C",
+    1:"C#",
+    2:"D",
+    3:"D#",
+    4:"E",
+    5:"F",
+    6:"F#",
+    7:"G",
+    8:"G#",
+    9:"A",
+    10:"A#",
+    11:"B"
+}
+
+def poll_socket(socket, timetick = 100):
+    poller = zmq.Poller()
+    poller.register(socket, zmq.POLLIN)
+    # wait up to 100msec
+    try:
+        while True:
+            obj = dict(poller.poll(timetick))
+            if socket in obj and obj[socket] == zmq.POLLIN:
+                yield socket.recv()
+    except KeyboardInterrupt:
+        pass
+    # Escape while loop if there's a keyboard interrupt.
+
+def readblocks(ustfile):
+    #迭代器，从ust文件中逐个读取块，以字典形式返回
+    current_block_data=dict()
+    for line in ustfile.readlines():
+        if(line.startswith("[")):#块的开始
+            #先返回上一个
+            if(len(current_block_data)>=1):
+                yield current_block_data
+            #然后开新块
+            current_block_data={"name":line.strip("[#]\n")}
+            pass
+        else:
+            (key,value)=line.strip("\n").split("=")
+            current_block_data[key]=value
+            pass
+    if(len(current_block_data)>=1):#返回最后一个
+        yield current_block_data
+
+def acoustic(ustpath:str):
+    #解析ust文件为diffsinger所需格式
+    #参考：main.py
+    wavpath=ustpath[:-4]+".wav"
+
+    tempo=120
+    project=""
+    voiceDir=""
+    cacheDir=""
+    
+    ph_seq=[]
+    note_seq=[]
+    ph_dur=[]
+    is_slur_seq=[]
+
+    with open(ustpath) as ustfile:
+        for block in readblocks(ustfile):
+            if(block["name"]=="SETTING"):#音轨信息块
+                tempo=float(block["Tempo"])
+                project=block["Project"]
+                voiceDir=block["VoiceDir"]
+                cacheDir=block["CacheDir"]
+            elif(block["name"].isdigit()):#音符
+                lyric=block["Lyric"]
+                notenum=int(block["NoteNum"])
+                length=int(block["Length"])
+                if(lyric=="-"):#；连音符
+                    ph_seq.append(ph_seq[-1])
+                    note_seq.append(notedict[notenum%12]+str(notenum//12-1))
+                    ph_dur.append(str(length/(tempo*8)))
+                    is_slur_seq.append("1")
+                elif(lyric!="R"):
+                    ph_seq.append(lyric)
+                    note_seq.append(notedict[notenum%12]+str(notenum//12-1))
+                    ph_dur.append(str(length/(tempo*8)))
+                    is_slur_seq.append("0")
+    ph_seq=" ".join(ph_seq)
+    print("Phonemes:",ph_seq)
+    inp={
+        "text":"",
+        "ph_seq":ph_seq,
+        "note_seq":" ".join(note_seq),
+        "ph_dur":" ".join(ph_dur),
+        "note_dur_seq":" ".join(ph_dur),
+        "is_slur_seq":" ".join(is_slur_seq),
+        'input_type': 'phoneme'
+    }
+    #合成
+    DiffSingerE2EInfer.example_run(inp, target=wavpath)
+    return {
+        'path_wav': wavpath,
+    }
+
+# The argv override lives at module level (outside main) to make debugging easier.
+# It replaces the process arguments with a fixed --config / --exp_name pair;
+# presumably the DiffSinger inference code parses these -- verify against
+# inference/svs/ds_e2e.py.
+# NOTE(review): os.path.dirname(__file__) can be an empty string when the script
+# is launched by a bare relative name, which makes the paths below start with "/".
+root_dir = os.path.dirname(__file__)
+sys.argv = [
+f'{root_dir}/inference/svs/ds_e2e.py',
+'--config',
+f'{root_dir}/usr/configs/midi/e2e/opencpop/ds100_adj_rel.yaml',
+'--exp_name',
+'0228_opencpop_ds100_rel']
+
+def main():
+    context = zmq.Context()
+    socket = context.socket(zmq.REP)
+    socket.bind('tcp://*:38442')
+    print('Started diffsinger server')
+
+    for message in poll_socket(socket):
+        request = json.loads(message)
+        print("="*40)
+        print('Received request: %s' % request)
+        response = {}
+        try:
+            #if request[0] == 'timing':
+            #    response['result'] = timing(request[1])
+            if request[0] == 'acoustic':
+                response['result'] = acoustic(request[1])
+            else:
+                raise NotImplementedError('unexpected command %s' % request[0])
+        except Exception as e:
+            response['error'] = str(e)
+            traceback.print_exc()
+
+        print('Sending response: %s' % response)
+        socket.send_string(json.dumps(response))
+
+if(__name__=="__main__"):
+    main()
diff --git a/utils/hparams.py b/utils/hparams.py
@@ -45,7 +45,11 @@ def set_hparams(config='', exp_name='', hparams_str='', print_hparams=True, glob
     loaded_config = set()
 
     def load_config(config_fn):  # deep first
-        with open(config_fn, encoding='utf-8') as f:
+        if(config_fn.startswith("/")):
+            config_fn_path=os.path.abspath(config_fn[1:])
+        else:
+            config_fn_path=config_fn
+        with open(config_fn_path, encoding='utf-8') as f:
             hparams_ = yaml.safe_load(f)
         loaded_config.add(config_fn)
         if 'base_config' in hparams_:

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1 @@`
	`1`	`+WPy64-38100\python-3.8.10.amd64\python.exe server.py`