Spaces:

M4869
/

WavMark

Runtime error

App Files Files Community

xxxfortest commited on Sep 16, 2023

Commit

7342b32

1 Parent(s): edb49b9

update

Browse files

Files changed (6) hide show

1_upload.sh +6 -1
app.py +47 -52
example.wav +0 -0
requirements.txt +1 -1
停泊/app.py +148 -0
停泊/requirements_bk.txt +6 -0

1_upload.sh CHANGED Viewed

@@ -1,3 +1,8 @@
 git add .
 git commit -m "Add application file"
-git push

+git config --global http.proxy http://127.0.0.1:7890
+git config --global https.proxy https://127.0.0.1:7890
 git add .
 git commit -m "Add application file"
+git push
+#git remote set-url origin https://huggingface.co/spaces/M4869/WavMark

app.py CHANGED Viewed

@@ -12,8 +12,8 @@ from huggingface_hub import hf_hub_download, HfApi
 from wavmark.utils import file_reader
-# Function to add watermark to audio
 def add_watermark(audio_path, watermark_text):
     assert len(watermark_text) == 16
     watermark_npy = np.array([int(i) for i in watermark_text])
     # todo: 控制时间
@@ -24,83 +24,74 @@ def add_watermark(audio_path, watermark_text):
     tmp_file_name = datetime.datetime.now().strftime('%Y-%m-%d_%H-%M-%S') + "_" + str(uuid.uuid4()) + ".wav"
     tmp_file_path = '/tmp/' + tmp_file_name
     soundfile.write(tmp_file_path, watermarked_signal, sr)
-    return tmp_file_path
-# Function to decode watermark from audio
 def decode_watermark(audio_path):
-    watermarked_signal, sr, audio_length_second = file_reader.read_as_single_channel_16k(audio_path, 16000)
     payload_decoded, _ = wavmark.decode_watermark(model, watermarked_signal, show_progress=False)
     if payload_decoded is None:
-        return "No Watermark"
-    return payload_decoded
-# Main web app
-def main():
-    max_upload_size = 20 * 1024 * 1024  # 20 MB in bytes
     if "def_value" not in st.session_state:
         def_val_npy = np.random.choice([0, 1], size=32 - len_start_bit)
         def_val_str = "".join([str(i) for i in def_val_npy])
         st.session_state.def_value = def_val_str
-    st.title("Neural Audio Watermark")
-    st.write("Choose the action you want to perform:")
-    action = st.selectbox("Select Action", ["Add Watermark", "Decode Watermark"])
-    if action == "Add Watermark":
-        audio_file = st.file_uploader("Upload Audio File (WAV)", type=["wav"], accept_multiple_files=False,
-                                      max_upload_size=max_upload_size)
-        if audio_file:
-            tmp_input_audio_file = os.path.join("/tmp/", audio_file.name)
-            with open(tmp_input_audio_file, "wb") as f:
-                f.write(audio_file.getbuffer())
-            st.audio(tmp_input_audio_file, format="audio/wav")
-            watermark_text = st.text_input("Enter Watermark", value=st.session_state.def_value)
             add_watermark_button = st.button("Add Watermark", key="add_watermark_btn")
             if add_watermark_button:  # 点击按钮后执行的
                 if audio_file and watermark_text:
                     with st.spinner("Adding Watermark..."):
-                        # add_watermark_button.empty()
-                        # st.button("Add Watermark", disabled=True)
-                        # st.button("Add Watermark", disabled=True, key="add_watermark_btn_disabled")
-                        t1 = time.time()
-                        watermarked_audio = add_watermark(tmp_input_audio_file, watermark_text)
-                        encode_time_cost = time.time() - t1
                         st.write("Watermarked Audio:")
                         st.audio(watermarked_audio, format="audio/wav")
-                        st.write("Time Cost:%d seconds" % encode_time_cost)
                         # st.button("Add Watermark", disabled=False)
-    elif action == "Decode Watermark":
-        audio_file = st.file_uploader("Upload Audio File (WAV/MP3)", type=["wav", "mp3"], accept_multiple_files=False,
-                                      max_upload_size=max_upload_size)
-        if audio_file:
-            if st.button("Decode Watermark"):
-                # 1.保存
-                tmp_file_for_decode_path = os.path.join("/tmp/", audio_file.name)
-                with open(tmp_file_for_decode_path, "wb") as f:
-                    f.write(audio_file.getbuffer())
-                # 2.执行
                 with st.spinner("Decoding..."):
-                    t1 = time.time()
-                    decoded_watermark = decode_watermark(tmp_file_for_decode_path)
-                    decode_cost = time.time() - t1
-                print("decoded_watermark", decoded_watermark)
-                # Display the decoded watermark
-                st.write("Decoded Watermark:", decoded_watermark)
-                st.write("Time Cost:%d seconds" % (decode_cost))
 if __name__ == "__main__":
@@ -108,5 +99,9 @@ if __name__ == "__main__":
     device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
     model = wavmark.load_model().to(device)
     main()

 from wavmark.utils import file_reader
 def add_watermark(audio_path, watermark_text):
+    t1 = time.time()
     assert len(watermark_text) == 16
     watermark_npy = np.array([int(i) for i in watermark_text])
     # todo: 控制时间
     tmp_file_name = datetime.datetime.now().strftime('%Y-%m-%d_%H-%M-%S') + "_" + str(uuid.uuid4()) + ".wav"
     tmp_file_path = '/tmp/' + tmp_file_name
     soundfile.write(tmp_file_path, watermarked_signal, sr)
+    encode_time_cost = time.time() - t1
+    return tmp_file_path, encode_time_cost
 def decode_watermark(audio_path):
+    assert os.path.exists(audio_path)
+    t1 = time.time()
+    watermarked_signal, _, audio_length_second = file_reader.read_as_single_channel_16k(audio_path, 16000)
+    max_second = 5
+    if audio_length_second > max_second:
+        watermarked_signal = watermarked_signal[0:16000 * max_second]
     payload_decoded, _ = wavmark.decode_watermark(model, watermarked_signal, show_progress=False)
+    decode_cost = time.time() - t1
     if payload_decoded is None:
+        return "No Watermark", decode_cost
+    payload_decoded_str = "".join([str(i) for i in payload_decoded])
+    st.write("Result:", payload_decoded_str)
+    st.write("Time Cost:%d seconds" % (decode_cost))
+def create_default_value():
     if "def_value" not in st.session_state:
         def_val_npy = np.random.choice([0, 1], size=32 - len_start_bit)
         def_val_str = "".join([str(i) for i in def_val_npy])
         st.session_state.def_value = def_val_str
+# Main web app
+def main():
+    create_default_value()
+    st.title("WavMark")
+    st.write("https://github.com/wavmark/wavmark")
+    audio_file = st.file_uploader("Upload Audio", type=["wav", "mp3"], accept_multiple_files=False)
+    if audio_file:
+        # 保存文件到本地：
+        tmp_input_audio_file = os.path.join("/tmp/", audio_file.name)
+        with open(tmp_input_audio_file, "wb") as f:
+            f.write(audio_file.getbuffer())
+        # 展示文件到页面上
+        # st.audio(tmp_input_audio_file, format="audio/wav")
+        action = st.selectbox("Select Action", ["Add Watermark", "Decode Watermark"])
+        if action == "Add Watermark":
+            watermark_text = st.text_input("The watermark (0, 1 list of length-16):", value=st.session_state.def_value)
             add_watermark_button = st.button("Add Watermark", key="add_watermark_btn")
             if add_watermark_button:  # 点击按钮后执行的
                 if audio_file and watermark_text:
                     with st.spinner("Adding Watermark..."):
+                        watermarked_audio, encode_time_cost = add_watermark(tmp_input_audio_file, watermark_text)
                         st.write("Watermarked Audio:")
+                        print("watermarked_audio:", watermarked_audio)
                         st.audio(watermarked_audio, format="audio/wav")
+                        st.write("Time Cost: %d seconds" % encode_time_cost)
                         # st.button("Add Watermark", disabled=False)
+        elif action == "Decode Watermark":
+            if st.button("Decode"):
                 with st.spinner("Decoding..."):
+                    decode_watermark(tmp_input_audio_file)
 if __name__ == "__main__":
     device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
     model = wavmark.load_model().to(device)
     main()
+    # audio_path = "/Users/my/Library/Mobile Documents/com~apple~CloudDocs/CODE/PycharmProjects/4_语音水印/419_huggingface水印/WavMark/example.wav"
+    # decoded_watermark, decode_cost = decode_watermark(audio_path)
+    # print(decoded_watermark)

example.wav ADDED Viewed

Binary file (257 kB). View file

requirements.txt CHANGED Viewed

@@ -1,4 +1,4 @@
-wavmark
 soundfile
 librosa
 resampy

+wavmark==0.0.2
 soundfile
 librosa
 resampy

停泊/app.py ADDED Viewed

	@@ -0,0 +1,148 @@

+import pdb
+import time
+import streamlit as st
+import os
+from utils import wm_add_v2, file_reader, model_util, wm_decode_v2, bin_util
+from models import my_model_v7_recover
+import torch
+import uuid
+import datetime
+import numpy as np
+import soundfile
+from huggingface_hub import hf_hub_download, HfApi
+# Function to add watermark to audio
+def add_watermark(audio_path, watermark_text):
+    assert len(watermark_text) == 5
+    start_bit, msg_bit, watermark = wm_add_v2.create_parcel_message(len_start_bit, 32, watermark_text)
+    data, sr, audio_length_second = file_reader.read_as_single_channel_16k(audio_path, 16000)
+    _, signal_wmd, time_cost = wm_add_v2.add_watermark(watermark, data, 16000, 0.1, device, model)
+    tmp_file_name = datetime.datetime.now().strftime('%Y-%m-%d_%H-%M-%S') + "_" + str(uuid.uuid4()) + ".wav"
+    tmp_file_path = '/tmp/' + tmp_file_name
+    soundfile.write(tmp_file_path, signal_wmd, sr)
+    return tmp_file_path
+# Function to decode watermark from audio
+def decode_watermark(audio_path):
+    data, sr, audio_length_second = file_reader.read_as_single_channel_16k(audio_path, 16000)
+    data = data[0:5 * sr]
+    start_bit = wm_add_v2.fix_pattern[0:len_start_bit]
+    support_count, mean_result, results = wm_decode_v2.extract_watermark_v2(
+        data,
+        start_bit,
+        0.1,
+        16000,
+        0.3,
+        model,
+        device, "best")
+    if mean_result is None:
+        return "No Watermark"
+    payload = mean_result[len_start_bit:]
+    return bin_util.binArray2HexStr(payload)
+# Main web app
+def main():
+    max_upload_size = 20 * 1024 * 1024  # 20 MB in bytes
+    if "def_value" not in st.session_state:
+        st.session_state.def_value = bin_util.binArray2HexStr(np.random.choice([0, 1], size=32 - len_start_bit))
+    st.title("Neural Audio Watermark")
+    st.write("Choose the action you want to perform:")
+    action = st.selectbox("Select Action", ["Add Watermark", "Decode Watermark"])
+    if action == "Add Watermark":
+        audio_file = st.file_uploader("Upload Audio File (WAV)", type=["wav"], accept_multiple_files=False,
+                                      max_upload_size=max_upload_size)
+        if audio_file:
+            tmp_input_audio_file = os.path.join("/tmp/", audio_file.name)
+            with open(tmp_input_audio_file, "wb") as f:
+                f.write(audio_file.getbuffer())
+            st.audio(tmp_input_audio_file, format="audio/wav")
+            watermark_text = st.text_input("Enter Watermark Text (5 English letters)", value=st.session_state.def_value)
+            add_watermark_button = st.button("Add Watermark", key="add_watermark_btn")
+            if add_watermark_button:  # 点击按钮后执行的
+                if audio_file and watermark_text:
+                    with st.spinner("Adding Watermark..."):
+                        # add_watermark_button.empty()
+                        # st.button("Add Watermark", disabled=True)
+                        # st.button("Add Watermark", disabled=True, key="add_watermark_btn_disabled")
+                        t1 = time.time()
+                        watermarked_audio = add_watermark(tmp_input_audio_file, watermark_text)
+                        encode_time_cost = time.time() - t1
+                        st.write("Watermarked Audio:")
+                        st.audio(watermarked_audio, format="audio/wav")
+                        st.write("Time Cost:%d seconds" % encode_time_cost)
+                        # st.button("Add Watermark", disabled=False)
+    elif action == "Decode Watermark":
+        audio_file = st.file_uploader("Upload Audio File (WAV/MP3)", type=["wav", "mp3"], accept_multiple_files=False,
+                                      max_upload_size=max_upload_size)
+        if audio_file:
+            if st.button("Decode Watermark"):
+                # 1.保存
+                tmp_file_for_decode_path = os.path.join("/tmp/", audio_file.name)
+                with open(tmp_file_for_decode_path, "wb") as f:
+                    f.write(audio_file.getbuffer())
+                # 2.执行
+                with st.spinner("Decoding..."):
+                    t1 = time.time()
+                    decoded_watermark = decode_watermark(tmp_file_for_decode_path)
+                    decode_cost = time.time() - t1
+                print("decoded_watermark", decoded_watermark)
+                # Display the decoded watermark
+                st.write("Decoded Watermark:", decoded_watermark)
+                st.write("Time Cost:%d seconds" % (decode_cost))
+def load_model(resume_path):
+    n_fft = 1000
+    hop_length = 400
+    # https://huggingface.co/M4869/InvertibleWM/blob/main/step59000_snr39.99_pesq4.35_BERP_none0.30_mean1.81_std1.81.pkl
+    # api_key = st.secrets["api_key"]
+    # print(api_key, api_key)
+    api_key = "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"
+    model_ckpt_path = hf_hub_download(repo_id="M4869/InvertibleWM",
+                                      filename="step59000_snr39.99_pesq4.35_BERP_none0.30_mean1.81_std1.81.pkl",
+                                      token=api_key
+                                      )
+    # print("model_ckpt_path", model_ckpt_path)
+    resume_path = model_ckpt_path
+    # return
+    model = my_model_v7_recover.Model(16000, 32, n_fft, hop_length,
+                                      use_recover_layer=False, num_layers=8).to(device)
+    checkpoint = torch.load(resume_path, map_location=torch.device('cpu'))
+    state_dict = model_util.map_state_dict(checkpoint['model'])
+    model.load_state_dict(state_dict, strict=True)
+    model.eval()
+    return model
+if __name__ == "__main__":
+    len_start_bit = 12
+    device = torch.device('cuda:0' if torch.cuda.is_available() else 'cpu')
+    model = load_model("./data/step59000_snr39.99_pesq4.35_BERP_none0.30_mean1.81_std1.81.pkl")
+    main()
+    # decode_watermark("/Users/my/Downloads/7a95b353a46893903e9f946c24170b210ce14e8c52c63bb2ab3d144e.wav")

停泊/requirements_bk.txt ADDED Viewed

	@@ -0,0 +1,6 @@

+soundfile
+librosa
+resampy
+torch==1.13.1
+torchvision==0.14.1
+torchaudio==0.13.1