name committed
Commit 6d3e512 · add files
Parent(s): eddec9a

Files changed:
- README.md +7 -4
- app.py +41 -0
- requirements.txt +5 -0
README.md
CHANGED
@@ -1,13 +1,16 @@
 ---
-title:
+title: mt-v1.0
 emoji: 😻
-colorFrom:
+colorFrom: purple
 colorTo: gray
 sdk: gradio
-sdk_version:
+sdk_version: 3.50.2
 app_file: app.py
 pinned: false
-license:
+license: apache-2.0
 ---
 
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
+
+
+rebuild
app.py
ADDED
@@ -0,0 +1,41 @@
+import gradio as gr
+from tow.model_byt5.tokenizer import Tokenizer_byt5
+from tow.model_byt5.model import Transformer_byt5
+import json
+import torch
+from huggingface_hub import hf_hub_download
+
+model_weights_path = hf_hub_download(repo_id="df-h/byt5-base-alibi-mt", filename="pytorch_model.bin")
+model_config_path = hf_hub_download(repo_id="df-h/byt5-base-alibi-mt", filename="config.json")
+
+def translate(inputs):
+    with open(model_config_path, 'r') as f:
+        config = json.load(f)
+
+    state_dict = torch.load(model_weights_path, map_location=torch.device('cpu'))
+    model = Transformer_byt5(config=config)
+    model.load_state_dict(state_dict)
+    model = model.eval()
+    tokenizer = Tokenizer_byt5()
+    ids = tokenizer(inputs, max_length=512)
+    len_pad = 512 - len(ids)
+    if len_pad > 0:
+        ids = ids + [0 for x in range(len_pad)]
+    print(ids)
+    inputs = torch.tensor([ids]).to(torch.device('cpu'))
+    outputs = model.generate(inputs, max_length=512)
+    text = tokenizer.ids2text(outputs.tolist()[0])
+    return text
+
+demo = gr.Interface(
+    fn=translate,
+    inputs=[
+        gr.components.Textbox(label="input", value="zh2en:一个描述实际事物的函数,其中的高频信息往往对应着很小的 “振幅”, 否则整个函数会很奇怪是个压扁的 “弹簧” ,不具实际意义。"),
+    ],
+    outputs=["text"],
+    cache_examples=False,
+    title="Translation",
+    description="Support tasks: en2es, en2ja, en2zh, ja2zh, es2zh, es2ja"
+)
+
+demo.launch(debug=True, share=True, server_name="0.0.0.0")
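Note on the handler above: hf_hub_download caches the downloaded files, but translate() still re-reads the config and rebuilds the model and tokenizer on every request. Below is a minimal sketch of an alternative layout, assuming the same tow API and the same df-h/byt5-base-alibi-mt checkpoint, that does the expensive setup once at import time so each Gradio call only tokenizes and generates. It is an illustration, not part of the commit.

import json
import torch
import gradio as gr
from huggingface_hub import hf_hub_download
from tow.model_byt5.tokenizer import Tokenizer_byt5
from tow.model_byt5.model import Transformer_byt5

# Fetch (or reuse the locally cached) weights and config once at startup.
weights_path = hf_hub_download(repo_id="df-h/byt5-base-alibi-mt", filename="pytorch_model.bin")
config_path = hf_hub_download(repo_id="df-h/byt5-base-alibi-mt", filename="config.json")

with open(config_path) as f:
    config = json.load(f)

# Build the model and tokenizer a single time and reuse them for every request.
model = Transformer_byt5(config=config)
model.load_state_dict(torch.load(weights_path, map_location="cpu"))
model.eval()
tokenizer = Tokenizer_byt5()

def translate(text):
    # Byte-level ids, right-padded to the fixed 512-token context used above.
    ids = tokenizer(text, max_length=512)
    ids = ids + [0] * max(0, 512 - len(ids))
    with torch.no_grad():  # inference only, no gradients needed
        outputs = model.generate(torch.tensor([ids]), max_length=512)
    return tokenizer.ids2text(outputs.tolist()[0])

demo = gr.Interface(fn=translate, inputs="text", outputs="text", title="Translation")
demo.launch(server_name="0.0.0.0")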
requirements.txt
ADDED
@@ -0,0 +1,5 @@
+transformers==4.36.2
+sentencepiece==0.1.99
+numpy==1.24.2
+torch==2.0.1
+-e git+https://github.com/repo/tow.git@a21644091cefd744ac1c8a87be4bae1e6a8c1898#egg=tow
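The last requirements line installs the tow package (which provides the Transformer_byt5 and Tokenizer_byt5 imports used in app.py) in editable mode from GitHub, pinned to a specific commit. For a local run outside the Space, the same set should install with a plain pip call, provided git is available for the VCS line:

pip install -r requirements.txt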