Spaces:

Sebbe33
/

Transcription_gemini

Running

App Files Files Community

Sebbe33 committed on Feb 22

Commit

f91380b

verified ·

1 Parent(s): 835bf99

Update app.py

Browse files

Files changed (1) hide show

app.py +19 -32

app.py CHANGED Viewed

@@ -1,6 +1,5 @@
 import os
 import tempfile
 import streamlit as st
 from google import genai
 from jinja2 import Template
@@ -46,37 +45,18 @@ if st.button("Generate Transcript"):
             # Upload audio file
             uploaded_file = client.files.upload(file=tmp_file_path)
-            # Create prompt template
-            prompt_template = Template("""Generate a transcript of the episode. Include timestamps and identify speakers.
-Speakers are:
-{% for speaker in speakers %}- {{ speaker }}{% if not loop.last %}\n{% endif %}{% endfor %}
-eg:
-[00:00] Brady: Hello there.
-[00:02] Tim: Hi Brady.
-It is important to include the correct speaker names. Use the names you identified earlier. If you really don't know the speaker's name, identify them with a letter of the alphabet, eg there may be an unknown speaker 'A' and another unknown speaker 'B'.
-If there is music or a short jingle playing, signify like so:
-[01:02] [MUSIC] or [01:02] [JINGLE]
-If you can identify the name of the music or jingle playing then use that instead, eg:
-[01:02] [Firework by Katy Perry] or [01:02] [The Sofa Shop jingle]
-If there is some other sound playing try to identify the sound, eg:
-[01:02] [Bell ringing]
-Each individual caption should be quite short, a few short sentences at most.
-Signify the end of the episode with [END].
-Don't use any markdown formatting, like bolding or italics.
-Only use characters from the English alphabet, unless you genuinely believe foreign characters are correct.
-It is important that you use the correct words and spell everything correctly. Use the context of the podcast to help.
-If the hosts discuss something like a movie, book or celebrity, make sure the movie, book, or celebrity name is spelled correctly.""")
             prompt = prompt_template.render(speakers=speakers)
@@ -93,4 +73,11 @@ If the hosts discuss something like a movie, book or celebrity, make sure the mo
         except Exception as e:
             st.error(f"An error occurred: {str(e)}")
         finally:
-            os.remove(tmp_file_path)

 import os
 import tempfile
 import streamlit as st
 from google import genai
 from jinja2 import Template
             # Upload audio file
             uploaded_file = client.files.upload(file=tmp_file_path)
+            # New token counting functionality
+            try:
+                token_info = client.models.count_tokens(
+                    model='gemini-2.0-flash',
+                    contents=[uploaded_file]
+                )
+                st.info(f"File contains approximately {token_info.total_tokens} tokens")
+            except AttributeError:
+                st.warning("Token counting not available in current API version")
+            # Create prompt template
+            prompt_template = Template("""[...your existing template here...]""")
             prompt = prompt_template.render(speakers=speakers)
         except Exception as e:
             st.error(f"An error occurred: {str(e)}")
         finally:
+            os.remove(tmp_file_path)
+# Credits section in sidebar
+st.sidebar.markdown("""
+**Credits**
+- Transcription powered by [Gemini API](https://ai.google.dev/)
+- Heavy inspired by https://github.com/philschmid/gemini-samples/blob/main/examples/gemini-transcribe-with-timestamps.ipynb
+""")