Spaces:
Sleeping
Sleeping
File size: 1,663 Bytes
06a53dc d90bac0 06a53dc b97fe69 d90bac0 b97fe69 e0683ca b97fe69 e0683ca 06a53dc b97fe69 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 |
import sqlite3
import os
def initialize_database():
"""Initialize the SQLite database and create the 'documents' table if it doesn't exist."""
# Connect to the SQLite database (or create it if it doesn't exist)
conn = sqlite3.connect('dataset.db')
cursor = conn.cursor()
# Create the 'documents' table if it doesn't exist
cursor.execute('''
CREATE TABLE IF NOT EXISTS documents (
id INTEGER PRIMARY KEY AUTOINCREMENT,
text TEXT NOT NULL,
topics TEXT
)
''')
# Commit changes and close the connection
conn.commit()
conn.close()
from huggingface_hub import HfApi
def commit_to_huggingface():
"""Commit the dataset.db file to the Hugging Face Space repository."""
api_token = os.getenv("hf_key")
api = HfApi(token=api_token)
# Replace with your Space's repository name
repo_id = "Danielrahmai1991/dataset_interface"
# Upload and commit the dataset.db file
api.upload_file(
path_or_fileobj="dataset.db",
path_in_repo="dataset.db",
repo_id=repo_id,
repo_type="space"
)
def save_to_db(chunks, topics=None):
"""Save chunks to the SQLite database."""
# Ensure the database and table are initialized
initialize_database()
# Connect to the database
conn = sqlite3.connect('dataset.db')
cursor = conn.cursor()
# Insert chunks into the database
for chunk in chunks:
cursor.execute('INSERT INTO documents (text, topics) VALUES (?, ?)', (chunk, topics))
# Commit changes and close the connection
conn.commit()
conn.close()
commit_to_huggingface()
|