Spaces:

ahmedkasem
/

quran-nlp

Sleeping

App Files Files Community

deveix committed on Apr 22, 2024

Commit

c883d77

1 Parent(s): 8b248fd

add quran

Browse files

Files changed (3) hide show

app/main.py +25 -18
app/quran.csv +0 -0
requirements.txt +2 -1

app/main.py CHANGED Viewed

@@ -8,7 +8,7 @@ import uvicorn
 from dotenv import load_dotenv
 from fastapi.middleware.cors import CORSMiddleware
 from uuid import uuid4
-import httpx
 import joblib
 import librosa
@@ -113,18 +113,21 @@ def index_file(filepath):
     return index
-async def get_ayah_info(ayah):
-    """Asynchronously fetches Ayah information from the Al-Quran API."""
-    url = f"https://api.alquran.cloud/v1/search/{ayah}/all/ar"
-    async with httpx.AsyncClient() as client:
-        response = await client.get(url)
-        if response.status_code == 200:
-            return response.json()
-        else:
-            return {"error": "Failed to fetch data"}
-async def get_text_by_block_number(filepath, block_numbers):
     """ Retrieve specific blocks from a file based on block numbers, where each block is separated by '\n\n'. """
     blocks_text = []
     with open(filepath, 'r', encoding='utf-8') as file:
@@ -133,20 +136,24 @@ async def get_text_by_block_number(filepath, block_numbers):
         for block_number, block in enumerate(blocks, 1):  # Starting block numbers at 1 for human readability
             if block_number in block_numbers:
-                print(block)
                 splitted = block.split('\n')
                 ayah = splitted[0]
                 tafsir = splitted[1]
                 # Replace single newlines within blocks with space and strip leading/trailing whitespace
-                ayah_info = await get_ayah_info(ayah)  # This makes the API call
                 blocks_text.append({
-                    "ayah": ayah.replace("  ", ''),
                     "tafsir": tafsir,
-                    "ayah_info": ayah_info
-                    # "block": formatted_block
                 })
                 if len(blocks_text) == len(block_numbers):  # Stop reading once all required blocks are retrieved
                     break
     return blocks_text

 from dotenv import load_dotenv
 from fastapi.middleware.cors import CORSMiddleware
 from uuid import uuid4
+# import httpx
 import joblib
 import librosa
     return index
+# async def get_ayah_info(ayah):
+#     """Asynchronously fetches Ayah information from the Al-Quran API."""
+#     url = f"https://api.alquran.cloud/v1/search/{ayah}/all/ar"
+#     async with httpx.AsyncClient() as client:
+#         response = await client.get(url)
+#         if response.status_code == 200:
+#             return response.json()
+#         else:
+#             return {"error": "Failed to fetch data"}
+# async
+import pandas as pd
+df = pd.read_csv('/app/quran.csv')
+def get_text_by_block_number(filepath, block_numbers):
     """ Retrieve specific blocks from a file based on block numbers, where each block is separated by '\n\n'. """
     blocks_text = []
     with open(filepath, 'r', encoding='utf-8') as file:
         for block_number, block in enumerate(blocks, 1):  # Starting block numbers at 1 for human readability
             if block_number in block_numbers:
                 splitted = block.split('\n')
                 ayah = splitted[0]
                 tafsir = splitted[1]
                 # Replace single newlines within blocks with space and strip leading/trailing whitespace
+                # ayah_info = await get_ayah_info(ayah)  # This makes the API call
+                row_data = df.iloc[block_number].to_dict()
+                print(row_data)
                 blocks_text.append({
+                    #                 "ayah": ayah.replace("  ", ''),
+                    #                 "tafsir": tafsir,
+                    # "ayah": ayah.replace("  ", ''),
                     "tafsir": tafsir,
+                    **row_data
                 })
                 if len(blocks_text) == len(block_numbers):  # Stop reading once all required blocks are retrieved
                     break
     return blocks_text

app/quran.csv ADDED Viewed

The diff for this file is too large to render. See raw diff

requirements.txt CHANGED Viewed

@@ -20,4 +20,5 @@ python-multipart
 ffmpeg-python
 noisereduce
 scikit-learn==1.2.2
-httpx

 ffmpeg-python
 noisereduce
 scikit-learn==1.2.2
+# httpx
+pandas