hellorahulk commited on
Commit
c325e25
·
verified ·
1 Parent(s): 04f69e7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +44 -33
app.py CHANGED
@@ -12,10 +12,10 @@ def numbers_to_xlsx(numbers_file):
12
  Efficiently converts a Numbers file to XLSX format with optimized memory usage.
13
 
14
  Args:
15
- numbers_file: The uploaded Numbers file object.
16
 
17
  Returns:
18
- str: Path to the converted xlsx file, or error message if conversion fails.
19
  """
20
  if not numbers_file:
21
  return None
@@ -26,44 +26,55 @@ def numbers_to_xlsx(numbers_file):
26
  os.makedirs(output_dir, exist_ok=True)
27
  output_path = os.path.join(output_dir, "converted.xlsx")
28
 
29
- # Read the Numbers file efficiently
30
  doc = Document(numbers_file.name)
31
 
32
- # Validate document structure
33
- if not doc.sheets or not doc.sheets[0].tables:
 
 
34
  return None
 
 
 
35
 
36
- # Get the first table's data efficiently
37
- table = doc.sheets[0].tables[0]
38
-
39
- # Extract headers and data in one pass
40
- rows = list(table.rows(values_only=True))
41
- if not rows:
42
- return None
43
-
44
- headers = rows[0]
45
- data = rows[1:]
46
-
47
- # Use pandas optimized DataFrame construction
48
- df = pd.DataFrame(data, columns=headers)
49
-
50
- # Optimize Excel writing with correct options
51
- writer = pd.ExcelWriter(
52
- output_path,
53
- engine='openpyxl'
54
- )
55
-
56
- df.to_excel(
57
- writer,
58
- index=False,
59
- sheet_name='Sheet1'
60
- )
 
 
 
61
 
62
- # Freeze the header row using openpyxl directly
63
- writer.sheets['Sheet1'].freeze_panes = 'A2'
64
  writer.close()
65
 
66
- return output_path
 
 
 
 
 
67
 
68
  except Exception as e:
69
  print(f"Error converting file: {str(e)}")
 
12
  Efficiently converts a Numbers file to XLSX format with optimized memory usage.
13
 
14
  Args:
15
+ numbers_file: The uploaded Numbers file object from Gradio.
16
 
17
  Returns:
18
+ str: Path to the converted xlsx file, or None if conversion fails.
19
  """
20
  if not numbers_file:
21
  return None
 
26
  os.makedirs(output_dir, exist_ok=True)
27
  output_path = os.path.join(output_dir, "converted.xlsx")
28
 
29
+ # Read the Numbers file efficiently using the temporary path
30
  doc = Document(numbers_file.name)
31
 
32
+ # Get all sheets and validate
33
+ sheets = doc.sheets
34
+ if not sheets:
35
+ print("No sheets found in the document")
36
  return None
37
+
38
+ # Process each sheet
39
+ writer = pd.ExcelWriter(output_path, engine='openpyxl')
40
 
41
+ for sheet_index, sheet in enumerate(sheets):
42
+ if not sheet.tables:
43
+ continue
44
+
45
+ # Get the first table in the sheet
46
+ table = sheet.tables[0]
47
+
48
+ # Extract data
49
+ rows = list(table.rows(values_only=True))
50
+ if not rows:
51
+ continue
52
+
53
+ # Split headers and data
54
+ headers = rows[0] if rows else []
55
+ data = rows[1:] if len(rows) > 1 else []
56
+
57
+ # Create DataFrame and write to Excel
58
+ df = pd.DataFrame(data, columns=headers)
59
+ sheet_name = f"Sheet{sheet_index + 1}"
60
+
61
+ df.to_excel(
62
+ writer,
63
+ sheet_name=sheet_name,
64
+ index=False
65
+ )
66
+
67
+ # Freeze the header row
68
+ writer.sheets[sheet_name].freeze_panes = 'A2'
69
 
 
 
70
  writer.close()
71
 
72
+ # Verify the file was created and has content
73
+ if os.path.exists(output_path) and os.path.getsize(output_path) > 0:
74
+ return output_path
75
+ else:
76
+ print("Output file is empty or was not created")
77
+ return None
78
 
79
  except Exception as e:
80
  print(f"Error converting file: {str(e)}")