import pandas as pd
import streamlit as st
import matplotlib.pyplot as plt
import matplotlib.font_manager as font_manager
import io
import base64
import os
from datetime import datetime, timedelta
import numpy as np
from matplotlib.backends.backend_agg import FigureCanvasAgg
from pypinyin import lazy_pinyin, Style
from matplotlib.backends.backend_pdf import PdfPages

def get_font(size=14):
    """Loads the specified font, with a fallback."""
    font_path = "simHei.ttc"
    if not os.path.exists(font_path):
        font_path = "SimHei.ttf"  # Fallback font
    if not os.path.exists(font_path):
        st.warning("Font file (simHei.ttc or SimHei.ttf) not found. Display may be incorrect.")
        return font_manager.FontProperties(size=size)
    return font_manager.FontProperties(fname=font_path, size=size)

def get_pinyin_abbr(text):
    """Gets the first letter of the Pinyin for the first two Chinese characters of a text."""
    if not isinstance(text, str):
        return ""
    # Extract the first two Chinese characters
    chars = [c for c in text if '\u4e00' <= c <= '\u9fff'][:2]
    if not chars:
        return ""
    pinyin_list = lazy_pinyin(chars, style=Style.FIRST_LETTER)
    return ''.join(pinyin_list).upper()

def process_schedule(file):
    """
    Processes the uploaded Excel file to extract and clean the movie schedule.
    This version also prepares all data fields needed for the new layout.
    """
    try:
        # Try to read the date from the specified cell
        date_df = pd.read_excel(file, header=None, skiprows=7, nrows=1, usecols=[3])
        date_str = pd.to_datetime(date_df.iloc[0, 0]).strftime('%Y-%m-%d')
        base_date = pd.to_datetime(date_str).date()
    except Exception:
        # Fallback to today's date if reading fails
        date_str = datetime.today().strftime('%Y-%m-%d')
        base_date = datetime.today().date()
    
    try:
        df = pd.read_excel(file, header=9, usecols=[1, 2, 4, 5])
        df.columns = ['Hall', 'StartTime', 'EndTime', 'Movie']
        
        # Data Cleaning
        df['Hall'] = df['Hall'].ffill()
        df.dropna(subset=['StartTime', 'EndTime', 'Movie'], inplace=True)
        df['Hall'] = df['Hall'].astype(str).str.extract(r'(\d+号)')
        df.dropna(subset=['Hall'], inplace=True) # Ensure rows without a hall number are dropped

        # Convert times to datetime objects
        df['StartTime_dt'] = pd.to_datetime(df['StartTime'], format='%H:%M', errors='coerce').apply(
            lambda t: t.replace(year=base_date.year, month=base_date.month, day=base_date.day) if pd.notnull(t) else t
        )
        df['EndTime_dt'] = pd.to_datetime(df['EndTime'], format='%H:%M', errors='coerce').apply(
            lambda t: t.replace(year=base_date.year, month=base_date.month, day=base_date.day) if pd.notnull(t) else t
        )
        
        df.dropna(subset=['StartTime_dt', 'EndTime_dt'], inplace=True)
        
        # Handle screenings that cross midnight
        df.loc[df['EndTime_dt'] < df['StartTime_dt'], 'EndTime_dt'] += timedelta(days=1)
        df = df.sort_values(['Hall', 'StartTime_dt'])
        
        # Merge consecutive screenings of the same movie
        merged_rows = []
        for _, group in df.groupby('Hall'):
            group = group.sort_values('StartTime_dt')
            current = None
            for _, row in group.iterrows():
                if current is None:
                    current = row.copy()
                else:
                    if row['Movie'] == current['Movie']:
                        current['EndTime_dt'] = row['EndTime_dt'] # Extend the end time
                    else:
                        merged_rows.append(current)
                        current = row.copy()
            if current is not None:
                merged_rows.append(current)
        
        if not merged_rows:
             return None, date_str

        merged_df = pd.DataFrame(merged_rows).reset_index(drop=True)
        
        # Adjust times as per original logic
        merged_df['StartTime_dt'] -= timedelta(minutes=10)
        merged_df['EndTime_dt'] -= timedelta(minutes=5)
        
        # --- New Data Preparation for Layout ---
        # 1. Create Index (序号)
        merged_df['Index'] = merged_df.groupby('Hall').cumcount() + 1
        # 2. Create Pinyin Abbreviation (拼音缩写)
        merged_df['Pinyin'] = merged_df['Movie'].apply(get_pinyin_abbr)
        # 3. Create Time String (时间)
        merged_df['TimeStr'] = merged_df['StartTime_dt'].dt.strftime('%H:%M') + ' - ' + merged_df['EndTime_dt'].dt.strftime('%H:%M')
        # 4. Clean Hall Number for display
        merged_df['Hall'] = merged_df['Hall'].str.replace('号', '')

        # Select and reorder columns as per requirement
        final_df = merged_df[['Hall', 'Index', 'Movie', 'Pinyin', 'TimeStr']]
        
        return final_df, date_str

    except Exception as e:
        st.error(f"An error occurred during file processing: {e}")
        return None, date_str


def create_print_layout(data, date_str):
    """
    Creates the print layout on an A4 page based on a dynamic grid system.
    """
    if data is None or data.empty:
        return None

    # --- 1. Layout Constants ---
    A4_WIDTH_IN, A4_HEIGHT_IN = 8.27, 11.69
    MARGIN_IN = 0.4
    USABLE_WIDTH_IN = A4_WIDTH_IN - (2 * MARGIN_IN)
    USABLE_HEIGHT_IN = A4_HEIGHT_IN - (2 * MARGIN_IN)

    # --- 2. Row and Font Calculation ---
    num_content_rows = len(data)
    total_grid_rows = num_content_rows + 2  # Add 2 for top/bottom padding rows
    row_height_in = USABLE_HEIGHT_IN / total_grid_rows
    # Calculate font size in points (1 inch = 72 points) to be 90% of row height
    font_size_pt = (row_height_in * 72) * 0.9
    content_font = get_font(font_size_pt)
    date_font = get_font(12)

    # --- 3. Column Width Calculation ---
    # Create a temporary figure to calculate text widths accurately
    temp_fig = plt.figure(figsize=(A4_WIDTH_IN, A4_HEIGHT_IN))
    canvas = FigureCanvasAgg(temp_fig)
    
    cols_to_measure = ['Hall', 'Index', 'Movie', 'Pinyin', 'TimeStr']
    col_widths_in = []

    for col in cols_to_measure:
        # Find the longest string in the column for measurement
        longest_item = max(data[col].astype(str).tolist(), key=len, default="")
        # Create a temporary text object to measure its width
        t = plt.text(0, 0, longest_item, fontproperties=content_font)
        # Get the bounding box of the text in display units and convert to inches
        bbox = t.get_window_extent(renderer=canvas.get_renderer())
        width_in = bbox.width / temp_fig.dpi
        col_widths_in.append(width_in * 1.1) # Add 10% padding
        t.remove()

    plt.close(temp_fig) # Close the temporary figure

    # Scale column widths to fit the usable page width
    total_calculated_width = sum(col_widths_in)
    scale_factor = USABLE_WIDTH_IN / total_calculated_width if total_calculated_width > 0 else 1
    final_col_widths_in = [w * scale_factor for w in col_widths_in]

    # --- 4. Figure and PDF/PNG Generation ---
    def process_figure(fig, ax):
        # Calculate grid coordinates in Axes units (0 to 1)
        col_widths_ax = [w / USABLE_WIDTH_IN for w in final_col_widths_in]
        row_height_ax = 1.0 / total_grid_rows
        
        x_coords_ax = [0] + np.cumsum(col_widths_ax).tolist()
        y_coords_ax = [1 - i * row_height_ax for i in range(total_grid_rows + 1)]

        # Add date string at the top-left of the usable area
        ax.text(0, 1, date_str, transform=ax.transAxes, fontproperties=date_font,
                ha='left', va='bottom', color='#A9A9A9')

        # --- Draw Grid and Content ---
        for i, row in data.iterrows():
            grid_row_index = i + 1  # Offset by 1 for the top padding row
            y_bottom = y_coords_ax[grid_row_index + 1]
            y_center = y_bottom + row_height_ax / 2

            # Draw bottom dotted line for the current row's cells
            ax.plot([0, 1], [y_bottom, y_bottom], transform=ax.transAxes,
                    linestyle=':', color='gray', linewidth=0.7)

            # Draw content for each cell in the row
            content_list = [row['Hall'], row['Index'], row['Movie'], row['Pinyin'], row['TimeStr']]
            for j, content in enumerate(content_list):
                x_left = x_coords_ax[j]
                x_center = x_left + col_widths_ax[j] / 2
                ax.text(x_center, y_center, content, transform=ax.transAxes,
                        fontproperties=content_font, ha='center', va='center')
        
        # --- Draw Vertical Grid Lines ---
        content_area_top_y = y_coords_ax[1]
        content_area_bottom_y = y_coords_ax[-2]
        for x in x_coords_ax[1:-1]:
            ax.plot([x, x], [content_area_bottom_y, content_area_top_y], transform=ax.transAxes,
                    linestyle=':', color='gray', linewidth=0.7)

        # --- Draw Black Separator Lines Between Halls ---
        hall_change_indices = data.index[data['Hall'] != data['Hall'].shift(-1)]
        for idx in hall_change_indices:
            # The line is at the bottom of the current row
            y_line = y_coords_ax[idx + 2] # +1 for top margin, +1 to get bottom of current row
            ax.plot([0, 1], [y_line, y_line], transform=ax.transAxes,
                    linestyle='-', color='black', linewidth=1.2)


    # Create figures for PNG and PDF
    png_fig = plt.figure(figsize=(A4_WIDTH_IN, A4_HEIGHT_IN), dpi=300)
    pdf_fig = plt.figure(figsize=(A4_WIDTH_IN, A4_HEIGHT_IN), dpi=300)
    
    # Configure axes to fill the usable area defined by margins
    ax_rect = [
        MARGIN_IN / A4_WIDTH_IN, MARGIN_IN / A4_HEIGHT_IN,
        USABLE_WIDTH_IN / A4_WIDTH_IN, USABLE_HEIGHT_IN / A4_HEIGHT_IN
    ]
    png_ax = png_fig.add_axes(ax_rect)
    pdf_ax = pdf_fig.add_axes(ax_rect)
    png_ax.axis('off')
    pdf_ax.axis('off')

    # Process both figures
    process_figure(png_fig, png_ax)
    process_figure(pdf_fig, pdf_ax)

    # Save PNG to buffer
    png_buffer = io.BytesIO()
    png_fig.savefig(png_buffer, format='png', pad_inches=0)
    png_buffer.seek(0)
    image_base64 = base64.b64encode(png_buffer.getvalue()).decode()
    plt.close(png_fig)

    # Save PDF to buffer
    pdf_buffer = io.BytesIO()
    pdf_fig.savefig(pdf_buffer, format='pdf', pad_inches=0)
    pdf_buffer.seek(0)
    pdf_base64 = base64.b64encode(pdf_buffer.getvalue()).decode()
    plt.close(pdf_fig)

    return {
        'png': f"data:image/png;base64,{image_base64}",
        'pdf': f"data:application/pdf;base64,{pdf_base64}"
    }

def display_pdf(base64_pdf):
    """Embeds the PDF in the Streamlit app for display."""
    pdf_display = f'<iframe src="{base64_pdf}" width="100%" height="800" type="application/pdf"></iframe>'
    return pdf_display

# --- Streamlit App Main Body ---
st.set_page_config(page_title="LED 屏幕时间表打印", layout="wide")
st.title("LED 屏幕时间表打印")

uploaded_file = st.file_uploader("选择打开【放映时间核对表.xls】文件", type=["xls"])

if uploaded_file:
    with st.spinner("文件正在处理中，请稍候..."):
        schedule, date_str = process_schedule(uploaded_file)
        if schedule is not None and not schedule.empty:
            output = create_print_layout(schedule, date_str)
            if output:
                # Create tabs to switch between PDF and PNG previews
                tab1, tab2 = st.tabs(["PDF 预览", "PNG 预览"])
                
                with tab1:
                    st.markdown(display_pdf(output['pdf']), unsafe_allow_html=True)
                
                with tab2:
                    st.image(output['png'], use_container_width=True)
            else:
                st.error("生成打印布局失败。")
        elif schedule is None:
             st.error("无法处理文件，请检查文件格式或内容是否正确。")
        else: # schedule is empty
             st.warning("处理完成，但文件中没有找到有效的排片数据。")