Spaces:

Ethscriptions
/

LED-print

Sleeping

App Files Files Community

LED-print / app.py

Ethscriptions

Update app.py

41c541d verified 6 months ago

raw

history blame

12.1 kB

	import pandas as pd
	import streamlit as st
	import matplotlib.pyplot as plt
	import matplotlib.font_manager as font_manager
	import io
	import base64
	import os
	from datetime import datetime, timedelta
	import numpy as np
	from matplotlib.backends.backend_agg import FigureCanvasAgg
	from pypinyin import lazy_pinyin, Style
	from matplotlib.backends.backend_pdf import PdfPages

	def get_font(size=14):
	    """
	    Return matplotlib FontProperties for the bundled SimHei font.

	    The candidate files "simHei.ttc" and "SimHei.ttf" are looked up, in that
	    order, relative to the current working directory. When neither exists a
	    Streamlit warning is shown and default FontProperties (no explicit font
	    file) of the requested size are returned instead.
	    """
	    for candidate in ("simHei.ttc", "SimHei.ttf"):
	        if os.path.exists(candidate):
	            return font_manager.FontProperties(fname=candidate, size=size)

	    # No font file available: warn the user and let matplotlib pick its default.
	    st.warning("Font file (simHei.ttc or SimHei.ttf) not found. Display may be incorrect.")
	    return font_manager.FontProperties(size=size)

	def get_pinyin_abbr(text):
	    """
	    Return the upper-cased Pinyin initials of the first two Chinese characters.

	    Only characters in the range U+4E00..U+9FFF are considered. An empty string
	    is returned when `text` is not a str or contains no such character.
	    """
	    if not isinstance(text, str):
	        return ""

	    # Collect at most two Chinese characters, in order of appearance.
	    hanzi = []
	    for ch in text:
	        if '\u4e00' <= ch <= '\u9fff':
	            hanzi.append(ch)
	            if len(hanzi) == 2:
	                break

	    if not hanzi:
	        return ""

	    initials = lazy_pinyin(hanzi, style=Style.FIRST_LETTER)
	    return ''.join(initials).upper()

	def process_schedule(file):
	    """
	    Parse the uploaded Excel workbook into a per-hall schedule table.

	    The workbook is opened once and read twice: a single cell (row offset 7,
	    column 3) for the schedule date, and the table whose header is on row
	    offset 9 (columns 1, 2, 4, 5) for hall, start time, end time and movie.

	    Args:
	        file: Path or binary file-like object accepted by ``pd.ExcelFile``.

	    Returns:
	        ``(schedule, date_str)``. ``schedule`` is a DataFrame with the columns
	        ``Hall``, ``Index``, ``Movie``, ``Pinyin`` and ``TimeStr``, ordered by
	        numeric hall number and start time, or ``None`` when the file cannot
	        be processed or contains no usable rows. ``date_str`` is the schedule
	        date as ``YYYY-MM-DD`` (today's date when the date cell is unreadable).

	    Errors while reading or transforming the table are reported through
	    ``st.error`` rather than raised.
	    """
	    try:
	        workbook = pd.ExcelFile(file)
	    except Exception as e:
	        st.error(f"An error occurred during file processing: {e}")
	        return None, datetime.today().strftime('%Y-%m-%d')

	    with workbook:
	        date_str, base_date = _read_schedule_date(workbook)
	        try:
	            raw = workbook.parse(header=9, usecols=[1, 2, 4, 5])
	            return _build_schedule(raw, base_date), date_str
	        except Exception as e:
	            st.error(f"An error occurred during file processing: {e}")
	            return None, date_str


	def _read_schedule_date(workbook):
	    """Read the schedule date cell; fall back to today's date on any failure."""
	    try:
	        cell = workbook.parse(header=None, skiprows=7, nrows=1, usecols=[3]).iloc[0, 0]
	        stamp = pd.to_datetime(cell)
	        if pd.isna(stamp):
	            raise ValueError("schedule date cell is empty")
	        base_date = stamp.date()
	    except Exception:
	        # Deliberate best-effort: a missing or malformed date must not block
	        # processing. today() is evaluated once so the string and the date
	        # object can never disagree around midnight.
	        base_date = datetime.today().date()
	    return base_date.strftime('%Y-%m-%d'), base_date


	def _build_schedule(df, base_date):
	    """Clean the raw table, merge back-to-back screenings and add display columns."""
	    df.columns = ['Hall', 'StartTime', 'EndTime', 'Movie']

	    # Data cleaning: the hall label is only carried forward from the row above,
	    # and rows missing a time or a title are dropped.
	    df['Hall'] = df['Hall'].ffill()
	    df.dropna(subset=['StartTime', 'EndTime', 'Movie'], inplace=True)
	    # Keep only the digits that precede '号'; rows without a hall number are dropped.
	    df['Hall'] = df['Hall'].astype(str).str.extract(r'(\d+)号', expand=False)
	    df.dropna(subset=['Hall'], inplace=True)

	    # Combine each HH:MM value with the schedule date (vectorized): keep the
	    # parsed time of day and add it to midnight of base_date.
	    midnight = pd.Timestamp(base_date)
	    for source, target in (('StartTime', 'StartTime_dt'), ('EndTime', 'EndTime_dt')):
	        parsed = pd.to_datetime(df[source], format='%H:%M', errors='coerce')
	        df[target] = midnight + (parsed - parsed.dt.normalize())
	    df.dropna(subset=['StartTime_dt', 'EndTime_dt'], inplace=True)

	    # A screening whose end is earlier than its start crosses midnight.
	    crosses_midnight = df['EndTime_dt'] < df['StartTime_dt']
	    df.loc[crosses_midnight, 'EndTime_dt'] += timedelta(days=1)

	    # Sort halls numerically: a plain string sort would put hall 10 before hall 2.
	    df['HallNum'] = df['Hall'].astype(int)
	    df = df.sort_values(['HallNum', 'Hall', 'StartTime_dt'])
	    if df.empty:
	        return None

	    # Merge consecutive screenings of the same movie in the same hall: a new
	    # run starts whenever the hall or the movie differs from the previous row.
	    starts_new_run = (df['Hall'] != df['Hall'].shift()) | (df['Movie'] != df['Movie'].shift())
	    merged_df = (
	        df.groupby(starts_new_run.cumsum())
	        .agg(
	            Hall=('Hall', 'first'),
	            Movie=('Movie', 'first'),
	            StartTime_dt=('StartTime_dt', 'first'),
	            EndTime_dt=('EndTime_dt', 'last'),
	        )
	        .reset_index(drop=True)
	    )

	    # Shift the window: start 10 minutes earlier, end 5 minutes earlier.
	    # NOTE(review): offsets are kept from the original logic; the business
	    # reason is not visible in this file.
	    merged_df['StartTime_dt'] -= timedelta(minutes=10)
	    merged_df['EndTime_dt'] -= timedelta(minutes=5)

	    # Display columns: running number within each hall, Pinyin initials, time range.
	    merged_df['Index'] = merged_df.groupby('Hall').cumcount() + 1
	    merged_df['Pinyin'] = merged_df['Movie'].apply(get_pinyin_abbr)
	    merged_df['TimeStr'] = (
	        merged_df['StartTime_dt'].dt.strftime('%H:%M')
	        + ' - '
	        + merged_df['EndTime_dt'].dt.strftime('%H:%M')
	    )

	    return merged_df[['Hall', 'Index', 'Movie', 'Pinyin', 'TimeStr']]


	def create_print_layout(data, date_str):
	    """
	    Render the schedule as a single A4 page and return it as PNG and PDF.

	    The page is a grid with one row per schedule entry plus one empty padding
	    row at the top and one at the bottom. The font size is 90% of the row
	    height; if the widest entries would not fit the usable page width at that
	    size, the font is shrunk by the same factor as the columns so the text
	    stays inside its cells.

	    Args:
	        data: DataFrame with the columns ``Hall``, ``Index``, ``Movie``,
	            ``Pinyin`` and ``TimeStr``. Rows are drawn in their existing
	            order; the index labels are ignored.
	        date_str: Text drawn in grey above the top-left corner of the grid.

	    Returns:
	        ``None`` when ``data`` is ``None`` or empty, otherwise a dict with the
	        keys ``'png'`` and ``'pdf'`` holding base64 ``data:`` URIs.
	    """
	    if data is None or data.empty:
	        return None

	    # Row placement below is positional, so do not depend on the caller's index.
	    data = data.reset_index(drop=True)
	    columns = ['Hall', 'Index', 'Movie', 'Pinyin', 'TimeStr']

	    # --- 1. Layout constants (inches) ---
	    A4_WIDTH_IN, A4_HEIGHT_IN = 8.27, 11.69
	    MARGIN_IN = 0.4
	    USABLE_WIDTH_IN = A4_WIDTH_IN - (2 * MARGIN_IN)
	    USABLE_HEIGHT_IN = A4_HEIGHT_IN - (2 * MARGIN_IN)

	    # --- 2. Row height and font size ---
	    total_grid_rows = len(data) + 2  # content rows + top/bottom padding rows
	    row_height_in = USABLE_HEIGHT_IN / total_grid_rows
	    font_size_pt = (row_height_in * 72) * 0.9  # 1 inch = 72 points
	    content_font = get_font(font_size_pt)
	    date_font = get_font(12)

	    # --- 3. Column widths ---
	    col_widths_in = _measure_column_widths(
	        data, columns, content_font, (A4_WIDTH_IN, A4_HEIGHT_IN)
	    )
	    total_width_in = sum(col_widths_in)
	    scale_factor = USABLE_WIDTH_IN / total_width_in if total_width_in > 0 else 1
	    if scale_factor < 1:
	        # The columns are about to be narrowed; shrink the text with them,
	        # otherwise it would spill over the cell borders.
	        content_font.set_size(font_size_pt * scale_factor)
	    # Column widths as fractions of the axes width (they sum to 1).
	    col_fracs = [w * scale_factor / USABLE_WIDTH_IN for w in col_widths_in]

	    # --- 4. Draw once, export twice ---
	    fig = plt.figure(figsize=(A4_WIDTH_IN, A4_HEIGHT_IN), dpi=300)
	    try:
	        # The axes cover exactly the usable area inside the page margins.
	        ax = fig.add_axes([
	            MARGIN_IN / A4_WIDTH_IN, MARGIN_IN / A4_HEIGHT_IN,
	            USABLE_WIDTH_IN / A4_WIDTH_IN, USABLE_HEIGHT_IN / A4_HEIGHT_IN,
	        ])
	        ax.axis('off')
	        _draw_schedule_grid(
	            ax, data, columns, col_fracs, total_grid_rows,
	            date_str, content_font, date_font,
	        )
	        image_base64 = _figure_to_base64(fig, 'png')
	        pdf_base64 = _figure_to_base64(fig, 'pdf')
	    finally:
	        # Always release the figure, even when drawing or saving fails.
	        plt.close(fig)

	    return {
	        'png': f"data:image/png;base64,{image_base64}",
	        'pdf': f"data:application/pdf;base64,{pdf_base64}"
	    }


	def _measure_column_widths(data, columns, font, figsize):
	    """Return, per column, the widest rendered entry in inches plus 10% padding."""
	    fig = plt.figure(figsize=figsize)
	    try:
	        renderer = FigureCanvasAgg(fig).get_renderer()
	        widths_in = []
	        for col in columns:
	            widest_px = 0.0
	            # Measure every distinct value: the string with the most
	            # characters is not necessarily the widest one when rendered.
	            for value in data[col].astype(str).unique():
	                label = fig.text(0, 0, value, fontproperties=font)
	                widest_px = max(widest_px, label.get_window_extent(renderer=renderer).width)
	                label.remove()
	            widths_in.append(widest_px / fig.dpi * 1.1)
	        return widths_in
	    finally:
	        plt.close(fig)


	def _draw_schedule_grid(ax, data, columns, col_fracs, total_grid_rows,
	                        date_str, content_font, date_font):
	    """Draw the date label, cell texts and grid lines on `ax` in axes coordinates."""
	    row_height_ax = 1.0 / total_grid_rows
	    x_edges = [0] + np.cumsum(col_fracs).tolist()
	    y_edges = [1 - i * row_height_ax for i in range(total_grid_rows + 1)]

	    # Date string just above the top-left corner of the usable area.
	    ax.text(0, 1, date_str, transform=ax.transAxes, fontproperties=date_font,
	            ha='left', va='bottom', color='#A9A9A9')

	    # Content rows: position 0 sits directly below the top padding row.
	    rows = data[columns].itertuples(index=False, name=None)
	    for position, cells in enumerate(rows):
	        y_bottom = y_edges[position + 2]
	        y_center = y_bottom + row_height_ax / 2

	        # Dotted line along the bottom of the row.
	        ax.plot([0, 1], [y_bottom, y_bottom], transform=ax.transAxes,
	                linestyle=':', color='gray', linewidth=0.7)

	        for j, content in enumerate(cells):
	            x_center = x_edges[j] + col_fracs[j] / 2
	            ax.text(x_center, y_center, content, transform=ax.transAxes,
	                    fontproperties=content_font, ha='center', va='center')

	    # Dotted vertical lines between columns, spanning the content rows only.
	    content_top_y = y_edges[1]
	    content_bottom_y = y_edges[-2]
	    for x in x_edges[1:-1]:
	        ax.plot([x, x], [content_bottom_y, content_top_y], transform=ax.transAxes,
	                linestyle=':', color='gray', linewidth=0.7)

	    # Solid black line under the last row of every hall (including the final row).
	    is_last_of_hall = (data['Hall'] != data['Hall'].shift(-1)).to_numpy()
	    for position in np.flatnonzero(is_last_of_hall):
	        y_line = y_edges[position + 2]  # +1 for the padding row, +1 for the row's bottom edge
	        ax.plot([0, 1], [y_line, y_line], transform=ax.transAxes,
	                linestyle='-', color='black', linewidth=1.2)


	def _figure_to_base64(fig, fmt):
	    """Save `fig` in format `fmt` to memory and return the bytes base64-encoded."""
	    buffer = io.BytesIO()
	    fig.savefig(buffer, format=fmt, pad_inches=0)
	    return base64.b64encode(buffer.getvalue()).decode()

	def display_pdf(base64_pdf):
	    """
	    Build the HTML iframe snippet that embeds a PDF in the Streamlit page.

	    `base64_pdf` is inserted verbatim as the iframe's `src` attribute; the
	    markup is returned as a string and is not rendered here.
	    """
	    iframe_attrs = f'src="{base64_pdf}" width="100%" height="800" type="application/pdf"'
	    return f'<iframe {iframe_attrs}></iframe>'

	# --- Streamlit App Main Body ---
	# Page setup, file upload, then either a PDF/PNG preview or a status message.
	st.set_page_config(page_title="LED 屏幕时间表打印", layout="wide")
	st.title("LED 屏幕时间表打印")

	uploaded_file = st.file_uploader("选择打开【放映时间核对表.xls】文件", type=["xls"])

	if uploaded_file:
	    with st.spinner("文件正在处理中，请稍候..."):
	        schedule, date_str = process_schedule(uploaded_file)

	        if schedule is None:
	            # Processing failed or produced no schedule object.
	            st.error("无法处理文件，请检查文件格式或内容是否正确。")
	        elif schedule.empty:
	            # Processing succeeded but no valid rows were found.
	            st.warning("处理完成，但文件中没有找到有效的排片数据。")
	        else:
	            output = create_print_layout(schedule, date_str)
	            if not output:
	                st.error("生成打印布局失败。")
	            else:
	                # Tabs to switch between the PDF and the PNG preview.
	                pdf_tab, png_tab = st.tabs(["PDF 预览", "PNG 预览"])

	                with pdf_tab:
	                    st.markdown(display_pdf(output['pdf']), unsafe_allow_html=True)

	                with png_tab:
	                    st.image(output['png'], use_container_width=True)