Spaces:
Running
Running
import pandas as pd | |
import streamlit as st | |
import matplotlib.pyplot as plt | |
import matplotlib.font_manager as font_manager | |
import io | |
import base64 | |
import os | |
from datetime import datetime, timedelta | |
from matplotlib.patches import Rectangle | |
from pypinyin import lazy_pinyin, Style | |
from matplotlib.backends.backend_pdf import PdfPages | |
# --- 字体设置 --- | |
def get_font(size=14): | |
"""根据操作系统环境查找并返回中文字体属性""" | |
font_path = "simHei.ttc" # 优先使用 simHei.ttc | |
if not os.path.exists(font_path): | |
font_path = "SimHei.ttf" # SimHei.ttf 作为备选 | |
# 如果两者都不存在,可以添加更多备选字体路径 | |
if not os.path.exists(font_path): | |
# for Windows | |
font_path = "C:/Windows/Fonts/simhei.ttf" | |
if not os.path.exists(font_path): | |
# for MacOS | |
font_path = "/System/Library/Fonts/STHeiti Medium.ttc" | |
# 如果仍然找不到,matplotlib会回退到默认字体 | |
return font_manager.FontProperties(fname=font_path, size=size) | |
# --- 拼音处理 --- | |
def get_pinyin_abbr(text): | |
"""获取文本前两个汉字的拼音首字母""" | |
if not text or not isinstance(text, str): | |
return "" | |
# 提取中文字符 | |
chars = [c for c in text if '\u4e00' <= c <= '\u9fff'] | |
# 取前两个汉字 | |
chars_to_process = chars[:2] | |
if not chars_to_process: | |
return "" | |
# 获取拼音首字母并转为大写 | |
pinyin_list = lazy_pinyin(chars_to_process, style=Style.FIRST_LETTER) | |
return ''.join(pinyin_list).upper() | |
# --- 数据处理 --- | |
def process_schedule(file): | |
"""读取并处理 Excel 文件,返回格式化的 DataFrame 和日期""" | |
try: | |
# 尝试读取日期 | |
date_df = pd.read_excel(file, header=None, skiprows=7, nrows=1, usecols=[3]) | |
date_str = pd.to_datetime(date_df.iloc[0, 0]).strftime('%Y-%m-%d') | |
base_date = pd.to_datetime(date_str).date() | |
except Exception: | |
# 读取失败则使用当天日期 | |
date_str = datetime.today().strftime('%Y-%m-%d') | |
base_date = datetime.today().date() | |
try: | |
# 读取排片数据 | |
df = pd.read_excel(file, header=9, usecols=[1, 2, 4, 5]) | |
df.columns = ['Hall', 'StartTime', 'EndTime', 'Movie'] | |
# 数据清洗 | |
df['Hall'] = df['Hall'].ffill() | |
df.dropna(subset=['StartTime', 'EndTime', 'Movie'], inplace=True) | |
df['Hall'] = df['Hall'].astype(str).str.extract(r'(\d+号)') | |
df.dropna(subset=['Hall'], inplace=True) | |
# 时间转换 | |
df['StartTime_dt'] = pd.to_datetime(df['StartTime'], format='%H:%M', errors='coerce').apply( | |
lambda t: t.replace(year=base_date.year, month=base_date.month, day=base_date.day) if pd.notnull(t) else t | |
) | |
df['EndTime_dt'] = pd.to_datetime(df['EndTime'], format='%H:%M', errors='coerce').apply( | |
lambda t: t.replace(year=base_date.year, month=base_date.month, day=base_date.day) if pd.notnull(t) else t | |
) | |
df.dropna(subset=['StartTime_dt', 'EndTime_dt'], inplace=True) | |
# 处理跨天结束时间 | |
df.loc[df['EndTime_dt'] < df['StartTime_dt'], 'EndTime_dt'] += timedelta(days=1) | |
df = df.sort_values(['Hall', 'StartTime_dt']) | |
# 合并同一影厅的连续相同影片 | |
merged_rows = [] | |
for _, group in df.groupby('Hall'): | |
group = group.sort_values('StartTime_dt') | |
current = None | |
for _, row in group.iterrows(): | |
if current is None: | |
current = row.copy() | |
else: | |
if row['Movie'] == current['Movie']: | |
current['EndTime_dt'] = row['EndTime_dt'] | |
else: | |
merged_rows.append(current) | |
current = row.copy() | |
if current is not None: | |
merged_rows.append(current) | |
if not merged_rows: | |
return None, date_str | |
merged_df = pd.DataFrame(merged_rows) | |
# 统一调整时间 | |
merged_df['StartTime_dt'] -= timedelta(minutes=10) | |
merged_df['EndTime_dt'] -= timedelta(minutes=5) | |
# 格式化最终输出的列 | |
merged_df['Time'] = merged_df['StartTime_dt'].dt.strftime('%H:%M') + ' - ' + merged_df['EndTime_dt'].dt.strftime('%H:%M') | |
merged_df['Pinyin'] = merged_df['Movie'].apply(get_pinyin_abbr) | |
merged_df['Hall'] = merged_df['Hall'].str.replace('号', '') | |
return merged_df[['Hall', 'Movie', 'Pinyin', 'Time']], date_str | |
except Exception as e: | |
st.error(f"处理 Excel 数据时发生错误: {e}") | |
return None, date_str | |
# --- 打印布局生成 --- | |
def create_print_layout(data, date_str): | |
"""根据处理好的数据,生成用于打印的 PNG 和 PDF 布局""" | |
if data is None or data.empty: | |
return None | |
A4_SIZE_INCHES = (8.27, 11.69) | |
DPI = 300 | |
# 准备一个临时的 figure 用于计算文本渲染尺寸 | |
temp_fig = plt.figure(figsize=A4_SIZE_INCHES, dpi=DPI) | |
renderer = temp_fig.canvas.get_renderer() | |
# 1. 计算行高 | |
num_movies = len(data) | |
num_halls = len(data['Hall'].unique()) | |
# 总行数 = 电影条目数 + 厅间分隔数 + 上下留白(2) | |
# total_layout_rows = num_movies + (num_halls - 1) + 2 | |
total_layout_rows = num_movies + 2 # 简化为条目数+2,使行高更宽松 | |
row_height_inch = A4_SIZE_INCHES[1] / total_layout_rows | |
# 2. 计算基准字体大小 (点) | |
# 1 point = 1/72 inch. | |
# 字体高度为行高的 90% | |
font_size_pt = row_height_inch * 0.9 * 72 | |
base_font = get_font(font_size_pt) | |
# 3. 计算各列宽度 (除电影名外) | |
def get_text_width_inch(text, font): | |
t = plt.text(0, 0, text, fontproperties=font) | |
bbox = t.get_window_extent(renderer=renderer) | |
width_pixels = bbox.width | |
t.remove() | |
return width_pixels / DPI | |
# 找到每列最长的内容 | |
data['Index'] = data.groupby('Hall').cumcount() + 1 | |
max_hall_str = data['Hall'].max() + "#" # e.g. "10#" | |
max_index_str = str(data['Index'].max()) + "." # e.g. "5." | |
max_pinyin_str = data['Pinyin'].apply(len).max() * "A" # e.g. "PY" -> "AA" | |
max_time_str = data['Time'].apply(len).idxmax() | |
max_time_str = data.loc[max_time_str, 'Time'] | |
col_widths = {} | |
col_widths['Hall'] = get_text_width_inch(max_hall_str, base_font) * 1.1 | |
col_widths['Index'] = get_text_width_inch(max_index_str, base_font) * 1.1 | |
col_widths['Pinyin'] = get_text_width_inch(max_pinyin_str, base_font) * 1.1 | |
col_widths['Time'] = get_text_width_inch(max_time_str, base_font) * 1.1 | |
# 电影名列的宽度为剩余宽度 | |
non_movie_width = sum(col_widths.values()) | |
col_widths['Movie'] = A4_SIZE_INCHES[0] - non_movie_width | |
plt.close(temp_fig) # 关闭临时figure | |
# --- 开始正式绘图 --- | |
figs = {} | |
for fmt in ['png', 'pdf']: | |
fig = plt.figure(figsize=A4_SIZE_INCHES, dpi=DPI) | |
ax = fig.add_subplot(111) | |
ax.set_axis_off() | |
fig.subplots_adjust(left=0, right=1, top=1, bottom=0) | |
ax.set_xlim(0, A4_SIZE_INCHES[0]) | |
ax.set_ylim(0, A4_SIZE_INCHES[1]) | |
# 计算列的 X 轴起始位置 | |
x_pos = {} | |
current_x = 0 | |
# 新顺序: Hall, Index, Movie, Pinyin, Time | |
col_order = ['Hall', 'Index', 'Movie', 'Pinyin', 'Time'] | |
for col in col_order: | |
x_pos[col] = current_x | |
current_x += col_widths[col] | |
# 从顶部开始绘制 (顶部留出一行空白) | |
current_y = A4_SIZE_INCHES[1] - row_height_inch | |
halls = sorted(data['Hall'].unique(), key=lambda h: int(h)) | |
for hall in halls: | |
hall_data = data[data['Hall'] == hall].sort_values('Index') | |
for _, row in hall_data.iterrows(): | |
y_bottom = current_y - row_height_inch | |
# 绘制单元格 | |
for col_name in col_order: | |
cell_x = x_pos[col_name] | |
cell_width = col_widths[col_name] | |
# 绘制灰色虚线边框 | |
rect = Rectangle((cell_x, y_bottom), cell_width, row_height_inch, | |
edgecolor='lightgray', facecolor='none', | |
linestyle=(0, (1, 2)), linewidth=0.8, zorder=1) | |
ax.add_patch(rect) | |
# 准备文本内容 | |
text_content = { | |
'Hall': f"{row['Hall']}#", | |
'Index': f"{row['Index']}.", | |
'Movie': row['Movie'], | |
'Pinyin': row['Pinyin'], | |
'Time': row['Time'] | |
}[col_name] | |
# 文本垂直居中 | |
text_y = y_bottom + row_height_inch / 2 | |
# 电影名列特殊处理 | |
if col_name == 'Movie': | |
font_to_use = base_font.copy() | |
# 检查宽度并调整字体 | |
text_w_inch = get_text_width_inch(text_content, font_to_use) | |
max_w_inch = cell_width * 0.9 # 目标宽度为单元格宽度的90% | |
if text_w_inch > max_w_inch: | |
scale_factor = max_w_inch / text_w_inch | |
font_to_use.set_size(font_size_pt * scale_factor) | |
ax.text(cell_x + cell_width * 0.05, text_y, text_content, # 左对齐 | |
fontproperties=font_to_use, ha='left', va='center', clip_on=True) | |
else: # 其他列 | |
ax.text(cell_x + cell_width / 2, text_y, text_content, # 居中对齐 | |
fontproperties=base_font, ha='center', va='center', clip_on=True) | |
current_y -= row_height_inch | |
# 在每个影厅块结束后绘制黑色分隔线 | |
ax.plot([0, A4_SIZE_INCHES[0]], [current_y, current_y], color='black', linewidth=1.5, zorder=2) | |
# 在左上角添加日期 | |
ax.text(0.1, A4_SIZE_INCHES[1] - 0.3, date_str, | |
fontproperties=get_font(12), color='gray', ha='left', va='top') | |
figs[fmt] = fig | |
# 保存到内存 | |
png_buffer = io.BytesIO() | |
figs['png'].savefig(png_buffer, format='png', dpi=DPI) | |
png_buffer.seek(0) | |
image_base64 = base64.b64encode(png_buffer.getvalue()).decode() | |
plt.close(figs['png']) | |
pdf_buffer = io.BytesIO() | |
figs['pdf'].savefig(pdf_buffer, format='pdf', dpi=DPI) | |
pdf_buffer.seek(0) | |
pdf_base64 = base64.b64encode(pdf_buffer.getvalue()).decode() | |
plt.close(figs['pdf']) | |
return { | |
'png': f"data:image/png;base64,{image_base64}", | |
'pdf': f"data:application/pdf;base64,{pdf_base64}" | |
} | |
# --- Streamlit UI --- | |
st.set_page_config(page_title="LED 屏幕时间表打印", layout="wide") | |
st.title("LED 屏幕时间表打印") | |
st.markdown("请上传影院系统导出的 `放映时间核对表.xls` 文件。系统将自动处理数据并生成专业、美观的A4打印布局。") | |
uploaded_file = st.file_uploader("选择文件", accept_multiple_files=False, type=["xls", "xlsx"]) | |
if uploaded_file: | |
with st.spinner("文件处理与布局生成中,请稍候..."): | |
schedule, date_str = process_schedule(uploaded_file) | |
if schedule is not None and not schedule.empty: | |
output = create_print_layout(schedule, date_str) | |
st.success(f"成功生成 **{date_str}** 的排片表!") | |
# 创建下载按钮 | |
col1, col2 = st.columns(2) | |
with col1: | |
st.download_button( | |
label="📥 下载 PNG 图像", | |
data=base64.b64decode(output['png'].split(',')[1]), | |
file_name=f"排片表_{date_str}.png", | |
mime="image/png" | |
) | |
with col2: | |
st.download_button( | |
label="📄 下载 PDF 文档", | |
data=base64.b64decode(output['pdf'].split(',')[1]), | |
file_name=f"排片表_{date_str}.pdf", | |
mime="application/pdf" | |
) | |
# 创建选项卡进行预览 | |
tab1, tab2 = st.tabs(["📄 PDF 预览", "🖼️ PNG 预览"]) | |
with tab1: | |
st.markdown(f'<iframe src="{output["pdf"]}" width="100%" height="800" type="application/pdf"></iframe>', unsafe_allow_html=True) | |
with tab2: | |
st.image(output['png'], use_container_width=True) | |
else: | |
st.error("无法处理文件。请检查文件内容是否为空或格式是否正确。确保文件中包含有效的排片数据。") |