File size: 923 Bytes
188a2fe
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26

import re
import pandas as pd

def markdown_to_csv(llm_output):
    # Find all Markdown tables
    tables = re.findall(r"(\|(?:[^\n]+\|)+\n\|(?:\s*-+\s*\|)+\n(?:\|(?:[^\n]+\|)+\n)+)", llm_output)
    
    dataframes = []

    if tables:  # Ajouté pour éviter le 'NoneType' issue
        for table in tables:
            # Split lines and extract columns
            lines = table.strip().split("\n")
            headers = [col.strip() for col in lines[0].split("|")[1:-1]]  # Headers
            data_rows = [line.split("|")[1:-1] for line in lines[2:]]  # Ignore separator row

            # Clean and validate rows
            cleaned_data = [[col.strip() for col in row] for row in data_rows if len(row) == len(headers)]

            if cleaned_data:
                df = pd.DataFrame(cleaned_data, columns=headers)
                dataframes.append(df)

    return dataframes  # <- Corrigé : en dehors de la boucle