File size: 1,669 Bytes
9779920
f931a9d
 
ff8f508
9779920
f931a9d
ff8f508
9876236
f931a9d
ff8f508
 
f931a9d
 
 
ff8f508
9876236
 
ff8f508
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
import pandas as pd
import requests
from io import BytesIO
import numpy as np

def analyze_excel(path_or_url: str) -> str:
    """Analysera Excel-fil och returnera detaljerad information"""
    try:
        if path_or_url.startswith("http"):
            response = requests.get(path_or_url, timeout=10)
            response.raise_for_status()
            df = pd.read_excel(BytesIO(response.content))
        else:
            df = pd.read_excel(path_or_url)
    
    except Exception as e:
        return f"Error reading Excel file: {e}"
    
    # Detaljerad analys
    analysis = []
    analysis.append(f"Rows: {df.shape[0]}, Columns: {df.shape[1]}")
    analysis.append(f"Column names: {', '.join(df.columns)}")
    
    # Datatyper
    numeric_cols = df.select_dtypes(include=[np.number]).columns.tolist()
    if numeric_cols:
        analysis.append(f"Numeric columns: {', '.join(numeric_cols)}")
        for col in numeric_cols:
            analysis.append(f"{col} - Sum: {df[col].sum():.2f}, Mean: {df[col].mean():.2f}, Max: {df[col].max():.2f}, Min: {df[col].min():.2f}")
    
    text_cols = df.select_dtypes(include=['object']).columns.tolist()
    if text_cols:
        analysis.append(f"Text columns: {', '.join(text_cols)}")
        for col in text_cols:
            unique_values = df[col].nunique()
            analysis.append(f"{col} - Unique values: {unique_values}")
            if unique_values <= 10:
                analysis.append(f"{col} values: {', '.join(map(str, df[col].unique()))}")
    
    # Första 3 raderna som exempel
    analysis.append("First 3 rows:")
    analysis.append(df.head(3).to_string())
    
    return "\n".join(analysis)