Spaces:

SreekarB
/

SLPAnalysis

Sleeping

File size: 21,489 Bytes

import gradio as gr
import json
import os
import logging
import requests

# Configure logging
logging.basicConfig(level=logging.INFO)
logger = logging.getLogger(__name__)

# Anthropic API key - can be set as HuggingFace secret or environment variable
ANTHROPIC_API_KEY = os.getenv("ANTHROPIC_API_KEY", "")

# Check if API key is available
if ANTHROPIC_API_KEY:
    logger.info("Claude API key found")
else:
    logger.warning("Claude API key not found - using demo mode")

def call_claude_api(prompt):
    """Call Claude API directly"""
    if not ANTHROPIC_API_KEY:
        return "❌ Claude API key not configured. Please set ANTHROPIC_API_KEY environment variable."
    
    try:
        headers = {
            "Content-Type": "application/json",
            "x-api-key": ANTHROPIC_API_KEY,
            "anthropic-version": "2023-06-01"
        }
        
        data = {
            "model": "claude-3-5-sonnet-20241022",
            "max_tokens": 4096,
            "messages": [
                {
                    "role": "user",
                    "content": prompt
                }
            ]
        }
        
        response = requests.post(
            "https://api.anthropic.com/v1/messages",
            headers=headers,
            json=data,
            timeout=60
        )
        
        if response.status_code == 200:
            response_json = response.json()
            return response_json['content'][0]['text']
        else:
            logger.error(f"Claude API error: {response.status_code} - {response.text}")
            return f"❌ Claude API Error: {response.status_code}"
            
    except Exception as e:
        logger.error(f"Error calling Claude API: {str(e)}")
        return f"❌ Error: {str(e)}"

def process_file(file):
    """Process uploaded file"""
    if file is None:
        return "Please upload a file first."
    
    try:
        # Read file content
        with open(file.name, 'r', encoding='utf-8', errors='ignore') as f:
            content = f.read()
        
        if not content.strip():
            return "File appears to be empty."
            
        return content
    except Exception as e:
        return f"Error reading file: {str(e)}"

def analyze_transcript(file, age, gender, slp_notes):
    """Simple CASL analysis"""
    if file is None:
        return "Please upload a transcript file first."
    
    # Get transcript content
    transcript = process_file(file)
    if transcript.startswith("Error") or transcript.startswith("Please"):
        return transcript
    
    # Add SLP notes to the prompt if provided
    notes_section = ""
    if slp_notes and slp_notes.strip():
        notes_section = f"""
    
    SLP CLINICAL NOTES:
    {slp_notes.strip()}
    """
    
    # Simple analysis prompt
    def analyze_transcript(file, age, gender):
    """Simple CASL analysis"""
    if file is None:
        return "Please upload a transcript file first."
    
    # Get transcript content
    transcript = process_file(file)
    if transcript.startswith("Error") or transcript.startswith("Please"):
        return transcript
    
# Provide the instructions for analyzing the transcript
    instructions = f"""
    
    
    
    Each domain from the CASL-2 framework can be analyzed using the sample:
    
    Lexical/Semantic Skills:
    
    This category focuses on vocabulary knowledge, word meanings, and the ability to use words contextually. It measures both receptive and expressive language abilities related to word use.
    
    Key Subtests:
    
    Antonyms: Identifying words with opposite meanings.
    Synonyms: Identifying words with similar meanings.
    Idiomatic Language: Understanding and interpreting idioms and figurative language.
    
    Evaluate vocabulary diversity (type-token ratio).
    Note word-finding difficulties, incorrect word choices, or over-reliance on fillers (e.g., “like,” “stuff”).
    Assess use of specific vs. vague language (e.g., "car" vs. "sedan").
    
    Syntactic Skills:
    
    This category evaluates understanding and use of grammar and sentence structure. It focuses on the ability to comprehend and produce grammatically correct sentences.
    
    Key Subtests:
    
    Sentence Expression: Producing grammatically correct sentences based on prompts.
    Grammaticality Judgment: Identifying whether a sentence is grammatically correct.
    
    Examine sentence structure for grammatical accuracy.
    Identify errors in verb tense, subject-verb agreement, or sentence complexity.
    Note the use of clauses, conjunctions, and varied sentence types.
    
    
    Supralinguistic Skills:
    
    This subcategory assesses higher-level language skills that go beyond literal meanings, such as understanding implied meanings, sarcasm, and complex verbal reasoning.
    
    Key Subtests:
    
    Inferences: Understanding information that is not explicitly stated.
    Meaning from Context: Deriving meaning from surrounding text or dialogue.
    Nonliteral Language: Interpreting figurative language, such as metaphors or irony
    
    Look for use or understanding of figurative language, idioms, or humor.
    Assess ability to handle ambiguous or implied meanings in context.
    Identify advanced language use for abstract or hypothetical ideas.
    
    
    Pragmatic Skills(focus less on this as it is not typically necessary for the age range you will be dealing with):
    This category measures the ability to use language effectively in social contexts. It evaluates understanding of conversational rules, turn-taking, and adapting communication to different social situations.
    
    Key Subtests:
    
    Pragmatic Language Test: Assessing appropriateness of responses in social scenarios.
    
    
    Observe turn-taking, topic maintenance, and conversational appropriateness.
    Note use of politeness, tone, or adapting language to the listener.
    Evaluate narrative coherence in storytelling or recounting events.
    
    
    Quantitative Analysis:
    Count errors (e.g., grammatical, lexical) and divide by total utterances to calculate error rates.
    Measure Mean Length of Utterance (MLU) to gauge syntactic complexity.
    Count the variety of unique words for vocabulary richness.
    
    
    Qualitative Analysis:
    Assess the appropriateness and sophistication of responses for the individual’s age.
    Evaluate overall fluency, coherence, and adaptability in communication.
    1. Lexical/Semantic Analysis
    Objective: Evaluate vocabulary diversity, word meaning, and contextual usage.
    LLM Process:
    
    Word Diversity:
    Calculate the type-token ratio (TTR): Divide the number of unique words by the total number of words to estimate vocabulary richness.
    Identify repetition and overuse of basic words.
    Word Appropriateness:
    Analyze context to determine if words are used accurately (e.g., "big" for "large" vs. incorrect substitutions).
    Idiomatic Language:
    Detect use of idioms, metaphors, or figurative expressions.
    Assess whether these expressions are used and interpreted correctly within the speech.
    Scoring:
    
    Assign scores based on TTR thresholds and the presence of appropriately used advanced vocabulary or idiomatic language.
    2. Syntactic Analysis
    Objective: Assess grammatical accuracy, sentence complexity, and variety.
    LLM Process:
    
    Grammar Checking:
    Identify grammatical errors (e.g., incorrect verb tense, subject-verb disagreement, missing articles).
    Sentence Complexity:
    Calculate the mean length of utterance (MLU): Average the number of morphemes per sentence.
    Count clauses, conjunctions, and use of complex structures (e.g., relative clauses).
    Error Patterns:
    Note recurring syntactic errors or simplified constructions indicative of developmental or functional delays.
    Scoring:
    
    Base scores on error frequency, MLU, and the proportion of complex vs. simple sentences.
    3. Supralinguistic Analysis
    Objective: Evaluate understanding and use of abstract, implied, or nonliteral language.
    LLM Process:
    
    Inference Detection:
    Analyze whether the speaker makes logical inferences or responds appropriately to indirect prompts (e.g., "Why do you think they did that?" requiring contextual reasoning).
    Nonliteral Language:
    Detect use or interpretation of figurative expressions, idioms, or sarcasm.
    Contextual Adaptation:
    Assess whether the speaker adjusts their language based on the situation or implied meaning.
    Scoring:
    
    Assign points for accurate interpretations of implied meanings and use of nonliteral language.
    4. Pragmatic Analysis
    Objective: Assess social communication and appropriateness in interactions.
    
    
    LLM Process:
    
    Turn-Taking and Topic Maintenance:
    Evaluate whether the speaker follows conversational rules, including turn-taking and staying on topic.
    Social Cues:
    Analyze how well the speaker uses language to match the context (e.g., formal vs. informal speech).
    Clarity and Politeness:
    Assess the appropriateness of language for the audience and situation (e.g., clarity, tone, politeness).
    Scoring:
    
    Base scores on observed appropriateness and adherence to conversational norms.
    5. Overall Scoring
    Objective: Aggregate scores for all categories to estimate a composite language ability.
    LLM Process:
    
    Normalize subcategory scores based on predefined thresholds (e.g., raw scores from lexical, syntactic, supralinguistic, and pragmatic categories).
    Combine normalized scores to calculate an estimated General Language Ability Index (GLAI).
    Implementation Workflow
    Input:
    Provide the LLM with a transcribed spontaneous speech sample.
    Include metadata (e.g., speaker’s age, context of the conversation).
    Processing:
    Use predefined scoring rubrics to analyze lexical, syntactic, supralinguistic, and pragmatic features in the transcript.
    Output:
    Generate scores for each subcategory.
    Offer a detailed breakdown explaining how each score was derived.
    Summarize results with an estimated composite score and percentile rank.
    
    
    The CASL-2 provides descriptive scores for each subcategory and subtest to help interpret an individual's performance relative to age-based norms. These descriptive scores are based on the standard scores and are typically categorized into qualitative performance levels. Here’s an overview of how the descriptive scores are generally aligned for each subcategory and subtest:
    
    Descriptive Score Levels
    Each subcategory or subtest score typically falls into one of these descriptive ranges based on the standard score:
    
    Standard Score Range	Descriptive Label
    131 and above	Very Superior
    121–130	Superior
    111–120	Above Average
    90–110	Average
    80–89	Below Average
    70–79	Poor
    Below 70	Very Poor
    Descriptive Scores for Each Subcategory
    1. Lexical/Semantic
    Reflects vocabulary knowledge, word usage, and ability to interpret word relationships.
    Descriptive labels are based on scores from subtests like Antonyms, Synonyms, and Idiomatic Language.
    2. Syntactic
    Evaluates grammar and sentence structure understanding.
    Descriptive scores use results from subtests such as Sentence Expression and Grammaticality Judgment.
    3. Supralinguistic
    Represents higher-order language comprehension, such as nonliteral and abstract meanings.
    Descriptive labels are derived from subtests like Inferences, Meaning from Context, and Nonliteral Language.
    4. Pragmatic
    Measures social language use, including conversational appropriateness and adaptability.
    Descriptive scores come from the Pragmatic Language Test.
    5. General Language Ability Index (GLAI)
    Composite score representing overall spoken language competence.
    Combines scaled scores from various subtests into one standard score, interpreted using the same descriptive range.
    Percentile Ranks
    In addition to descriptive scores, CASL-2 provides percentile ranks to indicate the proportion of individuals in the normative sample who scored lower than the test-taker. For example:
    
    A standard score of 100 corresponds to the 50th percentile (average performance).
    A score of 85 corresponds to the 16th percentile (below average).
    
    """

# Format the answer
    answer_format = f"""
Template for LLM Output: CASL-2 Analysis from Spontaneous Speech Sample
    1. Introduction
    Provide a brief overview of the analysis, including context and objectives.
    Example:
    "This analysis evaluates the spoken language abilities of the individual based on a transcribed spontaneous speech sample. The results are categorized into the CASL-2 subcategories: Lexical/Semantic, Syntactic, Supralinguistic, Pragmatic, and Overall Language Ability."
    
    2. Lexical/Semantic Analysis
    Describe findings related to vocabulary, word meanings, and contextual usage.
    
    Word Diversity (Type-Token Ratio):
    Example: The speaker used 80 unique words out of 200 total words, resulting in a TTR of 0.4, indicating moderate vocabulary richness.
    
    Word Appropriateness:
    Example: Most words were used correctly within context, though advanced vocabulary or synonyms were limited.
    
    Idiomatic and Figurative Language:
    Example: No idiomatic expressions or figurative language were observed.
    
    Score: X/5
    3. Syntactic Analysis
    Evaluate grammatical accuracy, sentence complexity, and structure.
    
    Grammatical Accuracy:
    Example: The speech contained 3 grammatical errors, such as incorrect verb tense usage ("I goed to the park").
    
    Sentence Complexity (Mean Length of Utterance):
    Example: The mean length of utterance (MLU) was 5.2 words, indicating a preference for simple sentences.
    
    Error Patterns:
    Example: Frequent omissions of articles and auxiliary verbs.
    
    Score: X/5
    4. Supralinguistic Analysis
    Assess abstract and nonliteral language skills.
    
    Inference Making:
    Example: The speaker demonstrated minimal ability to infer meaning, as responses were literal and lacked contextual reasoning.
    
    Nonliteral Language:
    Example: No use or understanding of idioms, metaphors, or sarcasm was observed.
    
    Contextual Adaptation:
    Example: The speaker’s responses were appropriate to the conversation but lacked depth.
    
    Score: X/5
    5. Pragmatic Analysis
    Examine social communication skills and conversational appropriateness.
    
    Turn-Taking:
    Example: The speaker effectively took turns but occasionally interrupted the conversational flow.
    
    Topic Maintenance:
    Example: The speaker maintained the topic but struggled with cohesive transitions.
    
    Social Appropriateness:
    Example: Responses were contextually appropriate but lacked expressive variation.
    
    Score: X/5
    6. Overall Language Ability
    Summarize the composite score and provide insights.
    
    Composite Score (Estimated):
    Example: The composite score, derived from subcategory averages, is 3.0/5, indicating below-average language abilities relative to peers.
    
    Percentile Rank:
    Example: Based on performance, the speaker falls in the 30th percentile for their age group.
    
    Key Strengths:
    Example: The speaker exhibited strong topic maintenance and grammatical accuracy for simple sentences.
    
    Areas for Improvement:
    Example: Vocabulary diversity, sentence complexity, and inference-making skills require development.
    
    Please provide a CASL analysis including:
    
    1. SPEECH FACTORS (with counts and severity):
    - Difficulty producing fluent speech
    - Word retrieval issues  
    - Grammatical errors
    - Repetitions and revisions
    
    2. CASL SKILLS ASSESSMENT:
    - Lexical/Semantic Skills (Standard Score, Percentile, Level)
        - Syntactic Skills (Standard Score, Percentile, Level)
        - Supralinguistic Skills (Standard Score, Percentile, Level)
        
        3. TREATMENT RECOMMENDATIONS:
        - List 3-5 specific intervention strategies
        
        4. CLINICAL SUMMARY:
        - Brief explanation of findings and prognosis
        
        Use exact quotes from the transcript as evidence.
        Provide realistic standard scores (70-130 range, mean=100).
        """
    
    prompt = f"""
    
        
    You are a speech pathologist, a healthcare professional who specializes in evaluating, diagnosing, and treating communication disorders, including speech, language, cognitive-communication, voice, swallowing, and fluency disorders. Your role is to help patients improve their speech and communication skills through various therapeutic techniques and exercises.
    
    In this scenario, you will be working with a patient who has the following speech disorder or issue:
    
    Autism Spectrum Disorder - Demographics  Patient: {age}-year-old {gender}
    
    A speech-language pathologist (SLP) working in schools plays a vital role in supporting students with autism spectrum disorder (ASD). These professionals focus on helping students develop the communication skills they need to succeed academically, socially, and emotionally. Communication challenges are a common characteristic of ASD, and SLPs are uniquely equipped to address them with specialized knowledge and strategies.
    
    SLPs working with students with ASD begin by assessing their communication abilities, including their use of verbal and nonverbal language. This evaluation may involve observing how the student interacts with peers and teachers, understanding their use of gestures, facial expressions, or other forms of communication, and identifying areas for improvement. Based on the assessment, the SLP creates an individualized treatment plan tailored to the student’s specific needs.
    
    Interventions often focus on improving social communication skills, such as taking turns in conversation, understanding and using eye contact, recognizing emotions in others, and maintaining appropriate topics during discussions. For students with limited verbal abilities, the SLP may introduce augmentative and alternative communication (AAC) tools, such as picture exchange systems or speech-generating devices, to help them express themselves effectively.
    
    Here is a sample dialogue between you and the patient:
    
    <dialogue>
        
        TRANSCRIPT:
        {transcript}
    </dialogue>
    
    Based on the information provided, please do the following:
    
    {instructions}
    Do this using {answer_format}
    
    Remember, your goal is to provide a comprehensive and supportive therapy experience for the patient, helping them to improve their speech and communication skills and build their confidence in the process. Use your expertise and empathy to guide them through this journey.
    
        """
        
    # Get analysis from Claude API
    result = call_claude_api(prompt)
    return result

    
    # Get analysis from Claude API
    result = call_claude_api(prompt)
    return result

# Create simple interface
with gr.Blocks(title="Simple CASL Analysis", theme=gr.themes.Soft()) as app:
    
    gr.Markdown("# 🗣️ Simple CASL Analysis Tool")
    gr.Markdown("Upload a speech transcript and get instant CASL assessment results.")
    
    with gr.Row():
        with gr.Column():
            gr.Markdown("### Upload & Settings")
            
            file_upload = gr.File(
                label="Upload Transcript File",
                file_types=[".txt", ".cha"]
            )
            
            age = gr.Number(
                label="Patient Age", 
                value=8, 
                minimum=1, 
                maximum=120
            )
            
            gender = gr.Radio(
                ["male", "female", "other"], 
                label="Gender", 
                value="male"
            )
            
            slp_notes = gr.Textbox(
                label="SLP Clinical Notes (Optional)",
                placeholder="Enter any additional clinical observations, context, or notes...",
                lines=3
            )
            
            analyze_btn = gr.Button(
                "🔍 Analyze Transcript", 
                variant="primary"
            )
        
        with gr.Column():
            gr.Markdown("### Analysis Results")
            
            output = gr.Textbox(
                label="CASL Analysis Report",
                placeholder="Analysis results will appear here...",
                lines=25,
                max_lines=30
            )
    
    # Connect the analyze button
    analyze_btn.click(
        analyze_transcript,
        inputs=[file_upload, age, gender, slp_notes],
        outputs=[output]
    )

if __name__ == "__main__":
    print("🚀 Starting Simple CASL Analysis Tool...")
    if not ANTHROPIC_API_KEY:
        print("⚠️  ANTHROPIC_API_KEY not configured - analysis will show error message")
        print("   For HuggingFace Spaces: Add ANTHROPIC_API_KEY as a secret in your space settings")
        print("   For local use: export ANTHROPIC_API_KEY='your-key-here'")
    else:
        print("✅ Claude API configured")
    
    app.launch(show_api=False)