VisualiseCroatian

Runtime error

File size: 3,248 Bytes

import gradio as gr
import random
import nltk
from nltk.corpus import wordnet

import requests

# Download the Croatian WordNet data
nltk.download("wordnet")
nltk.download("omw")
nltk.download("omw-1.4")



# Function to get the English WordNet synset ID for a Croatian word
def get_english_synset_id(croatian_word):
    # Convert the Croatian word to English WordNet synset IDs
    synsets = wordnet.synsets(croatian_word, lang="hrv")
    
    # Check if any synsets were found
    if synsets:
        # Take the first synset (you can modify this to handle multiple synsets if needed)
        english_synset_id = synsets[0].name()
        return english_synset_id
    else:
        return None
        
# Function to get definitions and images from web
def get_definition_and_image(word):
    # try:
    #     # You may need to adjust this URL based on the source of definitions and images
    #     url = f"https://your-dictionary-website.com/{word}"
    #     response = requests.get(url)
    #     soup = BeautifulSoup(response.text, "html.parser")

    #     # Extract definition and image (assuming they are in specific HTML elements)
    #     definition = soup.find("div", {"class": "definition"}).text
    #     image_url = soup.find("img", {"class": "word-image"})["src"]

    #     return definition, image_url
    # except Exception as e:
    #     return None, None
    
    
    # Define the WordNet synset ID for the concept you're interested in
    synset_id =  get_english_synset_id(word) #"n07753592"  # Replace with the synset ID you want
    
    # URL for the ImageNet API
    base_url = "http://www.image-net.org/api/text/imagenet.synset.geturls?wnid="
    
    # Combine the base URL and the synset ID to get a list of image URLs
    url = base_url + synset_id
    
    # Send a GET request to the URL
    response = requests.get(url)
    
    if response.status_code == 200:
        # Parse the response to get a list of image URLs
        image_urls = response.text.splitlines()
        
        # Print the first 10 image URLs
        for i, url in enumerate(image_urls[:10], start=1):
            print(f"Image {i}: {url}")
    else:
        print(f"Failed to retrieve image URLs. Status code: {response.status_code}")

# Function to randomly sample a noun or verb
def sample_word_and_display_info():
    is_noun = random.choice([True, False])  # Randomly choose noun or verb
    if is_noun:
        pos = "n"
    else:
        pos = "v"

    # Get a random word of the chosen part of speech from the Croatian WordNet
    word = random.choice(wordnet.all_lemma_names(pos, lang="hrv"))
    
    # Get the definition and image (change the function for your source)
    definition, image_url = get_definition_and_image(word)

    if definition and image_url:
        print(f"Word: {word}")
        print(f"Part of speech: {'Noun' if is_noun else 'Verb'}")
        print(f"Definition: {definition}")
        print(f"Image URL: {image_url}")
        return image_url ,definition
    else:
        print(f"No information found for '{word}'")
        return none,none



def sample():
    return sample_word_and_display_info()
    

iface = gr.Interface(fn=sample, inputs="text", outputs="image, text")
iface.launch()