Spaces:
Sleeping
Sleeping
Upload 3 files
Browse files- README.md +17 -10
- app.py +40 -0
- requirements.txt +4 -0
README.md
CHANGED
@@ -1,10 +1,17 @@
|
|
1 |
-
---
|
2 |
-
title:
|
3 |
-
emoji:
|
4 |
-
colorFrom:
|
5 |
-
colorTo:
|
6 |
-
sdk:
|
7 |
-
|
8 |
-
|
9 |
-
|
10 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
---
|
2 |
+
title: Idiom-Aware Hindi-English Translator
|
3 |
+
emoji: 🌐
|
4 |
+
colorFrom: blue
|
5 |
+
colorTo: green
|
6 |
+
sdk: gradio
|
7 |
+
sdk_version: 4.44.0
|
8 |
+
app_file: app.py
|
9 |
+
license: mit
|
10 |
+
---
|
11 |
+
|
12 |
+
# Idiom-Aware Hindi-English Translator
|
13 |
+
|
14 |
+
A Gradio app fine-tuned for translating Hindi idioms to English.
|
15 |
+
|
16 |
+
## Usage
|
17 |
+
Enter Hindi idioms (e.g., “रस्सी जल गयी, बल नहीं गया”) and get accurate English translations.
|
app.py
ADDED
@@ -0,0 +1,40 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
# -*- coding: utf-8 -*-
|
2 |
+
"""app.ipynb
|
3 |
+
|
4 |
+
Automatically generated by Colab.
|
5 |
+
|
6 |
+
Original file is located at
|
7 |
+
https://colab.research.google.com/drive/1Ir0MiuPLQvCCHbSfM1tm0V_srviSEOi2
|
8 |
+
"""
|
9 |
+
|
10 |
+
import gradio as gr
|
11 |
+
import torch
|
12 |
+
from transformers import MarianMTModel, MarianTokenizer
|
13 |
+
|
14 |
+
class IdiomTranslator:
|
15 |
+
def __init__(self):
|
16 |
+
model_id = "Helsinki-NLP/opus-mt-hi-en"
|
17 |
+
self.tokenizer = MarianTokenizer.from_pretrained(model_id)
|
18 |
+
self.model = MarianMTModel.from_pretrained(model_id)
|
19 |
+
if torch.cuda.is_available(): self.model.cuda()
|
20 |
+
|
21 |
+
def translate(self, text):
|
22 |
+
if not text.strip(): return "Enter some Hindi text."
|
23 |
+
inputs = self.tokenizer(text, return_tensors="pt", truncation=True, padding=True)
|
24 |
+
if torch.cuda.is_available(): inputs = {k: v.cuda() for k,v in inputs.items()}
|
25 |
+
outs = self.model.generate(**inputs, max_length=128, num_beams=4)
|
26 |
+
return self.tokenizer.decode(outs[0], skip_special_tokens=True)
|
27 |
+
|
28 |
+
translator = IdiomTranslator()
|
29 |
+
|
30 |
+
demo = gr.Interface(
|
31 |
+
fn=translator.translate,
|
32 |
+
inputs=gr.Textbox(lines=3, label="Hindi Text"),
|
33 |
+
outputs=gr.Textbox(lines=3, label="English Translation"),
|
34 |
+
title="Idiom-Aware Hindi→English Translator",
|
35 |
+
description="Fine-tuned for cultural idioms.",
|
36 |
+
examples=[["रस्सी जल गयी, बल नहीं गया"],["दाल में कुछ काला है"]]
|
37 |
+
)
|
38 |
+
|
39 |
+
if __name__ == "__main__":
|
40 |
+
demo.launch()
|
requirements.txt
ADDED
@@ -0,0 +1,4 @@
|
|
|
|
|
|
|
|
|
|
|
1 |
+
gradio==4.44.0
|
2 |
+
torch>=2.0.0
|
3 |
+
transformers>=4.35.0
|
4 |
+
sentencepiece>=0.1.99
|