Spaces: Running on Zero

Update app.py

app.py CHANGED
@@ -3,7 +3,7 @@ import spaces
 from transformers import AutoModelForCausalLM, AutoTokenizer
 import torch
 
-model_name = "rubenroy/Zurich-
+model_name = "rubenroy/Zurich-14B-GCv2-5m"
 model = AutoModelForCausalLM.from_pretrained(
     model_name,
     torch_dtype=torch.bfloat16,
@@ -14,7 +14,7 @@ tokenizer = AutoTokenizer.from_pretrained(model_name)
 @spaces.GPU
 def generate(message, chat_history, temperature=0.7, top_p=0.9, top_k=50, max_new_tokens=512, repetition_penalty=1.1):
     messages = [
-        {"role": "system", "content": "You are Zurich, a
+        {"role": "system", "content": "You are Zurich, a 14 billion parameter Large Language model built on the Qwen 2.5 14B model developed by Alibaba Cloud, and fine-tuned by Ruben Roy. You have been fine-tuned with the GammaCorpus v2 dataset, a dataset filled with structured and filtered multi-turn conversations and was also created by Ruben Roy. You are a helpful assistant."},
         {"role": "user", "content": message}
     ]
     text = tokenizer.apply_chat_template(
@@ -112,10 +112,10 @@ TITLE_HTML = """
     <div style="display: flex; align-items: center; justify-content: center; gap: 1rem;">
         <h1 style="font-size: 2.5rem; font-weight: 800; margin: 0; background: linear-gradient(135deg, #60a5fa 0%, #93c5fd 100%); -webkit-background-clip: text; -webkit-text-fill-color: transparent;">Zurich</h1>
         <div style="width: 2px; height: 2.5rem; background: linear-gradient(180deg, #3b82f6 0%, #60a5fa 100%);"></div>
-        <p style="font-size: 1.25rem; color: #94a3b8; margin: 0;">GammaCorpus v2-
+        <p style="font-size: 1.25rem; color: #94a3b8; margin: 0;">GammaCorpus v2-5m</p>
     </div>
     <div class="info-section">
-        <span>Fine-tuned from <a href="https://huggingface.co/Qwen/Qwen2.5-
+        <span>Fine-tuned from <a href="https://huggingface.co/Qwen/Qwen2.5-14B-Instruct" class="info-link">Qwen 2.5 14B Instruct</a> | Model: <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-5m" class="info-link">Zurich-14B-GCv2-5m</a> | Training Dataset: <a href="https://huggingface.co/datasets/rubenroy/GammaCorpus-v2-5m" class="info-link">GammaCorpus v2 5m</a></span>
     </div>
 </div>
 
@@ -126,12 +126,12 @@ TITLE_HTML = """
         7B Models
     </h2>
     <div style="display: grid; grid-template-columns: repeat(2, 1fr); gap: 0.75rem;">
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-5m" class="model-btn">Zurich 7B GCv2 5m</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-1m" class="model-btn">Zurich 7B GCv2 1m</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-500k" class="model-btn">Zurich 7B GCv2 500k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-100k" class="model-btn">Zurich 7B GCv2 100k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-50k" class="model-btn">Zurich 7B GCv2 50k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-7B-GCv2-10k" class="model-btn">Zurich 7B GCv2 10k</a>
     </div>
 </div>
 <div class="model-section">
@@ -140,12 +140,12 @@ TITLE_HTML = """
         14B Models
     </h2>
     <div style="display: grid; grid-template-columns: repeat(2, 1fr); gap: 0.75rem;">
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
-        <a href="https://huggingface.co/
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-5m" class="model-btn">Zurich 14B GCv2 5m</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-1m" class="model-btn">Zurich 14B GCv2 1m</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-500k" class="model-btn">Zurich 14B GCv2 500k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-100k" class="model-btn">Zurich 14B GCv2 100k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-50k" class="model-btn">Zurich 14B GCv2 50k</a>
+        <a href="https://huggingface.co/rubenroy/Zurich-14B-GCv2-10k" class="model-btn">Zurich 14B GCv2 10k</a>
     </div>
 </div>
 </div>
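The two Python hunks above stop at apply_chat_template; the rest of the generate body lies outside the changed lines and is not shown in this diff. For orientation only, here is a minimal sketch of how such a ZeroGPU chat handler typically completes, reusing the model, tokenizer, and spaces objects defined at the top of app.py. The generation and decode steps below are standard transformers usage, not code taken from this Space, and the actual implementation may differ.

```python
# Hypothetical completion of generate(); the real body is not part of this diff.
@spaces.GPU  # requests a ZeroGPU slice for the duration of the call
def generate(message, chat_history, temperature=0.7, top_p=0.9, top_k=50,
             max_new_tokens=512, repetition_penalty=1.1):
    messages = [
        {"role": "system", "content": "You are Zurich, ..."},  # system prompt as in the hunk above
        {"role": "user", "content": message},
    ]
    # Render the conversation into a single prompt string using the model's chat template.
    text = tokenizer.apply_chat_template(
        messages, tokenize=False, add_generation_prompt=True
    )
    # Tokenize and move the tensors to the model's device.
    model_inputs = tokenizer([text], return_tensors="pt").to(model.device)
    # Sample a completion with the UI-controlled decoding parameters.
    generated_ids = model.generate(
        **model_inputs,
        do_sample=True,
        temperature=temperature,
        top_p=top_p,
        top_k=top_k,
        max_new_tokens=max_new_tokens,
        repetition_penalty=repetition_penalty,
    )
    # Drop the prompt tokens and decode only the newly generated text.
    generated_ids = [
        output[len(prompt):]
        for prompt, output in zip(model_inputs.input_ids, generated_ids)
    ]
    return tokenizer.batch_decode(generated_ids, skip_special_tokens=True)[0]
```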
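The remaining hunks only retitle the static TITLE_HTML header and repoint the model and dataset links at Zurich-14B-GCv2-5m. The signature of generate (message, chat_history, plus five decoding parameters) suggests the Space exposes those parameters as Gradio controls. A plausible sketch of that wiring is below, assuming a gr.ChatInterface with additional_inputs; the slider ranges, labels, and launch code are illustrative assumptions and do not appear in this diff.

```python
# Hypothetical Gradio wiring; labels and ranges are illustrative assumptions.
import gradio as gr

demo = gr.ChatInterface(
    fn=generate,  # ChatInterface calls fn(message, history, *additional_inputs)
    additional_inputs=[
        gr.Slider(0.0, 2.0, value=0.7, step=0.05, label="Temperature"),
        gr.Slider(0.0, 1.0, value=0.9, step=0.05, label="Top-p"),
        gr.Slider(1, 100, value=50, step=1, label="Top-k"),
        gr.Slider(16, 2048, value=512, step=16, label="Max new tokens"),
        gr.Slider(1.0, 2.0, value=1.1, step=0.05, label="Repetition penalty"),
    ],
)

if __name__ == "__main__":
    demo.launch()
```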