Rohit Rajpoot committed on
Commit
50a24ac
·
1 Parent(s): e08e8bd

reducing the tokens for faster generation on Hugging Face Spaces

Browse files
Files changed (2) hide show
  1. app.py +1 -1
  2. assist/main.py +2 -2
app.py CHANGED
@@ -81,7 +81,7 @@ with col2:
81
  # 2) generation (reduce tokens for now)
82
  out = deepseek_gen(
83
  f"Use these notes to answer:\n\n{context}\n\nQ: {title}\nA:",
84
- max_new_tokens=20,
85
  do_sample=False
86
  )
87
 
 
81
  # 2) generation (reduce tokens for now)
82
  out = deepseek_gen(
83
  f"Use these notes to answer:\n\n{context}\n\nQ: {title}\nA:",
84
+ max_new_tokens=10,
85
  do_sample=False
86
  )
87
 
assist/main.py CHANGED
@@ -13,8 +13,8 @@ def hello(name: str = "world"):
13
  def heatmap():
14
  """Show token-similarity heatmap from tensor.pt."""
15
  # import here so chat() doesn’t drag in sklearn
16
- from .heatmap import show_heatmap
17
- show_heatmap()
18
 
19
  @app.command()
20
  def chat(question: str = typer.Argument(..., help="Question to ask RepoSage")):
 
13
  def heatmap():
14
  """Show token-similarity heatmap from tensor.pt."""
15
  # import here so chat() doesn’t drag in sklearn
16
+ from .heatmap import get_heatmap_figure
17
+ get_heatmap_figure()
18
 
19
  @app.command()
20
  def chat(question: str = typer.Argument(..., help="Question to ask RepoSage")):