HF_RepoSense

Sleeping

HF_RepoSense / test.py

new_llm

9a88164 5 months ago

806 Bytes

	"""This simple script shows how to interact with an OpenAI-compatible server from a client."""

	# import argparse

	# import modal
	from openai import OpenAI
	import os

	# Resolve the key up front. With api_key=None the OpenAI client falls back to
	# the OPENAI_API_KEY environment variable, which would send that unrelated
	# credential to the third-party host below; fail fast instead.
	api_key = os.getenv("modal_api")
	if not api_key:
	    raise SystemExit(
	        "Environment variable 'modal_api' is not set; "
	        "it must hold the API key for the OpenAI-compatible server."
	    )

	# Point the client at the OpenAI-compatible endpoint rather than the default
	# api.openai.com by passing base_url at construction time.
	client = OpenAI(
	    api_key=api_key,
	    base_url="https://alexprincecursor--example-vllm-openai-compatible-serve.modal.run/v1/",
	)

	# Send one system + user exchange and print the text of the first choice.
	response = client.chat.completions.create(
	    # NOTE(review): presumably this must match the model id the server is
	    # serving; it is a quantized Llama 3.1 8B checkpoint, not a GPT model.
	    model="neuralmagic/Meta-Llama-3.1-8B-Instruct-quantized.w4a16",
	    messages=[
	        {"role": "system", "content": "You are a rockstar lyric generator. You are given a song and you need to generate a lyric for it."},
	        {"role": "user", "content":"The song is 'Bohemian Rhapsody' by Queen."},
	    ],
	    max_tokens=512,
	    temperature=0.7,
	)
	print(response.choices[0].message.content)