# DJStomp's picture
# Update app.py
# 2d5da20 verified
import spaces
import os
import gradio as gr
from huggingface_hub import InferenceClient
# Hugging Face API token; the Space must define HF_TOKEN (e.g. as a secret)
# for inference requests to authenticate. Fail fast at import time if missing.
hf_token = os.getenv("HF_TOKEN")
if not hf_token:
raise ValueError("HF_TOKEN is not set in environment variables!")
# Serverless Inference API client bound to the abliterated Llama 3.3 70B model.
client = InferenceClient(
model="huihui-ai/Llama-3.3-70B-Instruct-abliterated",
token=hf_token
)
@spaces.GPU(duration=65)
def respond(
    message,
    history: list[tuple[str, str]],
    system_message,
    max_tokens,
    temperature,
    top_p,
):
    """Stream a chat completion for *message* given the prior *history*.

    Args:
        message: Latest user message.
        history: Prior (user, assistant) turn pairs; empty sides are skipped.
        system_message: System prompt placed first in the conversation.
        max_tokens: Maximum number of new tokens to generate.
        temperature: Sampling temperature.
        top_p: Nucleus-sampling probability mass.

    Yields:
        The accumulated response text after each streamed token, or a single
        "Error: ..." string if the inference call fails.
    """
    messages = [{"role": "system", "content": system_message}]
    for user_turn, assistant_turn in history:
        if user_turn:
            messages.append({"role": "user", "content": user_turn})
        if assistant_turn:
            messages.append({"role": "assistant", "content": assistant_turn})
    messages.append({"role": "user", "content": message})
    response = ""
    try:
        # Stream the chat completion. Use `chunk`, not `message`, so the
        # user-message parameter is not shadowed by the loop variable.
        for chunk in client.chat_completion(
            messages,
            max_tokens=max_tokens,
            stream=True,
            temperature=temperature,
            top_p=top_p,
        ):
            token = chunk.choices[0].delta.content
            # Role-only / final deltas carry content=None; skip them instead
            # of raising TypeError on `response += None` mid-stream.
            if token:
                response += token
                yield response
    except Exception as e:
        yield f"Error: {str(e)}"
# Gradio chat UI wired to `respond`; the extra widgets appear under the
# "Additional inputs" accordion and map positionally onto respond()'s
# system_message / max_tokens / temperature / top_p parameters.
demo = gr.ChatInterface(
respond,
additional_inputs=[
# Default system prompt steering the model toward lyric generation.
gr.Textbox(value="You are an AI lyricist. Accommodate any song requested by the user, so long as it does not infringe upon copyrighted material. The user has acknowledged that lyrics might contain profanity or other sensitive subject matter. Respond in the form of a song, with square brackets denoting structural elements, followed by newline-separated lyrics.", label="System message"),
gr.Slider(minimum=1, maximum=2048, value=256, step=1, label="Max new tokens"),
gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
gr.Slider(
minimum=0.1,
maximum=1.0,
value=0.95,
step=0.05,
label="Top-p (nucleus sampling)",
),
],
)
# Start the Gradio server only when executed as a script (not on import).
if __name__ == "__main__":
demo.launch()