# NOTE: web-viewer residue (file-size banner, commit-hash gutter, line-number
# column) was removed from the top of this file; it was not part of the program.
import gradio as gr
from llama_cpp import Llama

# Llama() expects ``model_path`` to be a file on local disk and does not
# download from a URL, so the GGUF is fetched from the Hugging Face Hub (and
# cached locally) via from_pretrained before the model is constructed.
llm = Llama.from_pretrained(
    repo_id="DavidAU/OpenAi-GPT-oss-20b-abliterated-uncensored-NEO-Imatrix-gguf",
    filename="OpenAI-20B-NEO-Uncensored2-IQ4_NL.gguf",  # pick a quantization file, e.g. IQ4_NL
    n_ctx=8192,
    n_gpu_layers=0,  # no layers offloaded to a GPU
    verbose=False,
)

def generate_response(prompt):
    """Complete *prompt* with the module-level model and return the text.

    The model is called with at most 512 new tokens, temperature 1.0 and
    top-p 0.95; the ``'text'`` field of the first returned choice is the
    result.
    """
    sampling = {"max_tokens": 512, "temperature": 1.0, "top_p": 0.95}
    completion = llm(prompt, **sampling)
    first_choice = completion['choices'][0]
    return first_choice['text']

# Text-in / text-out Gradio interface backed by generate_response.
iface = gr.Interface(
    fn=generate_response,
    inputs="text",
    outputs="text",
    title="GPT-20B Test",
)
# Start serving the interface.
iface.launch()