Spaces:
Runtime error
Runtime error
| import uvicorn | |
| from fastapi import FastAPI | |
| from transformers import AutoModelForCausalLM, AutoTokenizer | |
# ASGI application object for this service.
app = FastAPI()

# Checkpoint identifier shared by the tokenizer and model loaders below.
model_name = "facebook/incoder-1B"

# Both objects are created once at import time and then reused by the
# generation function as module-level globals.
tokenizer = AutoTokenizer.from_pretrained(model_name)
model = AutoModelForCausalLM.from_pretrained(
    model_name,
    low_cpu_mem_usage=True,
)

# Startup marker written to stdout once loading has finished.
print("load ok")
def read_root(input_text, max_length, top_p, top_k, num_beams, temperature, repetition_penalty):
    """Generate text from ``input_text`` using the module-level model.

    Each generation setting is coerced to a number before it is forwarded to
    ``model.generate``, so numeric strings are accepted as well as numbers.

    Args:
        input_text: Prompt text, encoded with the module-level ``tokenizer``.
        max_length: Forwarded as ``max_length`` after ``int()`` conversion.
        top_p: Forwarded as ``top_p`` after ``float()`` conversion.
        top_k: Forwarded as ``top_k`` as an integer; fractional values are
            truncated towards zero.
        num_beams: Forwarded as ``num_beams`` after ``int()`` conversion.
        temperature: Forwarded as ``temperature`` after ``float()`` conversion.
        repetition_penalty: Forwarded as ``repetition_penalty`` after
            ``float()`` conversion.

    Returns:
        A dict with the single key ``"text"`` holding the decoded first
        sequence returned by ``model.generate``.

    Raises:
        ValueError: If a setting cannot be converted to the required number.
        TypeError: If a setting is of a type ``int()``/``float()`` rejects.
    """
    input_ids = tokenizer.encode(input_text, return_tensors="pt")

    # NOTE(review): ``do_sample`` is not set here, so ``generate`` presumably
    # runs greedy/beam search and ignores top_p / top_k / temperature.
    # Confirm whether sampling was intended before enabling it.
    output_ids = model.generate(
        input_ids,
        max_length=int(max_length),
        top_p=float(top_p),
        # top_k is a token count and must be an int, not a float. Going
        # through float() first keeps inputs such as "50.0" working.
        top_k=int(float(top_k)),
        temperature=float(temperature),
        num_beams=int(num_beams),
        repetition_penalty=float(repetition_penalty),
    )

    # The default clean-up pass strips spaces around punctuation, which
    # corrupts generated source code; keep the decoded text verbatim.
    text = tokenizer.decode(output_ids[0], clean_up_tokenization_spaces=False)
    return {"text": text}