datadabllp

set up an API endpoint for an LLM agent using Flask

Aug 20th, 2024
460
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
Python 0.75 KB | None | 0 0
  1. from flask import Flask, request, jsonify
  2. from transformers import AutoModelForCausalLM, AutoTokenizer
  3.  
  4. app = Flask(__name__)
  5.  
  6. # Load your fine-tuned model
  7. model = AutoModelForCausalLM.from_pretrained("./fine_tuned_model")
  8. tokenizer = AutoTokenizer.from_pretrained("./fine_tuned_model")
  9.  
  10. @app.route('/generate', methods=['POST'])
  11. def generate_text():
  12.     data = request.json
  13.     prompt = data['prompt']
  14.    
  15.     # Generate text using the LLM
  16.     input_ids = tokenizer.encode(prompt, return_tensors='pt')
  17.     output = model.generate(input_ids, max_length=100)
  18.     generated_text = tokenizer.decode(output[0], skip_special_tokens=True)
  19.    
  20.     return jsonify({'generated_text': generated_text})
  21.  
  22. if __name__ == '__main__':
  23.     app.run(debug=True)
  24.  
Advertisement
Add Comment
Please, Sign In to add comment