Not a member of Pastebin yet? Sign up; it unlocks many cool features!
import os

from flask import Flask, request, jsonify
from transformers import AutoModelForCausalLM, AutoTokenizer
# Single location of the fine-tuned checkpoint; the model weights and the
# tokenizer are both loaded from this directory.
_FINE_TUNED_DIR = "./fine_tuned_model"

app = Flask(__name__)

# Load the fine-tuned model and its tokenizer once, at import time, so every
# request handled by this process reuses the same objects.
model = AutoModelForCausalLM.from_pretrained(_FINE_TUNED_DIR)
tokenizer = AutoTokenizer.from_pretrained(_FINE_TUNED_DIR)
@app.route('/generate', methods=['POST'])
def generate_text():
    """Generate a continuation for the prompt sent in a JSON POST body.

    The request body must be a JSON object with a non-empty string
    ``prompt`` field.

    Returns:
        On success, a JSON response ``{"generated_text": <str>}``.
        On a malformed request, a JSON response ``{"error": <str>}`` with
        HTTP status 400 (instead of an unhandled exception / HTTP 500).
    """
    # silent=True returns None rather than raising when the body is missing,
    # has a non-JSON content type, or fails to parse.
    data = request.get_json(silent=True)
    if not isinstance(data, dict):
        return jsonify({'error': 'Request body must be a JSON object.'}), 400

    prompt = data.get('prompt')
    if not isinstance(prompt, str) or not prompt:
        return jsonify({'error': "'prompt' must be a non-empty string."}), 400

    # Generate text using the LLM.
    input_ids = tokenizer.encode(prompt, return_tensors='pt')
    # max_new_tokens bounds only the generated part; max_length would also
    # count the prompt tokens, leaving no room to generate for long prompts.
    output = model.generate(input_ids, max_new_tokens=100)
    generated_text = tokenizer.decode(output[0], skip_special_tokens=True)
    return jsonify({'generated_text': generated_text})
if __name__ == '__main__':
    # Flask's debug mode turns on the Werkzeug interactive debugger, which
    # lets anyone who can reach the server execute arbitrary Python. Keep it
    # off unless explicitly requested through the FLASK_DEBUG env variable.
    debug_enabled = os.environ.get('FLASK_DEBUG', '').lower() in ('1', 'true', 'yes')
    app.run(debug=debug_enabled)
Advertisement
Add Comment
Please sign in to add a comment.