# Manglify_Backend/services/translate_qwen_service.py
import json
import os
import requests
from pathlib import Path
from helpers import get_project_root
from dotenv import load_dotenv, find_dotenv


class Translate_Qwen_Service:
    def __init__(self, device=None):
        self.tokenizer = None
        self.model = None
        self.device = device if device else "cpu"

        ROOT = get_project_root()
        # Model artifacts live under MODEL_PATH (default: <project root>/backend/models), in a "Qwen" subfolder.
        self.base_model_path = Path(os.getenv("MODEL_PATH", ROOT / "backend" / "models"))
        self.qwen_dir = self.base_model_path / "Qwen"

    def initialize_local_models(self):
        """Internal method: load the local Qwen tokenizer and model only when they are needed."""
        if self.model is not None and self.tokenizer is not None:
            return

        # Import transformers lazily so the dependency is only required for local inference.
        from transformers import AutoTokenizer, AutoModelForCausalLM

        tokenizer_path = self.qwen_dir / "tokenizer"
        model_path = self.qwen_dir / "model"

        if not (tokenizer_path.exists() and model_path.exists()):
            print(f"Qwen tokenizer/model not found at {self.qwen_dir}. Attempting to download.")
            self.load_model()

        if tokenizer_path.exists() and model_path.exists():
            self.tokenizer = AutoTokenizer.from_pretrained(tokenizer_path)
            # Move the weights to the configured device so they match the inputs built in translate().
            self.model = AutoModelForCausalLM.from_pretrained(model_path, tie_word_embeddings=False).to(self.device)
            print("Loaded Qwen LLM locally")
        else:
            raise FileNotFoundError(f"Error: Could not find or retrieve {model_path}")

    def load_model(self):
        from transformers import AutoTokenizer, AutoModelForCausalLM

        DOWNLOAD_MODEL = "Qwen/Qwen2.5-7B-Instruct"
        tokenizer = AutoTokenizer.from_pretrained(DOWNLOAD_MODEL)
        model = AutoModelForCausalLM.from_pretrained(DOWNLOAD_MODEL)

        tokenizer.save_pretrained(self.qwen_dir / "tokenizer")
        model.save_pretrained(self.qwen_dir / "model")
        print(f"Downloaded Qwen LLM to: {self.qwen_dir}")
        return str(self.qwen_dir)

    def translate(self, text):
        if not self.model or not self.tokenizer:
            self.initialize_local_models()

        messages = [
            {
                "role": "system",
                "content": """
                You are a professional localizer/translator for Manga, Manhwa, and Manhua into English. You will receive JSON-formatted OCR text from manga.
                Analyze the whole list before translating any single line to understand the story context.
                Maintain Name Consistency: Do not translate names literally. If a word functions as a name, transliterate it (e.g., "Tonari" stays "Tonari", not "Next-door").
                Handle Stutters: If text is broken across multiple lines (e.g., "T... T... Tonari"), reconstruct the full thought in the translation.
                Match Tone: Use natural, colloquial English suitable for the detected setting (School, Fantasy, etc.).
                Output Format: Return ONLY a JSON object mapping the original ID to the translation.
                Sample JSON Object:
                {
                    "0": "Translated text for line 0",
                    "1": "Translated text for line 1",
                    "2": "Translated text for line 2"
                }
                """
            },
            {
                "role": "user",
                "content": str(text)
            },
        ]

        inputs = self.tokenizer.apply_chat_template(
            messages,
            add_generation_prompt=True,
            tokenize=True,
            return_dict=True,
            return_tensors="pt",
        ).to(self.device)

        outputs = self.model.generate(**inputs, max_new_tokens=400)
        # Decode only the newly generated tokens, skipping the prompt portion of the sequence.
        output_text = self.tokenizer.decode(outputs[0][inputs["input_ids"].shape[-1]:], skip_special_tokens=True)

        try:
            return json.loads(output_text)
        except json.JSONDecodeError:
            print(f"LLM output was not valid JSON: {output_text}")
            return {"error": "Invalid JSON", "raw": output_text}

    def translate_cloud(self, text):
        API_URL = "https://router.huggingface.co/v1/chat/completions"

        load_dotenv(find_dotenv())
        HF_TOKEN = os.getenv("HF_TOKEN")
        if not HF_TOKEN:
            raise ValueError("HF_TOKEN missing")

        headers = {
            "Authorization": f"Bearer {HF_TOKEN}",
        }

        query = {
            "messages": [
                {
                    "role": "system",
                    "content": """
                    You are a professional localizer/translator for Manga, Manhwa, and Manhua into English. You will receive JSON-formatted OCR text from manga.
                    Analyze the whole list before translating any single line to understand the story context.
                    Maintain Name Consistency: Do not translate names literally. If a word functions as a name, transliterate it (e.g., "Tonari" stays "Tonari", not "Next-door").
                    Handle Stutters: If text is broken across multiple lines (e.g., "T... T... Tonari"), reconstruct the full thought in the translation.
                    Match Tone: Use natural, colloquial English suitable for the detected setting (School, Fantasy, etc.).
                    Output Format: Return ONLY a JSON object mapping the original ID to the translation.
                    Sample JSON Object:
                    {
                        "0": "Translated text for line 0",
                        "1": "Translated text for line 1",
                        "2": "Translated text for line 2"
                    }
                    """
                },
                {
                    "role": "user",
                    "content": str(text)
                },
            ],
            "model": "Qwen/Qwen2.5-7B-Instruct:fastest",
            "response_format": {"type": "json_object"}
        }

        try:
            response = requests.post(API_URL, headers=headers, json=query)
            response.raise_for_status()
            data = response.json()
            raw_content = data['choices'][0]['message']['content']
            output_text = json.loads(raw_content)
            return output_text
        except Exception as e:
            print(f"Qwen API Translation failed: {e}")
            raise
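

# --- Usage sketch (illustrative; not part of the original service) ---
# The payload shape and sample strings below are assumptions, chosen to match the
# ID-to-text JSON mapping described in the system prompt. translate() runs the locally
# cached Qwen weights; translate_cloud() calls the Hugging Face router and requires
# HF_TOKEN in the environment.
if __name__ == "__main__":
    service = Translate_Qwen_Service(device="cpu")
    # Hypothetical OCR output keyed by line ID, as the prompts expect.
    ocr_lines = {"0": "ト... ト... トナリ", "1": "学校に行こうよ"}
    try:
        translated = service.translate_cloud(ocr_lines)
    except Exception:
        # Fall back to local inference if the hosted endpoint is unavailable.
        translated = service.translate(ocr_lines)
    print(translated)  # e.g. {"0": "T... T... Tonari", "1": "Let's go to school"}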