Spaces:

Aekanun
/

Thai-HandWriting-to-Text

Running on Zero

App Files Community

Aekanun committed 15 days ago

Commit

b5217a9

•

1 Parent(s): 21cb9fc

fixing

Browse files

Files changed (2) hide show

app.py +16 -6
config.json +9 -0

app.py CHANGED Viewed

@@ -24,10 +24,11 @@ def load_model_and_processor():
     print("กำลังโหลดโมเดลและ processor...")
     try:
         base_model_path = "meta-llama/Llama-3.2-11B-Vision-Instruct"
         hub_model_path = "Aekanun/thai-handwriting-llm"
-        # ตั้งค่า BitsAndBytes แบบเดียวกับต้นฉบับ
         bnb_config = BitsAndBytesConfig(
             load_in_4bit=True,
             bnb_4bit_use_double_quant=True,
@@ -35,19 +36,21 @@ def load_model_and_processor():
             bnb_4bit_compute_dtype=torch.bfloat16
         )
-        # โหลด processor แบบเดียวกับต้นฉบับ (ไม่มี token)
         processor = AutoProcessor.from_pretrained(base_model_path)
-        # โหลดโมเดลจาก Hub แบบเดียวกับต้นฉบับ
-        print("กำลังโหลดโมเดลจาก Hub...")
         model = AutoModelForVision2Seq.from_pretrained(
             hub_model_path,
             device_map="auto",
             torch_dtype=torch.bfloat16,
             quantization_config=bnb_config,
-            trust_remote_code=True
         )
-        print("โหลดโมเดลจาก Hub สำเร็จ!")
         return True
     except Exception as e:
@@ -55,13 +58,18 @@ def load_model_and_processor():
         return False
 def process_handwriting(image):
     if image is None:
         return "กรุณาอัพโหลดรูปภาพ"
     try:
         if not isinstance(image, Image.Image):
             image = Image.fromarray(image)
         if image.mode != "RGB":
             image = image.convert("RGB")
@@ -96,8 +104,10 @@ Only return the transcription in Thai language."""
     except Exception as e:
         return f"เกิดข้อผิดพลาด: {str(e)}"
 print("กำลังเริ่มต้นแอปพลิเคชัน...")
 if load_model_and_processor():
     demo = gr.Interface(
         fn=process_handwriting,
         inputs=gr.Image(type="pil", label="อัพโหลดรูปลายมือเขียนภาษาไทย"),

     print("กำลังโหลดโมเดลและ processor...")
     try:
+        # กำหนด paths
         base_model_path = "meta-llama/Llama-3.2-11B-Vision-Instruct"
         hub_model_path = "Aekanun/thai-handwriting-llm"
+        # ตั้งค่า BitsAndBytes
         bnb_config = BitsAndBytesConfig(
             load_in_4bit=True,
             bnb_4bit_use_double_quant=True,
             bnb_4bit_compute_dtype=torch.bfloat16
         )
+        # โหลด processor จาก base model
+        print("Loading processor...")
         processor = AutoProcessor.from_pretrained(base_model_path)
+        # โหลดโมเดลจาก Hub
+        print("Loading model...")
         model = AutoModelForVision2Seq.from_pretrained(
             hub_model_path,
             device_map="auto",
             torch_dtype=torch.bfloat16,
             quantization_config=bnb_config,
+            trust_remote_code=True,
+            force_download=True  # เพิ่มมาเพื่อให้โหลดใหม่
         )
+        print("Model loaded successfully!")
         return True
     except Exception as e:
         return False
 def process_handwriting(image):
+    """ฟังก์ชันสำหรับ Gradio interface"""
+    global model, processor
     if image is None:
         return "กรุณาอัพโหลดรูปภาพ"
     try:
+        # Ensure image is in PIL format
         if not isinstance(image, Image.Image):
             image = Image.fromarray(image)
+        # Convert to RGB if needed
         if image.mode != "RGB":
             image = image.convert("RGB")
     except Exception as e:
         return f"เกิดข้อผิดพลาด: {str(e)}"
+# Initialize application
 print("กำลังเริ่มต้นแอปพลิเคชัน...")
 if load_model_and_processor():
+    # Create Gradio interface
     demo = gr.Interface(
         fn=process_handwriting,
         inputs=gr.Image(type="pil", label="อัพโหลดรูปลายมือเขียนภาษาไทย"),

config.json ADDED Viewed

	@@ -0,0 +1,9 @@

+{
+    "architectures": ["LlamaForCausalLM"],
+    "model_type": "llama",
+    "tokenizer_class": "PreTrainedTokenizerFast",
+    "model_max_length": 131072,
+    "megatron_core": "megatron.core",
+    "task_type": "CAUSAL_LM",
+    "target_modules": ["q_proj", "v_proj"]
+}