HIEHEU committed on
Commit
41e35d1
·
verified ·
1 Parent(s): 226e13c

Update py/abstractive.py

Browse files
Files changed (1) hide show
  1. py/abstractive.py +11 -11
py/abstractive.py CHANGED
@@ -40,7 +40,7 @@ def clean_text_inference(text: str) -> str:
40
  return text
41
 
42
  # -------------------------------------------------------------------
43
- # PHOBERT ENCODER (PyTorch) - ĐÃ SỬA CHỮA
44
  # -------------------------------------------------------------------
45
  class PhoBERTEncoderTorch:
46
  def __init__(self):
@@ -52,14 +52,15 @@ class PhoBERTEncoderTorch:
52
 
53
  def encode(self, input_ids, attention_mask):
54
  with torch.no_grad():
55
- # [FIX 1] Ép kiểu input thành Long (int64) để tránh lỗi embedding trên CPU
56
  ids = torch.tensor(input_ids, dtype=torch.long).to(self.device)
57
  mask = torch.tensor(attention_mask, dtype=torch.long).to(self.device)
58
 
59
  outputs = self.model(ids, attention_mask=mask)
60
 
61
- # [FIX 2] Output chuyển về numpy ép kiểu float32
62
- # Quan trọng: TensorFlow mặc định float32, nếu để float64 sẽ gây lỗi tính toán sai
 
63
  return outputs.last_hidden_state.detach().cpu().numpy().astype(np.float32)
64
 
65
  # -------------------------------------------------------------------
@@ -94,6 +95,7 @@ if TF_AVAILABLE:
94
  self.drop3 = tf.keras.layers.Dropout(rate)
95
 
96
  def call(self, x, enc_output, training=None):
 
97
  attn1 = self.att1(x, x, use_causal_mask=True)
98
  out1 = self.ln1(x + self.drop1(attn1, training=training))
99
  attn2 = self.att2(out1, enc_output)
@@ -102,7 +104,7 @@ if TF_AVAILABLE:
102
  return self.ln3(out2 + self.drop3(ffn_out, training=training))
103
 
104
  # -------------------------------------------------------------------
105
- # BUILD DECODER MODEL (Đã chỉnh sửa để khớp với file export)
106
  # -------------------------------------------------------------------
107
  def build_inference_model():
108
  # 1. Inputs
@@ -110,8 +112,7 @@ def build_inference_model():
110
  enc_raw_input = tf.keras.Input(shape=(None, 768), name='enc_raw_input')
111
  dec_inputs_inf = tf.keras.Input(shape=(None,), dtype=tf.int32, name='dec_inputs_inf')
112
 
113
- # 2. Projection Layer (Quan trọng: Phải đặt tên đúng để load weights)
114
- # Layer này chuyển 768 -> 512
115
  enc_out = tf.keras.layers.Dense(CONFIG["EMBED_DIM"], activation="linear", name="encoder_projection")(enc_raw_input)
116
  enc_out = tf.keras.layers.Dropout(CONFIG["DROPOUT"], name="encoder_dropout")(enc_out)
117
 
@@ -133,7 +134,6 @@ def build_inference_model():
133
  # 4. Decoder Blocks
134
  dec_out = dec_emb_inf
135
  for i in range(CONFIG["NUM_LAYERS"]):
136
- # Tên block phải khớp: decoder_block_0, decoder_block_1...
137
  block = TransformerDecoderBlock(
138
  CONFIG["EMBED_DIM"],
139
  CONFIG["NUM_HEADS"],
@@ -178,7 +178,7 @@ class AbstractiveSummarizer:
178
 
179
  print(f"📥 Loading weights from {weights_path}...")
180
  try:
181
- # Load weights. Quan trọng: skip_mismatch=False để đảm bảo mọi thứ khớp 100%
182
  self.decoder_model.load_weights(weights_path)
183
  print("✅ Weights loaded successfully!")
184
  except Exception as e:
@@ -236,10 +236,10 @@ class AbstractiveSummarizer:
236
  return_tensors='np'
237
  )
238
 
239
- # 3. Encode bằng PyTorch (nhận về vector 768 chiều, float32)
240
  enc_out = self.phobert.encode(inp['input_ids'], inp['attention_mask'])
241
 
242
- # 4. Generate Summary bằng TF Model (có tích hợp Projection 768->512)
243
  seq = self.beam_search(enc_out, k=k)
244
 
245
  # 5. Decode kết quả
 
40
  return text
41
 
42
  # -------------------------------------------------------------------
43
+ # PHOBERT ENCODER (PyTorch) - [ĐÃ SỬA ĐỂ KHỚP DATA TYPE]
44
  # -------------------------------------------------------------------
45
  class PhoBERTEncoderTorch:
46
  def __init__(self):
 
52
 
53
  def encode(self, input_ids, attention_mask):
54
  with torch.no_grad():
55
+ # [SỬA 1] Ép kiểu input thành Long (int64) để tránh lỗi với PyTorch CPU
56
  ids = torch.tensor(input_ids, dtype=torch.long).to(self.device)
57
  mask = torch.tensor(attention_mask, dtype=torch.long).to(self.device)
58
 
59
  outputs = self.model(ids, attention_mask=mask)
60
 
61
+ # [SỬA 2] Quan trọng nhất: Chuyển output về float32
62
+ # PyTorch CPU thường trả về float64, nhưng TensorFlow Keras 3 cần float32.
63
+ # Nếu không ép kiểu này, model sẽ tính toán ra rác.
64
  return outputs.last_hidden_state.detach().cpu().numpy().astype(np.float32)
65
 
66
  # -------------------------------------------------------------------
 
95
  self.drop3 = tf.keras.layers.Dropout(rate)
96
 
97
  def call(self, x, enc_output, training=None):
98
+ # Code này dùng use_causal_mask=True -> Bắt buộc dùng Keras 3 (TensorFlow > 2.16)
99
  attn1 = self.att1(x, x, use_causal_mask=True)
100
  out1 = self.ln1(x + self.drop1(attn1, training=training))
101
  attn2 = self.att2(out1, enc_output)
 
104
  return self.ln3(out2 + self.drop3(ffn_out, training=training))
105
 
106
  # -------------------------------------------------------------------
107
+ # BUILD DECODER MODEL
108
  # -------------------------------------------------------------------
109
  def build_inference_model():
110
  # 1. Inputs
 
112
  enc_raw_input = tf.keras.Input(shape=(None, 768), name='enc_raw_input')
113
  dec_inputs_inf = tf.keras.Input(shape=(None,), dtype=tf.int32, name='dec_inputs_inf')
114
 
115
+ # 2. Projection Layer
 
116
  enc_out = tf.keras.layers.Dense(CONFIG["EMBED_DIM"], activation="linear", name="encoder_projection")(enc_raw_input)
117
  enc_out = tf.keras.layers.Dropout(CONFIG["DROPOUT"], name="encoder_dropout")(enc_out)
118
 
 
134
  # 4. Decoder Blocks
135
  dec_out = dec_emb_inf
136
  for i in range(CONFIG["NUM_LAYERS"]):
 
137
  block = TransformerDecoderBlock(
138
  CONFIG["EMBED_DIM"],
139
  CONFIG["NUM_HEADS"],
 
178
 
179
  print(f"📥 Loading weights from {weights_path}...")
180
  try:
181
+ # Load weights.
182
  self.decoder_model.load_weights(weights_path)
183
  print("✅ Weights loaded successfully!")
184
  except Exception as e:
 
236
  return_tensors='np'
237
  )
238
 
239
+ # 3. Encode bằng PyTorch (nhận về vector 768 chiều, đã ép float32)
240
  enc_out = self.phobert.encode(inp['input_ids'], inp['attention_mask'])
241
 
242
+ # 4. Generate Summary bằng TF Model
243
  seq = self.beam_search(enc_out, k=k)
244
 
245
  # 5. Decode kết quả