SCANSKY
/

BERTopic-Tourism-Chinese

Model card Files Files and versions

SCANSKY commited on Feb 28

Commit

d85085f

·

verified ·

1 Parent(s): a9a0985

Create handler.py

Files changed (1) hide show

handler.py +80 -0

handler.py ADDED Viewed

	@@ -0,0 +1,80 @@

+import json
+from bertopic import BERTopic
+class EndpointHandler:
+    def __init__(self, model_path="SCANSKY/BERTopic-Tourism-English"):
+        """
+        Initialize the handler. Load the BERTopic model from Hugging Face.
+        """
+        self.topic_model = BERTopic.load(model_path)
+    def preprocess(self, data):
+        """
+        Preprocess the incoming request data.
+        - Extract text input from the request.
+        """
+        try:
+            # Directly work with the incoming data dictionary
+            text_input = data.get("inputs", "")
+            return text_input
+        except Exception as e:
+            raise ValueError(f"Error during preprocessing: {str(e)}")
+    def inference(self, text_input):
+        """
+        Perform inference using the BERTopic model.
+        - Process the text input and generate topic predictions.
+        """
+        try:
+            # Split text into documents (assuming one document per line)
+            docs = text_input.strip().split('\n')
+            # Perform topic inference
+            topics, probabilities = self.topic_model.transform(docs)
+            # Prepare the results
+            results = []
+            for topic, prob in zip(topics, probabilities):
+                topic_info = self.topic_model.get_topic(topic)
+                topic_words = [word for word, _ in topic_info] if topic_info else []
+                # Get custom label for the topic (with fallback if custom_labels_ is not available)
+                if hasattr(self.topic_model, "custom_labels_") and self.topic_model.custom_labels_ is not None:
+                    custom_label = self.topic_model.custom_labels_[topic + 1]
+                else:
+                    custom_label = f"Topic {topic}"  # Fallback label
+                results.append({
+                    "topic": int(topic),
+                    "probability": float(prob),
+                    "top_words": topic_words[:5],  # Top 5 words
+                    "customLabel": custom_label  # Add custom label
+                })
+            return results
+        except Exception as e:
+            raise ValueError(f"Error during inference: {str(e)}")
+    def postprocess(self, results):
+        """
+        Postprocess the inference results into a JSON-serializable list.
+        """
+        return results  # Directly returning the list of results
+    def __call__(self, data):
+        """
+        Handle the incoming request.
+        """
+        try:
+            # Preprocess the data
+            text_input = self.preprocess(data)
+            # Perform inference
+            results = self.inference(text_input)
+            # Postprocess the results
+            response = self.postprocess(results)
+            return response
+        except Exception as e:
+            return [{"error": str(e)}]  # Returning error as a list with a dictionary