Spaces:

tori29umai
/

ContentSafetyAnalyzer

Running on Zero

App Files Files Community

tori29umai commited on Jun 5

Commit

aa2fbfe

•

1 Parent(s): 607a0f5

Update

Browse files

Files changed (1) hide show

app.py +19 -61

app.py CHANGED Viewed

@@ -31,7 +31,6 @@ def preprocess_image(image):
     image = image.astype(np.float32)
     return image
 class webui:
     def __init__(self):
         self.demo = gr.Blocks()
@@ -41,39 +40,36 @@ class webui:
         print("Hugging Faceからモデルをダウンロード中")
         onnx_path = hf_hub_download(model_id, "model.onnx")
         csv_path = hf_hub_download(model_id, "selected_tags.csv")
-        ort_sess = ort.InferenceSession(onnx_path)
-        print("ONNXモデルを実行中")
-        print(f"ONNXモデルのパス: {onnx_path}")
         image = Image.open(image_path)
         image = image.convert("RGB") if image.mode != "RGB" else image
         image = preprocess_image(image)
         with open(csv_path, "r", encoding="utf-8") as f:
             reader = csv.reader(f)
-            header = next(reader)
             rows = list(reader)
         rating_tags = [row[1] for row in rows if row[2] == "9"]
         character_tags = [row[1] for row in rows if row[2] == "4"]
         general_tags = [row[1] for row in rows if row[2] == "0"]
-        img = np.array([image])
-        prob = ort_sess.run(None, {ort_sess.get_inputs()[0].name: img})[0][0]  # ONNXモデルからの出力
         thresh = 0.35
         # NSFW/SFW判定
         tag_confidences = {tag: prob[i] for i, tag in enumerate(rating_tags)}
         max_nsfw_score = max(tag_confidences.get("questionable", 0), tag_confidences.get("explicit", 0))
         max_sfw_score = tag_confidences.get("general", 0)
-        NSFW_flag = None
-        if max_nsfw_score > max_sfw_score:
-            NSFW_flag = "NSFWの可能性が高いです"
-        else:
-            NSFW_flag = "SFWの可能性が高いです"
         # 版権キャラクターの可能性を評価
         character_tags_with_probs = []
@@ -85,50 +81,12 @@ class webui:
                     prob_percent = round(p * 100, 2)  # 確率をパーセンテージに変換
                     character_tags_with_probs.append((tag_name, f"{prob_percent}%"))
-        IP_flag = None
-        if character_tags_with_probs:
-            IP_flag = f"版権キャラクター: {character_tags_with_probs}の可能性があります"
-        else:
-            IP_flag = "版権キャラクターの可能性が低いと思われます"
         # タグを生成
-        tag_freq = {}
-        undesired_tags = []
-        combined_tags = []
-        general_tag_text = ""
-        character_tag_text = ""
-        remove_underscore = True
-        caption_separator = ", "
-        general_threshold = 0.35
-        character_threshold = 0.35
-        for i, p in enumerate(prob[4:]):
-            if i < len(general_tags) and p >= general_threshold:
-                tag_name = general_tags[i]
-                if remove_underscore and len(tag_name) > 3:  # ignore emoji tags like >_< and ^_^
-                    tag_name = tag_name.replace("_", " ")
-                if tag_name not in undesired_tags:
-                    tag_freq[tag_name] = tag_freq.get(tag_name, 0) + 1
-                    general_tag_text += caption_separator + tag_name
-                    combined_tags.append(tag_name)
-            elif i >= len(general_tags) and p >= character_threshold:
-                tag_name = character_tags[i - len(general_tags)]
-                if remove_underscore and len(tag_name) > 3:
-                    tag_name = tag_name.replace("_", " ")
-                if tag_name not in undesired_tags:
-                    tag_freq[tag_name] = tag_freq.get(tag_name, 0) + 1
-                    character_tag_text += caption_separator + tag_name
-                    combined_tags.append(tag_name)
-        # 先頭のカンマを取る
-        if len(general_tag_text) > 0:
-            general_tag_text = general_tag_text[len(caption_separator) :]
-        if len(character_tag_text) > 0:
-            character_tag_text = character_tag_text[len(caption_separator) :]
-        tag_text = caption_separator.join(combined_tags)
         return NSFW_flag, IP_flag, tag_text
     def launch(self):
@@ -136,7 +94,7 @@ class webui:
             with gr.Row():
                 with gr.Column():
                     input_image = gr.Image(type='filepath', label="Analysis Image")
-                    model_id = gr.Textbox(label="MODEL ID", value="SmilingWolf/wd-vit-tagger-v3")
                     output_0 = gr.Textbox(label="NSFW Flag")
                     output_1 = gr.Textbox(label="IP Flag")
                     output_2 = gr.Textbox(label="Tags")
@@ -148,8 +106,8 @@ class webui:
                         outputs=[output_0, output_1, output_2]
                     )
-        self.demo.launch()
 if __name__ == "__main__":
     ui = webui()
-    ui.launch()

     image = image.astype(np.float32)
     return image
 class webui:
     def __init__(self):
         self.demo = gr.Blocks()
         print("Hugging Faceからモデルをダウンロード中")
         onnx_path = hf_hub_download(model_id, "model.onnx")
         csv_path = hf_hub_download(model_id, "selected_tags.csv")
+        # ONNXモデルとCSVファイルの読み込み
         image = Image.open(image_path)
         image = image.convert("RGB") if image.mode != "RGB" else image
         image = preprocess_image(image)
+        img = np.array([image])
+        ort_sess = ort.InferenceSession(onnx_path)  # セッションの生成をここで行う
+        prob = ort_sess.run(None, {ort_sess.get_inputs()[0].name: img})[0][0]
         with open(csv_path, "r", encoding="utf-8") as f:
             reader = csv.reader(f)
+            next(reader)  # ヘッダーをスキップ
             rows = list(reader)
         rating_tags = [row[1] for row in rows if row[2] == "9"]
         character_tags = [row[1] for row in rows if row[2] == "4"]
         general_tags = [row[1] for row in rows if row[2] == "0"]
+        # タグと評価
+        NSFW_flag, IP_flag, tag_text = self.evaluate_tags(prob, rating_tags, character_tags, general_tags)
+        return NSFW_flag, IP_flag, tag_text
+    def evaluate_tags(self, prob, rating_tags, character_tags, general_tags):
         thresh = 0.35
         # NSFW/SFW判定
         tag_confidences = {tag: prob[i] for i, tag in enumerate(rating_tags)}
         max_nsfw_score = max(tag_confidences.get("questionable", 0), tag_confidences.get("explicit", 0))
         max_sfw_score = tag_confidences.get("general", 0)
+        NSFW_flag = "NSFWの可能性が高いです" if max_nsfw_score > max_sfw_score else "SFWの可能性が高いです"
         # 版権キャラクターの可能性を評価
         character_tags_with_probs = []
                     prob_percent = round(p * 100, 2)  # 確率をパーセンテージに変換
                     character_tags_with_probs.append((tag_name, f"{prob_percent}%"))
+        IP_flag = f"版権キャラクター: {character_tags_with_probs}の可能性があります" if character_tags_with_probs else "版権キャラクターの可能性が低いと思われます"
         # タグを生成
+        general_tag_text = ", ".join([general_tags[i] for i in range(len(general_tags)) if prob[i] >= thresh])
+        character_tag_text = ", ".join([character_tags[i - len(general_tags)] for i in range(len(general_tags), len(prob)) if prob[i] >= thresh])
+        tag_text = f"{general_tag_text}, {character_tag_text}" if character_tag_text else general_tag_text
         return NSFW_flag, IP_flag, tag_text
     def launch(self):
             with gr.Row():
                 with gr.Column():
                     input_image = gr.Image(type='filepath', label="Analysis Image")
+                    model_id = gr.Textbox(label="Model ID", value="SmilingWolf/wd-vit-tagger-v3")
                     output_0 = gr.Textbox(label="NSFW Flag")
                     output_1 = gr.Textbox(label="IP Flag")
                     output_2 = gr.Textbox(label="Tags")
                         outputs=[output_0, output_1, output_2]
                     )
+        self.demo.launch(share=True)  # 公開リンクを設定
 if __name__ == "__main__":
     ui = webui()
+    ui.launch()