rein0421 committed on
Commit 82291b8 · verified · 1 Parent(s): 374194c

Upload 7 files

Files changed (7)
  1. 1026.pt +3 -0
  2. Dockerfile +24 -0
  3. app.py +941 -0
  4. main.png +0 -0
  5. output_vectors.json +0 -0
  6. requirements.txt +72 -0
  7. sums_data.json +0 -0
1026.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:87af30931732d6ac63bd65230b33f22ca157a3dd97e72c361b55be8a3a2dfade
+ size 22568035
Dockerfile ADDED
@@ -0,0 +1,24 @@
+ # Use the official Python 3.10.9 image
+ FROM python:3.10.9
+
+ # Install dependencies for OpenCV and other requirements
+ RUN apt-get update && apt-get install -y libgl1 libglib2.0-0 curl
+
+ # Create a user to avoid permission issues
+ RUN useradd -m appuser
+
+ # Set the working directory to /home/appuser
+ WORKDIR /home/appuser
+
+ # Copy the current directory contents into the container so app.py and the
+ # model files sit in the working directory uvicorn is started from
+ COPY . .
+
+ USER appuser
+
+ # Add /home/appuser/.local/bin to PATH
+ ENV PATH="/home/appuser/.local/bin:${PATH}"
+
+ # Install requirements.txt
+ RUN pip install --no-cache-dir --upgrade -r requirements.txt
+
+ # Start the FastAPI app on port 7860, the default port expected by Spaces
+ CMD ["uvicorn", "app:app", "--host", "0.0.0.0", "--port", "7860"]
app.py ADDED
@@ -0,0 +1,941 @@
+ # -*- coding: utf-8 -*-
+
+ # Commented out IPython magic to ensure Python compatibility.
+
+ import os
+ import supervision as sv
+ from PIL import Image, ImageFilter
+ import numpy as np
+ import cv2
+ import pycocotools.mask as mask_util
+
+ from fastapi import FastAPI, File, UploadFile, Form
+ from fastapi.middleware.cors import CORSMiddleware
+ from fastapi.responses import FileResponse, HTMLResponse
+ import shutil
+ import json
+ from pathlib import Path
+ import nest_asyncio
+ import uvicorn
+ from pyngrok import ngrok
+ from diffusers import StableDiffusionInpaintPipeline
+ import torch
+ from simple_lama_inpainting import SimpleLama
+ from sklearn.cluster import (
+     KMeans, AgglomerativeClustering, DBSCAN, MiniBatchKMeans, Birch,
+     SpectralClustering, MeanShift, OPTICS
+ )
+ from sklearn.decomposition import PCA
+ from sklearn.metrics import silhouette_score
+ from sklearn.neighbors import KNeighborsClassifier
+ from torchvision import transforms
+ import threading
+ import concurrent.futures
+ from typing import Tuple
+ from types import SimpleNamespace
+ import subprocess
+ import uuid
+ from datetime import datetime
+ from ultralytics import YOLO
+ import math
+ import matplotlib.pyplot as plt
+
+ # The code below is the variant that does not mask out specific regions.
+
+ app = FastAPI()
+
+ # Add the CORS middleware
+ app.add_middleware(
+     CORSMiddleware,
+     allow_origins=["*"],  # This can be restricted to specific origins
+     allow_credentials=True,
+     allow_methods=["*"],
+     allow_headers=["*"],
+ )
+
+ HOME = "./"
+
+ dangerarray = [10, 30, 90, 50, 80, 20, 40, 70, 100, 60]  # The danger level assigned to each cluster
+ # The thresholds below can be tuned to raise or lower the detection sensitivity per class
+
+ thresholds = {
+     'text': 0.1,
+     'name tag': 0.1,
+     'license plate': 0.3,
+     'Mail': 0.3,
+     'Documents': 0.3,
+     'QR codes': 0.4,
+     'barcodes': 0.4,
+     'map': 0.5,
+     'digital screens': 0.6,
+     'information board': 0.5,
+     'signboard': 0.3,
+     'poster': 0.8,
+     'sign': 0.3,
+     'logo': 0.3,
+     'card': 0.4,
+     'window': 0.2,
+     'mirror': 0.2,
+     'Famous landmark': 0.7,
+     'cardboard': 0.6,
+     'manhole': 0.6,
+     'utility pole': 0.7
+ }
+
+ # Define paths
+ CONFIG_PATH = os.path.join(HOME, "GroundingDINO/groundingdino/config/GroundingDINO_SwinT_OGC.py")
+ WEIGHTS_NAME = "groundingdino_swint_ogc.pth"
+ WEIGHTS_PATH = os.path.join(HOME, "weights", WEIGHTS_NAME)
+
+ def is_bright(pixel):
+     # Compute the luminance of a pixel to judge its brightness
+     r, g, b = pixel
+     brightness = (0.299 * r + 0.587 * g + 0.114 * b)  # Luminance calculation
+     return brightness > 127  # Threshold set to 127
+
+ def analyze_mask_brightness(original_image_path, mask_image_path):
+     # Open the images
+     original_img = Image.open(original_image_path).convert('RGB')
+     mask_img = Image.open(mask_image_path).convert('L')  # Convert to grayscale
+
+     width, height = original_img.size
+
+     if mask_img.size != (width, height):
+         print("Error: the mask image and the original image differ in size.")
+         return
+
+     # Count bright and dark pixels
+     bright_count = 0
+     dark_count = 0
+
+     for y in range(height):
+         for x in range(width):
+             mask_value = mask_img.getpixel((x, y))
+             if mask_value > 127:  # If the mask is white (target region)
+                 pixel = original_img.getpixel((x, y))
+                 if is_bright(pixel):
+                     bright_count += 1
+                 else:
+                     dark_count += 1
+
+     # Decide the overall brightness
+     brightness_result = 1 if bright_count > dark_count else 2
+
+     return brightness_result
+
+ def classify_mask_size(mask_image_path, small_threshold, medium_threshold, large_threshold):
+     # Open the mask image
+     mask_img = Image.open(mask_image_path).convert('L')  # Convert to grayscale
+
+     width, height = mask_img.size
+     total_pixels = width * height
+     white_pixel_count = 0
+
+     # Count the white pixels in the mask image
+     for y in range(height):
+         for x in range(width):
+             mask_value = mask_img.getpixel((x, y))
+             if mask_value > 127:  # Treat as a white pixel
+                 white_pixel_count += 1
+
+     # Compute the ratio of white pixels
+     mask_area_ratio = (white_pixel_count / total_pixels) * 100
+
+     # Classify the mask size
+     if mask_area_ratio <= small_threshold:
+         size_category = 1  # Very small
+     elif mask_area_ratio <= medium_threshold:
+         size_category = 2  # Small
+     elif mask_area_ratio <= large_threshold:
+         size_category = 3  # Large
+     else:
+         size_category = 4  # Very large
+
+     return size_category
+
+ def analyze_mask_combined(original_image_path, mask_image_path, small_threshold, medium_threshold, large_threshold):
+     # Judge the mask size
+     size_category = classify_mask_size(mask_image_path, small_threshold, medium_threshold, large_threshold)
+
+     # Judge the brightness of the masked region
+     brightness_result = analyze_mask_brightness(original_image_path, mask_image_path)
+
+     # Print the results
+     size_text = {1: "very small", 2: "small", 3: "large", 4: "very large"}
+     print(f"Mask size: {size_text[size_category]} ({size_category})")
+     print(f"Mask brightness: {brightness_result}")
+     result = {
+         'size': size_category,
+         'brightness': brightness_result
+     }
+     return result
+
+ # The function below decides which objects to erase
+ def decide_to_object(risk_level):
+     '''
+     tex = [
+         'text', 'Name tag', 'License plate', 'Mail', 'Documents', 'QR codes',
+         'barcodes', 'Map', 'Digital screens', 'information board',
+         'signboard', 'poster', 'sign', 'utility pole'
+     ]
+     '''
+     tex = [
+         'text', 'License plate', 'Digital screens',
+         'signboard', 'poster', 'sign', 'logo', 'card', 'window', 'mirror',
+         'Famous landmark', 'cardboard', 'manhole', 'utility pole'
+     ]
+
+     # Reordering this list changes the order in which objects are erased.
+     risk_level = int(risk_level / 20) * (len(tex) / 10)  # Decide how many entries to keep (1/2)
+     return tex[:int(risk_level) + 1]
+
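As a quick illustration of the mapping above (a minimal standalone sketch, not part of the uploaded file): with len(tex) = 14, the number of erased classes grows stepwise with risk_level.

    # Standalone sketch of decide_to_object's slicing (assumes the 14-entry tex list above)
    for level in (0, 20, 50, 100):
        count = int(int(level / 20) * (14 / 10)) + 1
        print(level, count)  # 0 -> 1, 20 -> 2, 50 -> 3, 100 -> 8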
+ def create_mask(image, x1, y1, x2, y2):
+     # Create a black image with the same size as the input image
+     mask = np.zeros((image.shape[0], image.shape[1]), dtype=np.uint8)
+
+     # Draw a white rectangle on the mask where the object is located
+     cv2.rectangle(mask, (int(x1), int(y1)), (int(x2), int(y2)), 255, -1)
+
+     return mask
+
+ def special_process_image_yolo(risk_level, image_path, point1, point2, thresholds=None):
+     device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+     print(device)
+     # Load the YOLOv8 model and move it to the GPU
+     model = YOLO('./1026.pt')  # Path to the model weights
+     model.to(device)
+
+     # Create a timestamp
+     timestamp = datetime.now().strftime("%Y%m%d%H%M%S")
+
+     # Compute a decay factor from the risk level
+     def logistic_decay(risk_level, k=0.1, r0=50):
+         return 1 / (1 + np.exp(-k * (risk_level - r0)))
+
+     decay_factor = logistic_decay(risk_level)
+     adjusted_thresholds = {key: max(value - decay_factor + 0.8, 0.01) / 2 for key, value in thresholds.items()}
+
+     # Load the image and convert it to RGB (str() so pathlib.Path inputs also work)
+     image = cv2.imread(str(image_path))
+     image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+     image_np = np.array(image_rgb, dtype=np.uint8)
+
+     # Run inference
+     results = model(image_rgb)
+
+     # Initialize the mask image
+     mask = np.zeros((image_np.shape[0], image_np.shape[1]), dtype=np.uint8)
+
+     # Build the mask from each detection
+     for box in results[0].boxes:
+         x1, y1, x2, y2 = map(int, box.xyxy[0])  # Box coordinates
+         confidence = box.conf[0]
+         class_id = box.cls[0]
+         object_type = model.names[int(class_id)]
+
+         # Threshold for this class name
+         threshold = adjusted_thresholds.get(object_type, 0.5)
+
+         if confidence >= threshold:
+             mask[y1:y2, x1:x2] = 255  # Paint the box region white
+
+     # Convert the normalized points to absolute coordinates and blank that range
+     p1_x, p1_y = int(point1[0] * image_np.shape[1]), int(point1[1] * image_np.shape[0])
+     p2_x, p2_y = int(point2[0] * image_np.shape[1]), int(point2[1] * image_np.shape[0])
+     x_min, y_min = max(0, min(p1_x, p2_x)), max(0, min(p1_y, p2_y))
+     x_max, y_max = min(image_np.shape[1], max(p1_x, p2_x)), min(image_np.shape[0], max(p1_y, p2_y))
+     mask[y_min:y_max, x_min:x_max] = 0  # Paint the protected range black
+
+     # Draw a white rectangle for debugging
+     debug_image = image_np.copy()
+     cv2.rectangle(debug_image, (x_min, y_min), (x_max, y_max), (255, 255, 255), 2)
+
+     # Save the debug image and the mask image
+     debug_image_pil = Image.fromarray(debug_image)
+     debug_image_pil.save(f"./debug_image_with_rectangle_{timestamp}.jpg")
+
+     mask_image_pil = Image.fromarray(mask)
+     mask_image_pil.save(f"./final_mask_{timestamp}.jpg")
+
+     return f"./final_mask_{timestamp}.jpg"
+
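A quick sanity check of the threshold adjustment above (an illustrative sketch, not part of the uploaded file): logistic_decay(50) = 0.5, so at risk level 50 every per-class threshold becomes (base + 0.3) / 2, and higher risk levels push the thresholds lower, masking more classes.

    import numpy as np

    def logistic_decay(risk_level, k=0.1, r0=50):
        return 1 / (1 + np.exp(-k * (risk_level - r0)))

    base = {'text': 0.1, 'poster': 0.8}  # two of the per-class base thresholds
    for risk in (0, 50, 100):
        d = logistic_decay(risk)
        adjusted = {name: round(max(v - d + 0.8, 0.01) / 2, 3) for name, v in base.items()}
        print(risk, round(float(d), 3), adjusted)
    # risk 0 leaves thresholds high; risk 100 drives 'text' down to 0.005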
+ def convert_image_format(input_path, output_format="png"):
+     """
+     Convert an image from JPG to PNG or from PNG to JPG.
+
+     Parameters:
+     - input_path: path of the source image to convert
+     - output_format: output format ("png" or "jpg"; defaults to "png")
+
+     Returns:
+     - output_path: path of the converted image
+     """
+     # Check that the format is supported
+     if output_format not in ["png", "jpg", "jpeg"]:
+         raise ValueError("Supported output formats are 'png' and 'jpg'.")
+
+     # Load the image
+     image = cv2.imread(input_path)
+     if image is None:
+         raise ValueError(f"Image not found: {input_path}")
+
+     # Build the output path
+     base_name = os.path.splitext(os.path.basename(input_path))[0]
+     output_path = f"{base_name}.{output_format}"
+
+     # Save the image
+     if output_format == "png":
+         cv2.imwrite(output_path, image, [cv2.IMWRITE_PNG_COMPRESSION, 9])  # PNG at maximum compression
+     else:
+         cv2.imwrite(output_path, image, [cv2.IMWRITE_JPEG_QUALITY, 90])  # JPG at high quality
+
+     return output_path
+
+ # The function below uses OpenCV
+ def inpaint_image_with_mask(image_path, mask_path, output_path, inpaint_radius=5, inpaint_method=cv2.INPAINT_TELEA):
+     """
+     Inpaint the source image using a mask image.
+
+     Parameters:
+     - image_path: path of the source image
+     - mask_path: path of the mask image (regions to repair are white, the rest black)
+     - output_path: output path for the inpainted result
+     - inpaint_radius: inpainting radius (default 5)
+     - inpaint_method: inpainting algorithm (default cv2.INPAINT_TELEA)
+
+     Returns:
+     - output_path: path of the inpainted image
+     """
+     # Load the image and the mask (str() so pathlib.Path inputs also work)
+     image = cv2.imread(str(image_path))
+     mask = cv2.imread(str(mask_path), cv2.IMREAD_GRAYSCALE)  # Load the mask in grayscale
+
+     # Check that both loaded correctly
+     if image is None:
+         raise ValueError(f"Source image not found: {image_path}")
+     if mask is None:
+         raise ValueError(f"Mask image not found: {mask_path}")
+
+     # Resize the mask if it does not match the source image
+     if image.shape[:2] != mask.shape[:2]:
+         print(f"Resizing the mask to match the source image: {mask.shape} -> {image.shape[:2]}")
+         mask = cv2.resize(mask, (image.shape[1], image.shape[0]))
+
+     # Run the inpainting
+     inpainted_image = cv2.inpaint(image, mask, inpaint_radius, inpaint_method)
+
+     # Save the result
+     cv2.imwrite(str(output_path), inpainted_image)
+
+     return output_path
+
+ def stamp_image_with_mask(base_image_path, mask_path, output_path, stamp_image_path='./main.png'):
+     """
+     Embed another image into the source image using a mask.
+
+     Parameters:
+     - base_image_path: path of the source image
+     - mask_path: path of the mask image (regions to stamp are white, the rest black)
+     - output_path: output path for the result
+     - stamp_image_path: path of the stamp image to embed
+
+     Returns:
+     - output_path: path of the stamped image
+     """
+     # Load the images and the mask (str() so pathlib.Path inputs also work)
+     base_image = cv2.imread(str(base_image_path))
+     mask = cv2.imread(str(mask_path), cv2.IMREAD_GRAYSCALE)
+     embed_image = cv2.imread(str(stamp_image_path))
+
+     # Check that everything loaded correctly
+     if base_image is None:
+         raise ValueError(f"Source image not found: {base_image_path}")
+     if mask is None:
+         raise ValueError(f"Mask image not found: {mask_path}")
+     if embed_image is None:
+         raise ValueError(f"Stamp image not found: {stamp_image_path}")
+
+     # Resize the mask and the stamp image to the source image size
+     if base_image.shape[:2] != mask.shape[:2]:
+         print(f"Resizing the mask to match the source image: {mask.shape} -> {base_image.shape[:2]}")
+         mask = cv2.resize(mask, (base_image.shape[1], base_image.shape[0]))
+     if base_image.shape[:2] != embed_image.shape[:2]:
+         print(f"Resizing the stamp image to match the source image: {embed_image.shape[:2]} -> {base_image.shape[:2]}")
+         embed_image = cv2.resize(embed_image, (base_image.shape[1], base_image.shape[0]))
+
+     # Place the stamp image into the masked region
+     embedded_image = base_image.copy()
+     embedded_image[mask == 255] = embed_image[mask == 255]
+
+     # Save the result
+     cv2.imwrite(str(output_path), embedded_image)
+
+     return output_path
+
+ def inpaint_image_with_mask1(img_path, mask_path, output_path, resize_factor=0.5):
+     print('lama')
+
+     # Check whether a GPU is available
+     device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+
+     # Load the image and the mask
+     image = Image.open(img_path).convert("RGB")  # Convert the image to RGB
+     mask = Image.open(mask_path).convert('L')  # Convert the mask to grayscale
+
+     # Match the mask size to the image size
+     mask = mask.resize(image.size, Image.NEAREST)
+
+     # Blur the mask edges (Gaussian blur)
+     blurred_mask = mask.filter(ImageFilter.GaussianBlur(radius=3))  # 3-pixel blur radius
+
+     # Create a SimpleLama instance
+     simple_lama = SimpleLama()
+
+     # Convert the image and the mask to NumPy arrays
+     image_np = np.array(image)
+     mask_np = np.array(blurred_mask) / 255.0  # Scale the mask to the 0-1 range
+
+     # Pass the image and the mask to SimpleLama for inpainting
+     inpainted_np = simple_lama(image_np, mask_np)
+
+     # Convert the result back to a PIL image
+     result_image = Image.fromarray(np.uint8(inpainted_np))
+
+     # Resize the output image (LANCZOS replaces the deprecated ANTIALIAS alias)
+     new_size = (int(result_image.width * resize_factor), int(result_image.height * resize_factor))
+     result_image = result_image.resize(new_size, Image.LANCZOS)
+
+     # Save the result
+     result_image.save(output_path)
+     print(f"Inpainted image saved at {output_path}")
+     return output_path
+
+ # Directory where uploaded images are saved
+ SAVE_DIR = Path("./saved_images")
+ SAVE_DIR.mkdir(parents=True, exist_ok=True)
+
+ def save_image(file, filename):
+     """Save an image file into the save directory"""
+     filepath = SAVE_DIR / filename
+     with open(filepath, "wb") as buffer:
+         shutil.copyfileobj(file, buffer)
+     return filepath
+
+ @app.post("/create-mask-and-inpaint-opencv")
+ async def create_mask_and_inpaint_opencv(image: UploadFile = File(...), risk_level: int = Form(...)):
+     point1 = (0.00000000000002, 0.00000000000002)
+     point2 = (0.00000000000001, 0.00000000000001)
+     input_path = save_image(image.file, "input.jpg")
+     mask_path = special_process_image_yolo(risk_level, input_path, point1, point2, thresholds)
+
+     output_path = SAVE_DIR / "output_opencv.jpg"
+     # Inpaint with OpenCV
+     inpaint_image_with_mask(input_path, mask_path, output_path)
+
+     return FileResponse(output_path)
+
+ @app.post("/create-mask-and-inpaint-stamp")
+ async def create_mask_and_inpaint_stamp(image: UploadFile = File(...), risk_level: int = Form(...)):
+     point1 = (0.00000000000002, 0.00000000000002)
+     point2 = (0.00000000000001, 0.00000000000001)
+     input_path = save_image(image.file, "input.jpg")
+     mask_path = special_process_image_yolo(risk_level, input_path, point1, point2, thresholds)
+
+     output_path = SAVE_DIR / "output_opencv.jpg"
+     # Stamp over the masked region
+     stamp_image_with_mask(input_path, mask_path, output_path)
+
+     return FileResponse(output_path)
+
+ @app.post("/create-mask-and-inpaint-simple-lama")
+ async def create_mask_and_inpaint_simple_lama(image: UploadFile = File(...), risk_level: int = Form(...)):
+     input_path = save_image(image.file, "input.jpg")
+     point1 = (0.00000000000002, 0.00000000000002)
+     point2 = (0.00000000000001, 0.00000000000001)
+     mask_path = special_process_image_yolo(risk_level, input_path, point1, point2, thresholds)
+     output_path = SAVE_DIR / "output_simple_lama.jpg"
+     # Inpaint with SimpleLama
+     inpaint_image_with_mask1(input_path, mask_path, output_path, resize_factor=1)
+
+     return FileResponse(output_path)
+
+ # The endpoints below are the variant that does not mask specific regions
+
+ # DeepFillv2 would go below
+
+ # List of object classes targeted for vectorization
+ TEXT_PROMPTS = [
+     'text', 'Name tag', 'License plate', 'Mail', 'Documents', 'QR codes',
+     'barcodes', 'Map', 'Digital screens', 'information board',
+     'signboard', 'poster', 'sign', 'logo', 'card', 'window', 'mirror',
+     'Famous landmark', 'cardboard', 'manhole', 'utility pole'
+ ]
+ BOX_THRESHOLD = 0.3
+ TEXT_THRESHOLD = 0.3
+
+ # Load the clustering result from a JSON file
+ def load_sums_from_json(filepath):
+     with open(filepath, 'r') as json_file:
+         sums = json.load(json_file)
+     return sums
+
+ # Load the vector data from a JSON file
+ def load_vectors_from_json(filepath):
+     with open(filepath, 'r') as json_file:
+         data = json.load(json_file)
+     return data
+
+ # Classify a new image into one of the existing clusters
+ def classify_new_image(new_image_vector, sums_data, loaded_vectors, loaded_object_names, k=1):
+     cluster_centers = []
+     for cluster in sums_data:
+         cluster_vectors = np.array([loaded_vectors[obj_name] for obj_name in cluster])
+         cluster_center = np.mean(cluster_vectors, axis=0)
+         cluster_centers.append(cluster_center)
+
+     knn = KNeighborsClassifier(n_neighbors=k)
+     knn.fit(cluster_centers, range(len(cluster_centers)))
+
+     new_image_label = knn.predict([new_image_vector])
+     return new_image_label[0]
+
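To make the cluster assignment concrete, here is a small self-contained sketch of the same KNN-over-centroids idea, using made-up 3-dimensional vectors (the real vectors come from output_vectors.json and sums_data.json):

    import numpy as np
    from sklearn.neighbors import KNeighborsClassifier

    # Made-up object vectors (the real ones are YOLO confidence sums per class)
    vectors = {'a': np.array([1.0, 0.0, 0.0]), 'b': np.array([0.9, 0.1, 0.0]),
               'c': np.array([0.0, 1.0, 1.0])}
    clusters = [['a', 'b'], ['c']]  # same shape as sums_data.json

    centers = [np.mean([vectors[n] for n in cluster], axis=0) for cluster in clusters]
    knn = KNeighborsClassifier(n_neighbors=1)
    knn.fit(centers, range(len(centers)))
    print(knn.predict([[0.8, 0.2, 0.1]])[0])  # -> 0 (closest to the 'a'/'b' centroid)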
+ def process_image_vec(image_path):
+     # Check whether a GPU is available
+     device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+     print(device)
+     # Load the YOLOv8 model and move it to the GPU
+     model = YOLO('./1026.pt')  # Path to the model weights
+     model.to(device)
+
+     # Initialize the vector
+     object_vector = np.zeros(len(TEXT_PROMPTS))
+
+     # Load the image
+     image = cv2.imread(image_path)
+     image_rgb = cv2.cvtColor(image, cv2.COLOR_BGR2RGB)
+
+     # Run YOLO inference
+     results = model(image_rgb)
+
+     # Check every prompt
+     for i, text_prompt in enumerate(TEXT_PROMPTS):
+         prompt_sum = 0  # Total score for this prompt
+
+         for box in results[0].boxes:
+             class_id = int(box.cls[0])
+             confidence = box.conf[0]
+             detected_class = model.names[class_id]
+
+             # Compare the detected class name with the text prompt
+             if text_prompt.lower() == detected_class.lower():
+                 prompt_sum += confidence  # Add the confidence when the class matches
+
+         # Store the score in object_vector
+         object_vector[i] = prompt_sum
+
+     print(object_vector)
+     return object_vector.tolist()
+
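The vectorization above boils down to summing detection confidences per class name; a minimal sketch with hypothetical detections:

    # Hypothetical (class_name, confidence) detections standing in for YOLO output
    detections = [('text', 0.5), ('poster', 0.6), ('text', 0.25)]
    prompts = ['text', 'poster', 'sign']
    vector = [sum(c for name, c in detections if name.lower() == p.lower()) for p in prompts]
    print(vector)  # [0.75, 0.6, 0]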
+ # API endpoint
+ @app.post("/classify-image/")
+ async def classify_image(file: UploadFile = File(...)):
+     image_path = "./temp_image.jpg"
+
+     # Save the uploaded image
+     with open(image_path, "wb") as buffer:
+         buffer.write(await file.read())
+
+     # Vectorize the image
+     new_image_vector = process_image_vec(image_path)
+
+     # Load the data from the JSON file
+     json_filepath = "./output_vectors.json"
+     loaded_data = load_vectors_from_json(json_filepath)
+     loaded_vectors = {obj_name: np.array(vector) for obj_name, vector in loaded_data.items()}
+     loaded_object_names = list(loaded_vectors.keys())
+
+     # Load the existing clustering result
+     sums_data = load_sums_from_json("./sums_data.json")
+
+     # Decide which cluster the new image belongs to
+     new_image_cluster = classify_new_image(new_image_vector, sums_data, loaded_vectors, loaded_object_names)
+
+     return {"danger": dangerarray[int(new_image_cluster + 1)]}  # If this misbehaves, adjust the +1 offset here
+
+ @app.post("/create-mask-and-inpaint-simple-lama-special")
+ async def create_mask_and_inpaint_simple_lama_special(
+     image: UploadFile = File(...),
+     risk_level: int = Form(...),
+     x1: float = Form(...),
+     y1: float = Form(...),
+     x2: float = Form(...),
+     y2: float = Form(...),
+ ):
+     # Extract points from the form data
+     point1 = [x1, y1]
+     point2 = [x2, y2]
+
+     # Save the input image
+     input_path = save_image(image.file, "input.jpg")
+     print('points:', point1, point2)
+     # Create a mask image (using the new process_image function)
+     mask_path = special_process_image_yolo(risk_level, input_path, point1, point2, thresholds=thresholds)
+
+     # Define the output path for the inpainted image
+     output_path = "./output_simple_lama.jpg"
+
+     # Perform inpainting with SimpleLama
+     inpaint_image_with_mask1(input_path, mask_path, output_path, resize_factor=1)
+
+     # Return the resulting image as a response
+     return FileResponse(output_path, media_type="image/jpeg", filename="output_simple_lama.jpg")
+
+ def resize_mask_to_match(image_path, mask_path):
+     # Load the original image and the mask image
+     original_image = Image.open(image_path)
+     mask_image = Image.open(mask_path)
+
+     # Resize the mask to the original image size
+     resized_mask = mask_image.resize(original_image.size)
+
+     # Overwrite the mask image
+     resized_mask.save(mask_path)
+
+ @app.post("/create-mask-and-inpaint-sum")
+ async def create_mask_sum(image: UploadFile = File(...), risk_level: int = Form(...),
+     x1: float = Form(...),
+     y1: float = Form(...),
+     x2: float = Form(...),
+     y2: float = Form(...),
+ ):
+     default_x = 0.001
+     default_y = 0.001
+
+     point1 = [default_x if math.isnan(x1) else x1, default_y if math.isnan(y1) else y1]
+     point2 = [default_x if math.isnan(x2) else x2, default_y if math.isnan(y2) else y2]
+
+     input_path = save_image(image.file, "input.jpg")
+     mask_path = special_process_image_yolo(risk_level, input_path, point1, point2, thresholds=thresholds)
+     # Generate the current timestamp
+     timestamp = datetime.now().strftime("%Y%m%d_%H%M%S")
+     # Generate a unique identifier
+     unique_id = uuid.uuid4().hex
+     output_path = f"./output_simple_lama_{timestamp}_{unique_id}.jpg"
+
+     # Inpaint with SimpleLama
+     inpaint_image_with_mask1(input_path, mask_path, output_path)
+
+     return FileResponse(output_path)
+
+ @app.get("/", response_class=HTMLResponse)
+ async def read_root():
+     html_content = """
+     <!DOCTYPE html>
+     <html lang="en">
+     <head>
+         <meta charset="UTF-8">
+         <meta name="viewport" content="width=device-width, initial-scale=1.0">
+         <title>Image Processing App</title>
+         <!-- Bootstrap CSS -->
+         <link href="https://stackpath.bootstrapcdn.com/bootstrap/4.5.2/css/bootstrap.min.css" rel="stylesheet">
+         <!-- jQuery UI CSS -->
+         <link rel="stylesheet" href="https://code.jquery.com/ui/1.12.1/themes/base/jquery-ui.css">
+         <link href="https://cdnjs.cloudflare.com/ajax/libs/font-awesome/5.15.4/css/all.min.css" rel="stylesheet">
+         <style>
+             body {
+                 background-color: #f0f0f5;
+                 color: #333;
+                 text-align: center;
+                 padding: 40px 20px;
+             }
+             h1 {
+                 color: #555;
+                 margin-bottom: 30px;
+                 font-weight: bold;
+             }
+             .image-preview, .processed-preview {
+                 max-width: 100%;
+                 height: auto;
+                 border-radius: 10px;
+                 box-shadow: 0 4px 15px rgba(0, 0, 0, 0.2);
+                 margin-top: 20px;
+             }
+             #result {
+                 margin-top: 40px;
+                 display: none;
+             }
+             .slider-container {
+                 text-align: left;
+                 margin-top: 20px;
+             }
+             .slider-label {
+                 font-size: 1.2rem;
+                 color: #333;
+             }
+             #slider {
+                 margin-top: 10px;
+             }
+             .btn-primary {
+                 background-color: #007bff;
+                 border-color: #007bff;
+                 font-size: 1.2rem;
+                 padding: 10px 20px;
+                 border-radius: 50px;
+             }
+             .btn-primary:hover {
+                 background-color: #0056b3;
+                 border-color: #004085;
+             }
+             .form-control, .custom-select {
+                 border-radius: 20px;
+                 box-shadow: 0 2px 5px rgba(0, 0, 0, 0.1);
+             }
+             .form-control-file {
+                 font-size: 1rem;
+             }
+             .form-group {
+                 margin-bottom: 25px;
+             }
+             .btn-success {
+                 padding: 10px 20px;
+                 border-radius: 50px;
+             }
+         </style>
+     </head>
+     <body>
+         <div class="container">
+             <h1><i class="fas fa-image"></i> Image Processing App - Mosaic and Inpainting</h1>
+
+             <div class="form-group">
+                 <input type="file" id="uploadImage" class="form-control-file" accept="image/*" onchange="previewImage()">
+             </div>
+             <img id="uploadedImage" class="image-preview" src="#" alt="Uploaded image" style="display: none;">
+
+             <div class="form-group mt-4">
+                 <label for="processingType">Select a processing method:</label>
+                 <select id="processingType" class="custom-select">
+                     <option value="opencv">OpenCV inpainting</option>
+                     <option value="simple_lama">Simple Lama inpainting</option>
+                     <option value="stable_diffusion">Stable Diffusion inpainting</option>
+                     <option value="deep_fill_v2">DeepFillv2 inpainting</option>
+                 </select>
+             </div>
+
+             <div class="slider-container">
+                 <label for="riskLevel" class="slider-label">Risk level (0-100): <span id="riskLevelLabel">50</span></label>
+                 <div id="slider"></div>
+             </div>
+
+             <button class="btn btn-primary mt-4" onclick="processImage()">Start processing</button>
+
+             <div id="result" class="mt-5">
+                 <h2>Result:</h2>
+                 <img id="processedImage" class="processed-preview" src="" alt="">
+                 <a id="downloadLink" class="btn btn-success mt-3" href="#" download="processed_image.jpg">Download processed image</a>
+             </div>
+         </div>
+
+         <!-- jQuery and Bootstrap JS -->
+         <script src="https://code.jquery.com/jquery-3.5.1.min.js"></script>
+         <script src="https://stackpath.bootstrapcdn.com/bootstrap/4.5.2/js/bootstrap.min.js"></script>
+         <!-- jQuery UI -->
+         <script src="https://code.jquery.com/ui/1.12.1/jquery-ui.js"></script>
+
+         <script>
+             $(function() {
+                 // Configure the slider
+                 $("#slider").slider({
+                     range: "min",
+                     value: 50, // Initial value
+                     min: 0,
+                     max: 100,
+                     slide: function(event, ui) {
+                         $("#riskLevelLabel").text(ui.value);
+                     }
+                 });
+             });
+
+             function previewImage() {
+                 const fileInput = document.getElementById('uploadImage');
+                 const uploadedImage = document.getElementById('uploadedImage');
+
+                 if (fileInput.files && fileInput.files[0]) {
+                     const reader = new FileReader();
+                     reader.onload = function (e) {
+                         uploadedImage.src = e.target.result;
+                         uploadedImage.style.display = 'block';
+                     };
+                     reader.readAsDataURL(fileInput.files[0]);
+                 }
+             }
+
+             function processImage() {
+                 const fileInput = document.getElementById('uploadImage');
+                 const processingType = document.getElementById('processingType').value;
+                 const riskLevel = $("#slider").slider("value"); // Read the value from the slider
+                 const resultDiv = document.getElementById('result');
+                 const processedImage = document.getElementById('processedImage');
+                 const downloadLink = document.getElementById('downloadLink');
+
+                 if (fileInput.files.length === 0) {
+                     alert("Please select an image.");
+                     return;
+                 }
+
+                 const file = fileInput.files[0];
+                 const formData = new FormData();
+                 formData.append('image', file);
+                 formData.append('risk_level', riskLevel); // Add the risk level
+
+                 let apiEndpoint;
+                 if (processingType === "opencv") {
+                     apiEndpoint = "/create-mask-and-inpaint-opencv";
+                 } else if (processingType === "simple_lama") {
+                     apiEndpoint = "/create-mask-and-inpaint-simple-lama";
+                 } else if (processingType === "stable_diffusion") {
+                     apiEndpoint = "/create-mask-and-inpaint-stable-diffusion";
+                 } else if (processingType === "deep_fill_v2") {
+                     apiEndpoint = "/create-mask-and-inpaint-deepfillv2";
+                 }
+
+                 const url = "https://wired-kitten-adequately.ngrok-free.app" + apiEndpoint;
+
+                 fetch(url, {
+                     method: 'POST',
+                     body: formData
+                 })
+                 .then(response => {
+                     if (!response.ok) {
+                         throw new Error("Network response was not ok");
+                     }
+                     return response.blob();
+                 })
+                 .then(blob => {
+                     const objectURL = URL.createObjectURL(blob);
+                     processedImage.src = objectURL;
+                     downloadLink.href = objectURL;
+                     resultDiv.style.display = "block";
+                 })
+                 .catch(error => {
+                     console.error("Image processing failed.", error);
+                     alert("Image processing failed.");
+                 });
+             }
+         </script>
+     </body>
+     </html>
+     """
+     return HTMLResponse(content=html_content)
+ if __name__ == "__main__":
+     # FastAPI apps have no app.run(); launch through uvicorn instead
+     uvicorn.run(app, host="0.0.0.0", port=7860)
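For reference, a minimal client sketch (not part of the uploaded files) that exercises the API with the requests library, assuming the server is reachable on localhost:7860 and using a placeholder input file photo.jpg:

    import requests

    BASE = "http://localhost:7860"  # adjust to the deployed Space URL if needed

    # Classify an image into a danger level
    with open("photo.jpg", "rb") as f:
        r = requests.post(f"{BASE}/classify-image/", files={"file": f})
    print(r.json())  # e.g. {"danger": 30}

    # Mask and inpaint the same image with SimpleLama
    with open("photo.jpg", "rb") as f:
        r = requests.post(f"{BASE}/create-mask-and-inpaint-simple-lama",
                          files={"image": f}, data={"risk_level": 50})
    with open("inpainted.jpg", "wb") as out:
        out.write(r.content)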
main.png ADDED
output_vectors.json ADDED
The diff for this file is too large to render. See raw diff
 
requirements.txt ADDED
@@ -0,0 +1,72 @@
+ annotated-types==0.7.0
+ anyio==4.6.2.post1
+ certifi==2024.8.30
+ charset-normalizer==3.4.0
+ click==8.1.7
+ colorama==0.4.6
+ contourpy==1.3.0
+ cycler==0.12.1
+ diffusers==0.31.0
+ fastapi==0.115.4
+ filelock==3.16.1
+ fire==0.5.0
+ fonttools==4.54.1
+ fsspec==2024.10.0
+ futures==3.0.5
+ h11==0.14.0
+ huggingface-hub==0.26.2
+ idna==3.10
+ importlib_metadata==8.5.0
+ Jinja2==3.1.4
+ joblib==1.4.2
+ kiwisolver==1.4.7
+ MarkupSafe==3.0.2
+ matplotlib==3.9.2
+ mpmath==1.3.0
+ nest-asyncio==1.6.0
+ networkx==3.4.2
+ numpy==1.26.4
+ opencv-python==4.10.0.84
+ opencv-python-headless==4.10.0.84
+ packaging==24.1
+ pandas==2.2.3
+ Pillow==9.5.0
+ psutil==6.1.0
+ py-cpuinfo==9.0.0
+ pycocotools==2.0.8
+ pydantic==2.9.2
+ pydantic_core==2.23.4
+ pyngrok==7.2.1
+ pyparsing==3.2.0
+ python-dateutil==2.9.0.post0
+ python-multipart==0.0.17
+ pytz==2024.2
+ PyYAML==6.0.2
+ regex==2024.9.11
+ requests==2.32.3
+ safetensors==0.4.5
+ scikit-learn==1.5.2
+ scipy==1.14.1
+ seaborn==0.13.2
+ setuptools==75.3.0
+ simple-lama-inpainting==0.1.2
+ six==1.16.0
+ sniffio==1.3.1
+ starlette==0.41.2
+ supervision==0.9.0
+ sympy==1.13.1
+ termcolor==2.5.0
+ threadpoolctl==3.5.0
+ tokenizers==0.20.3
+ torch==2.5.1
+ torchvision==0.20.1
+ tqdm==4.66.6
+ transformers==4.46.2
+ typing_extensions==4.12.2
+ tzdata==2024.2
+ ultralytics==8.3.23
+ ultralytics-thop==2.0.10
+ urllib3==2.2.3
+ uvicorn==0.32.0
+ zipp==3.20.2
sums_data.json ADDED
The diff for this file is too large to render. See raw diff