classification-garbage

Build error

App Files Files Community

Jerry75AI committed 6 days ago

Commit

5fea29a

verified ·

1 Parent(s): 18742db

Upload 2 files

Browse files

Files changed (2) hide show

app.py +84 -57
requirements.txt +1 -1

app.py CHANGED Viewed

@@ -1,86 +1,113 @@
-import gradio as gr
-import numpy as np
-from PIL import Image
-import tensorflow as tf
-from typing import List, Dict, Any
 import io
-# Labels must mirror src/classification-model/index.ts
-LABELS: List[str] = [
-    "battery",
-    "biological",
-    "brown-glass",
-    "cardboard",
-    "clothes",
-    "green-glass",
-    "metal",
-    "paper",
-    "plastic",
-    "shoes",
-    "trash",
-    "white-glass",
 ]
-def _load_image_to_rgb(image: Image.Image) -> np.ndarray:
     if image.mode != "RGB":
         image = image.convert("RGB")
-    return np.asarray(image)
-def _resize_224(img_rgb: np.ndarray) -> np.ndarray:
-    im = Image.fromarray(img_rgb)
-    im = im.resize((224, 224), Image.NEAREST)
-    return np.asarray(im)
-def _preprocess(image: Image.Image) -> np.ndarray:
-    rgb = _load_image_to_rgb(image)
-    rgb224 = _resize_224(rgb)
-    # shape [1,224,224,3], float32 in 0..255
-    arr = rgb224.astype("float32")
-    return np.expand_dims(arr, axis=0)
 class PreTrainedModel:
-    def __init__(self, model_path: str = "model/model_resnet50.keras") -> None:
-        self.model = tf.keras.models.load_model(model_path)
     def predict_image(self, image: Image.Image) -> Dict[str, float]:
-        x = _preprocess(image)
         preds = self.model.predict(x)
         if isinstance(preds, (list, tuple)):
             preds = preds[0]
         probs = np.asarray(preds).squeeze().tolist()
         return {label: score for label, score in zip(LABELS, probs)}
 model = PreTrainedModel()
 def predict(image):
     predictions = model.predict_image(image)
-    probs_percent = {label: round(p * 100, 2)
-                     for label, p in predictions.items()}
-    max_label = max(probs_percent, key=probs_percent.get)
-    return {
-        "label": max_label,
-        "percentage": probs_percent[max_label],
-        "probabilities": probs_percent,
-    }
-iface = gr.Interface(
-    fn=predict,
-    inputs=gr.Image(type="pil"),
-    outputs=gr.JSON(),
-    title="Waste Classification",
-    description="Upload an image of waste to classify it.",
-)
 if __name__ == "__main__":
-    iface.launch()

 import io
+from typing import Dict
+import numpy as np
+import tensorflow as tf
+from PIL import Image
+from bustapi import BustAPI, Request, Response
+LABELS = [
+    "battery",        # 电池
+    "biological",     # 生物垃圾/厨余垃圾
+    "brown-glass",    # 棕色玻璃
+    "cardboard",      # 纸板
+    "clothes",        # 衣物
+    "green-glass",    # 绿色玻璃
+    "metal",          # 金属
+    "paper",          # 纸张
+    "plastic",        # 塑料
+    "shoes",          # 鞋子
+    "trash",          # 其他垃圾
+    "white-glass",    # 白色玻璃
 ]
+MODEL_PATH = "model/model_resnet50.keras"
+def preprocess(image: Image.Image) -> np.ndarray:
+    """
+    完整的图像预处理流程，将输入图像转换为模型可接受的格式
+    image: PIL Image 对象，输入的原始图像
+    返回: 预处理后的图像数组，形状为 [1, 224, 224, 3]，数据类型为 float32，像素值范围 0-255
+    """
+    # 检查图像模式是否为 RGB，如果不是则进行转换
     if image.mode != "RGB":
         image = image.convert("RGB")
+    # 使用最近邻插值法将图像调整为 224x224 像素
+    # 224x224 是 ResNet50 模型的标准输入尺寸
+    image = image.resize((224, 224), Image.NEAREST)
+    # 将调整后的 PIL Image 转换回 NumPy 数组
+    # 形状为 [1, 224, 224, 3]，数据类型为 float32，像素值范围 0-255
+    # 再将图像数据类型转换为 float32，以便进行后续计算
+    rgb224 = np.asarray(image).astype("float32")
+    # 在第一个维度（批次维度）上扩展数组，使其形状变为 [1, 224, 224, 3]
+    # 这是为了匹配深度学习模型期望的输入格式（批次大小, 高度, 宽度, 通道数）
+    return np.expand_dims(rgb224, axis=0)
 class PreTrainedModel:
+    """
+    预训练模型包装类，用于加载和运行垃圾分类模型
+    """
+    def __init__(self) -> None:
+        """
+        初始化预训练模型
+        """
+        self.model = tf.keras.models.load_model(MODEL_PATH)
     def predict_image(self, image: Image.Image) -> Dict[str, float]:
+        """
+        对输入图像进行分类预测
+        image: PIL Image 对象，待分类的图像
+        返回: 包含每个标签及其对应预测概率的字典
+        """
+        # 对输入图像进行预处理，转换为模型可接受的格式
+        x = preprocess(image)
+        # 使用模型进行预测，返回预测结果
         preds = self.model.predict(x)
+        # 如果预测结果是列表或元组（某些模型会返回多个输出），取第一个输出
         if isinstance(preds, (list, tuple)):
             preds = preds[0]
+        # 将预测结果转换为 NumPy 数组，去除多余的维度，并转换为 Python 列表
         probs = np.asarray(preds).squeeze().tolist()
+        # 将标签与对应的预测概率组合成字典返回
         return {label: score for label, score in zip(LABELS, probs)}
+# 创建全局模型实例，程序启动时加载模型
+# 这样做可以避免每次预测时重复加载模型，提高响应速度
 model = PreTrainedModel()
 def predict(image):
+    """
+    预测函数，用于 Gradio 接口调用
+    image: 输入图像
+    返回: 包含预测标签、置信度和所有类别概率的字典
+    """
+    # 调用模型进行预测，获取每个类别的概率
     predictions = model.predict_image(image)
+    # 找出概率最高的类别作为预测结果
+    max_label = max(predictions, key=predictions.get)
+    return max_label
+# 创建服务器
+app = BustAPI()
+@app.post("/predict")
+async def predict_api(req: Request):
+    # 读取 POST 二进制流
+    img_bytes = await req.body()
+    # 转 PIL Image
+    image = Image.open(io.BytesIO(img_bytes)).convert("RGB")
+    # 推理
+    label = predict(image)
+    return Response.json({
+        "label": label
+    })
+@app.get("/")
+async def home():
+    return "POST /predict"
 if __name__ == "__main__":
+    app.run(host="0.0.0.0", port=8000)

requirements.txt CHANGED Viewed

@@ -2,4 +2,4 @@ tensorflow==2.16.1
 numpy
 Pillow
 requests
-gradio

 numpy
 Pillow
 requests
+bustapi