classification-garbage1

Sleeping

App Files Files Community

Jerry75AI committed 6 days ago

Commit

1f0055e

verified ·

1 Parent(s): 18742db

Upload 4 files

Browse files

Files changed (4) hide show

Dockerfile +25 -0
README.md +6 -11
app.py +96 -57
requirements.txt +1 -1

Dockerfile ADDED Viewed

	@@ -0,0 +1,25 @@

+FROM tensorflow/tensorflow:2.16.1-jupyter
+WORKDIR /app
+# Install system dependencies (compilers and headers for building Python packages)
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential gfortran libblas-dev liblapack-dev \
+    libffi-dev libssl-dev libbz2-dev liblzma-dev zlib1g-dev \
+    libncurses5-dev libncursesw5-dev libreadline-dev curl git \
+    && rm -rf /var/lib/apt/lists/*
+# Copy requirements first so the dependency layer is cached across source changes
+COPY requirements.txt .
+# Install the Python dependencies listed in requirements.txt
+RUN pip install --no-cache-dir -r requirements.txt
+# Copy app source
+COPY . .
+# Port Hugging Face Spaces routes traffic to by default; app.py must listen on it
+EXPOSE 7860
+# Run the Robyn API server
+CMD ["python", "app.py"]

README.md CHANGED Viewed

@@ -1,14 +1,9 @@
 ---
-title: Classification Garbage
-emoji: 📚
-colorFrom: gray
-colorTo: yellow
-sdk: gradio
-sdk_version: 5.48.0
-app_file: app.py
 pinned: false
 ---
-# HF Model: Classification
-This folder contains files to load a Keras (.keras) image classification model on Hugging Face Inference.

 ---
+title: gcai
+emoji: 🌍
+colorFrom: yellow
+colorTo: indigo
+sdk: docker
 pinned: false
+license: mit
 ---

app.py CHANGED Viewed

@@ -1,86 +1,125 @@
-import gradio as gr
-import numpy as np
-from PIL import Image
-import tensorflow as tf
-from typing import List, Dict, Any
 import io
-# Labels must mirror src/classification-model/index.ts
-LABELS: List[str] = [
-    "battery",
-    "biological",
-    "brown-glass",
-    "cardboard",
-    "clothes",
-    "green-glass",
-    "metal",
-    "paper",
-    "plastic",
-    "shoes",
-    "trash",
-    "white-glass",
 ]
-def _load_image_to_rgb(image: Image.Image) -> np.ndarray:
     if image.mode != "RGB":
         image = image.convert("RGB")
-    return np.asarray(image)
-def _resize_224(img_rgb: np.ndarray) -> np.ndarray:
-    im = Image.fromarray(img_rgb)
-    im = im.resize((224, 224), Image.NEAREST)
-    return np.asarray(im)
-def _preprocess(image: Image.Image) -> np.ndarray:
-    rgb = _load_image_to_rgb(image)
-    rgb224 = _resize_224(rgb)
-    # shape [1,224,224,3], float32 in 0..255
-    arr = rgb224.astype("float32")
-    return np.expand_dims(arr, axis=0)
 class PreTrainedModel:
-    def __init__(self, model_path: str = "model/model_resnet50.keras") -> None:
-        self.model = tf.keras.models.load_model(model_path)
     def predict_image(self, image: Image.Image) -> Dict[str, float]:
-        x = _preprocess(image)
         preds = self.model.predict(x)
         if isinstance(preds, (list, tuple)):
             preds = preds[0]
         probs = np.asarray(preds).squeeze().tolist()
         return {label: score for label, score in zip(LABELS, probs)}
 model = PreTrainedModel()
 def predict(image):
     predictions = model.predict_image(image)
-    probs_percent = {label: round(p * 100, 2)
-                     for label, p in predictions.items()}
-    max_label = max(probs_percent, key=probs_percent.get)
-    return {
-        "label": max_label,
-        "percentage": probs_percent[max_label],
-        "probabilities": probs_percent,
-    }
-iface = gr.Interface(
-    fn=predict,
-    inputs=gr.Image(type="pil"),
-    outputs=gr.JSON(),
-    title="Waste Classification",
-    description="Upload an image of waste to classify it.",
-)
 if __name__ == "__main__":
-    iface.launch()

 import io
+import json
+from typing import Dict
+import numpy as np
+import tensorflow as tf
+from PIL import Image, UnidentifiedImageError
+from robyn import Robyn, Request, Response
+# Class names; predict_image pairs them positionally with the model's output scores
+LABELS = [
+    "battery",        # batteries
+    "biological",     # biological / kitchen waste
+    "brown-glass",    # brown glass
+    "cardboard",      # cardboard
+    "clothes",        # clothing
+    "green-glass",    # green glass
+    "metal",          # metal
+    "paper",          # paper
+    "plastic",        # plastic
+    "shoes",          # shoes
+    "trash",          # other / residual waste
+    "white-glass",    # white glass
 ]
+# Path of the Keras model file loaded when PreTrainedModel is constructed
+MODEL_PATH = "model/model_resnet50.keras"
+def preprocess(image: Image.Image) -> np.ndarray:
+    """
+    Convert an input image into the array format fed to the model.
+    image: PIL Image object, the raw input image
+    Returns: float32 array of shape [1, 224, 224, 3] with pixel values in 0-255
+    """
+    # Convert to RGB when the image is in any other mode
     if image.mode != "RGB":
         image = image.convert("RGB")
+    # Resize to 224x224 pixels using nearest-neighbour interpolation
+    # (224x224 is the standard ResNet50 input size)
+    image = image.resize((224, 224), Image.NEAREST)
+    # Turn the PIL image into a NumPy array of shape [224, 224, 3] and cast it
+    # to float32; values are not rescaled, so they stay in the 0-255 range
+    rgb224 = np.asarray(image).astype("float32")
+    # Add a leading batch axis so the shape becomes [1, 224, 224, 3]
+    # (batch size, height, width, channels), as the model expects
+    return np.expand_dims(rgb224, axis=0)
 class PreTrainedModel:
+    """
+    Wrapper that loads the pretrained waste-classification model and runs it.
+    """
+    def __init__(self) -> None:
+        """
+        Load the Keras model from MODEL_PATH.
+        """
+        self.model = tf.keras.models.load_model(MODEL_PATH)
     def predict_image(self, image: Image.Image) -> Dict[str, float]:
+        """
+        Classify an input image.
+        image: PIL Image object to classify
+        Returns: dict mapping each label in LABELS to its predicted score
+        """
+        # Preprocess the image into the model's input format
+        x = preprocess(image)
+        # Run inference on the single-image batch
         preds = self.model.predict(x)
+        # Some models return several outputs as a list/tuple; keep the first one
         if isinstance(preds, (list, tuple)):
             preds = preds[0]
+        # Drop size-1 dimensions and convert the scores to a plain Python list
         probs = np.asarray(preds).squeeze().tolist()
+        # Pair each label with its score, by position
         return {label: score for label, score in zip(LABELS, probs)}
+# Create one global model instance so the model is loaded once at startup
+# rather than on every prediction, which keeps request latency down
 model = PreTrainedModel()
 def predict(image):
+    """
+    Return the most likely waste category for an image.
+    image: input image, passed straight to model.predict_image
+    Returns: the label whose predicted score is highest
+    """
+    # Run the model to get a score for every label
     predictions = model.predict_image(image)
+    # Pick the label with the highest score as the prediction
+    max_label = max(predictions, key=predictions.get)
+    return max_label
+# Create the Robyn server application
+app = Robyn(__file__)
+@app.post("/predict")
+def predict_route(request: Request):
+    try:
+        # 读取 POST 二进制流
+        raw = request.body
+        if raw is None or len(raw) == 0:
+            return {"error": "empty request body"}, 400
+        # Robyn 的 request.body 可能是 str 或 bytes；
+        # 发图片二进制时通常会是 bytes。
+        if isinstance(raw, str):
+            raw = raw.encode("latin1")
+        image = Image.open(io.BytesIO(raw)).convert("RGB")
+        label = predict(image)
+        return label
+    except UnidentifiedImageError:
+        return {"error": "invalid image bytes"}, 400
+    except Exception as e:
+        return {"error": str(e)}, 500
+@app.get("/")
+def home():
+    return "POST /predict"
 if __name__ == "__main__":
+    app.start(host="0.0.0.0", port=8080)

requirements.txt CHANGED Viewed

@@ -2,4 +2,4 @@ tensorflow==2.16.1
 numpy
 Pillow
 requests
-gradio

 numpy
 Pillow
 requests
+robyn