Spaces:

hongyu12321
/

RedFish

Sleeping

App Files Files Community

hongyu12321 committed on Sep 13

Commit

8fc4073

verified ·

1 Parent(s): aca8858

Update app.py

Browse files

Files changed (1) hide show

app.py +170 -40

app.py CHANGED Viewed

@@ -1,40 +1,170 @@
-# app.py
-import os
-os.environ["TRANSFORMERS_NO_TF"] = "1"
-os.environ["TRANSFORMERS_NO_FLAX"] = "1"
-os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
-import gradio as gr
-from PIL import Image
-from hf_model import PretrainedAgeEstimator
-est = PretrainedAgeEstimator()
-def predict(img):
-    # Gradio may pass PIL or numpy; handle both
-    if not isinstance(img, Image.Image):
-        img = Image.fromarray(img)
-    age, top = est.predict(img, topk=5)
-    # 1) dict[str, float] for Label
-    probs = {lbl: float(prob) for lbl, prob in top}
-    # 2) plain string for the estimate
-    summary = f"Estimated age: **{age:.1f}** years"
-    return probs, summary
-demo = gr.Interface(
-    fn=predict,
-    inputs=gr.Image(type="pil", label="Upload a face image"),
-    outputs=[
-        gr.Label(num_top_classes=5, label="Age Prediction (probabilities)"),
-        gr.Markdown(label="Summary"),
-    ],
-    title="Pretrained Age Estimator",
-    description="Runs a pretrained ViT-based age classifier and reports a point estimate from class probabilities."
-)
-if __name__ == "__main__":
-    demo.launch(share=True)

+# app.py
+import os
+os.environ["TRANSFORMERS_NO_TF"] = "1"
+os.environ["TRANSFORMERS_NO_FLAX"] = "1"
+os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
+import gradio as gr
+from PIL import Image
+import numpy as np
+import torch
+from hf_model import PretrainedAgeEstimator
+from face_utils import FaceCropper
+# NEW: diffusers for cartoonizer
+from diffusers import StableDiffusionImg2ImgPipeline
+# ---------- Load models once ----------
+# Age estimator and face cropper; the cropper is placed on the estimator's device.
+est = PretrainedAgeEstimator()
+cropper = FaceCropper(device=est.device)
+# Stable Diffusion 1.5 checkpoint used by the img2img cartoonizer.
+SD15_ID = "runwayml/stable-diffusion-v1-5"
+# Half precision when CUDA is available, full precision otherwise.
+if torch.cuda.is_available():
+    _sd_dtype = torch.float16
+else:
+    _sd_dtype = torch.float32
+sd_pipe = StableDiffusionImg2ImgPipeline.from_pretrained(
+    SD15_ID,
+    torch_dtype=_sd_dtype,
+    safety_checker=None,  # the pipeline's built-in safety checker is disabled
+)
+# Move the pipeline to the same device the age estimator uses.
+sd_pipe = sd_pipe.to(est.device)
+# ---------- Helpers ----------
+def _ensure_pil(img):
+    """Return img unchanged when it is a PIL image, else build one via Image.fromarray."""
+    return img if isinstance(img, Image.Image) else Image.fromarray(img)
+# ----- Age: single image -----
+def predict_single(img, auto_crop=True, topk=5, show_annot=True):
+    """
+    Estimate the age for one image.
+    img: PIL image or numpy array; None short-circuits with an empty result
+    auto_crop: run the face cropper and predict on the largest face when one is returned
+    topk: number of top classes requested from the estimator
+    show_annot: when cropping, preview the cropper's annotated image instead of the input
+    Returns (label -> probability dict, markdown summary, preview image).
+    """
+    if img is None:
+        return {}, "No image provided.", None
+    rgb = _ensure_pil(img).convert("RGB")
+    # Both the preview and the prediction input default to the full image.
+    shown = rgb
+    region = rgb
+    if auto_crop:
+        cropped, boxed, _ = cropper.detect_and_crop(rgb, select="largest")
+        if show_annot:
+            shown = boxed
+        if cropped is not None:
+            region = cropped
+    age, ranked = est.predict(region, topk=topk)
+    probs = {}
+    for lbl, prob in ranked:
+        probs[lbl] = float(prob)
+    return probs, f"**Estimated age:** {age:.1f} years", shown
+# ----- Age: batch -----
+def predict_batch(files, auto_crop=True, topk=5):
+    """
+    Estimate ages for several uploaded images and render a markdown table.
+    files: uploaded entries; each is either an object exposing a .name path or a plain path string
+    auto_crop: run the face cropper and predict on the largest face when one is returned
+    topk: number of top classes requested from the estimator
+    Returns a markdown table with one row per file, or "No files uploaded." when files is empty.
+    A file that fails to load or predict gets an "(error)" row instead of aborting the batch.
+    """
+    if not files:
+        return "No files uploaded."
+    rows = ["| File | Estimated Age | Top-1 | p |", "|---|---:|---|---:|"]
+    for f in files:
+        # Resolve the path outside the try so the error row can always be built,
+        # whether the entry is a file-like object with .name or a plain path string.
+        path = getattr(f, "name", f)
+        shown_name = os.path.basename(str(path))
+        try:
+            # The context manager closes the underlying file handle; convert()
+            # returns an independent in-memory copy that outlives it.
+            with Image.open(path) as opened:
+                img = opened.convert("RGB")
+            face = None
+            if auto_crop:
+                face, _, _ = cropper.detect_and_crop(img, select="largest")
+            target = face if face is not None else img
+            age, top = est.predict(target, topk=topk)
+            top1_lbl, top1_p = top[0]
+            rows.append(f"| {shown_name} | {age:.1f} | {top1_lbl} | {top1_p:.3f} |")
+        except Exception:
+            # Deliberate best-effort: one bad file must not fail the whole batch.
+            rows.append(f"| {shown_name} | (error) | - | - |")
+    return "\n".join(rows)
+# ----- NEW: Cartoonizer (img2img) -----
+def cartoonize(img, prompt, strength=0.6, guidance=7.5, steps=25, seed=0, use_face_crop=True):
+    """
+    Stylize an image as a cartoon with the img2img diffusion pipeline.
+    img: PIL or numpy; None returns None
+    prompt: text description appended to the built-in cartoon prompt,
+        e.g. "cute cel-shaded cartoon, soft outlines, vibrant colors";
+        None or empty uses the built-in prompt alone
+    strength: how much to deviate from the input (0.3 subtle → 0.8 strong)
+    guidance: prompt strength (5–12 typical)
+    steps: diffusion steps (20–40 typical)
+    seed: positive value seeds the generator for reproducibility;
+        0, a negative value or None leaves the generator unset (random)
+    use_face_crop: crop to the largest detected face before stylizing
+    Returns the first image produced by the pipeline.
+    """
+    if img is None:
+        return None
+    img = _ensure_pil(img).convert("RGB")
+    # optional crop to the largest face; keep the full image when no face comes back
+    if use_face_crop:
+        face, _, _ = cropper.detect_and_crop(img, select="largest")
+        if face is not None:
+            img = face
+    # cartoon-y defaults (you can tweak in UI)
+    base_prompt = (
+        "cartoon, cel-shaded, clean lineart, smooth shading, high contrast, vibrant, studio ghibli style, "
+        "pixar style, highly detailed, 2D illustration"
+    )
+    # A missing prompt must not be formatted as the literal text "None".
+    extra = "" if prompt is None else prompt
+    # The trailing strips remove the dangling ", " left behind by an empty prompt.
+    full_prompt = f"{base_prompt}, {extra}".strip().strip(",")
+    generator = None
+    # Only strictly positive seeds are honoured; 0 and negatives mean "random".
+    if seed is not None and seed > 0:
+        generator = torch.Generator(device=est.device).manual_seed(int(seed))
+    out = sd_pipe(
+        prompt=full_prompt,
+        image=img,
+        strength=float(strength),
+        guidance_scale=float(guidance),
+        num_inference_steps=int(steps),
+        generator=generator,
+    )
+    return out.images[0]
+# ---------- UI ----------
+# Three-tab UI: single-image age prediction, batch age prediction, cartoonizer.
+with gr.Blocks(title="Pretrained Age Estimator + Cartoonizer") as demo:
+    gr.Markdown("# Pretrained Age Estimator + Cartoonizer")
+    gr.Markdown("Detects age from a face and can also generate a cartoonized image guided by your text description.")
+    with gr.Tabs():
+        with gr.Tab("Age (Single)"):
+            with gr.Row():
+                with gr.Column():
+                    inp = gr.Image(type="pil", label="Upload a face image")
+                    cam = gr.Image(sources=["webcam"], type="pil", label="Webcam (optional)")
+                    auto = gr.Checkbox(True, label="Auto face crop (MTCNN)")
+                    topk = gr.Slider(3, 9, value=5, step=1, label="Top-K age ranges")
+                    annot = gr.Checkbox(True, label="Show detection preview")
+                    btn = gr.Button("Predict Age", variant="primary")
+                with gr.Column():
+                    # num_top_classes matches the Top-K slider maximum so that
+                    # selecting more than 5 ranges is actually displayed.
+                    out_label = gr.Label(num_top_classes=9, label="Age Prediction (probabilities)")
+                    out_md = gr.Markdown(label="Summary")
+                    out_prev = gr.Image(label="Preview", visible=True)
+            def run_single(img, cam_img, auto_crop, topk_val, show_annot):
+                """Predict on the webcam capture when present, otherwise on the uploaded image."""
+                chosen = cam_img if cam_img is not None else img
+                return predict_single(chosen, auto_crop, int(topk_val), show_annot)
+            btn.click(fn=run_single, inputs=[inp, cam, auto, topk, annot],
+                      outputs=[out_label, out_md, out_prev])
+        with gr.Tab("Age (Batch)"):
+            files = gr.Files(label="Upload multiple images")
+            auto_b = gr.Checkbox(True, label="Auto face crop (MTCNN)")
+            topk_b = gr.Slider(3, 9, value=5, step=1, label="Top-K age ranges")
+            btn_b = gr.Button("Run batch")
+            out_table = gr.Markdown()
+            btn_b.click(fn=predict_batch, inputs=[files, auto_b, topk_b], outputs=out_table)
+        with gr.Tab("Cartoonizer"):
+            src = gr.Image(type="pil", label="Source image (face or any photo)")
+            prompt = gr.Textbox(label="Your style prompt",
+                                value="cute cel-shaded cartoon, clean lines, soft colors")
+            with gr.Row():
+                strength = gr.Slider(0.2, 0.95, value=0.6, step=0.05, label="Transformation strength")
+                guidance = gr.Slider(3, 15, value=7.5, step=0.5, label="Guidance scale")
+                steps = gr.Slider(10, 50, value=25, step=1, label="Steps")
+                seed = gr.Number(value=0, precision=0, label="Seed (0 or -1 = random)")
+            use_crop = gr.Checkbox(True, label="Crop to largest face before stylizing")
+            btn_c = gr.Button("Generate Cartoon", variant="primary")
+            out_img = gr.Image(label="Cartoon result")
+            # Input order must match cartoonize's positional parameters.
+            btn_c.click(fn=cartoonize,
+                        inputs=[src, prompt, strength, guidance, steps, seed, use_crop],
+                        outputs=out_img)
+# Start the Gradio app only when this file is run as a script, not on import.
+if __name__ == "__main__":
+    demo.launch()