aidenpan committed on
Commit 9a514db · 1 Parent(s): 4557021

rename repo
Files changed (7)
  1. .gitattributes +1 -0
  2. .gitignore +7 -0
  3. README.md +6 -6
  4. app.py +151 -0
  5. network/line_extractor.py +107 -0
  6. requirements.txt +8 -0
  7. weights/.gitkeep +0 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+example.png filter=lfs diff=lfs merge=lfs -text
.gitignore ADDED
@@ -0,0 +1,7 @@
+dev
+__pycache__
+.gradio
+
+*.pth
+*.png
+*.jpg
README.md CHANGED
@@ -1,14 +1,14 @@
 ---
-title: AniLines Anime Lineart Extractor
-emoji: 👁
-colorFrom: gray
-colorTo: gray
+title: Anilines
+emoji:
+colorFrom: blue
+colorTo: purple
 sdk: gradio
-sdk_version: 5.18.0
+sdk_version: 5.16.1
 app_file: app.py
 pinned: false
 license: mit
-short_description: Extracting lineart, sketch from anime images and videos
+short_description: Anime Line Extractor
 ---
 
 Check out the configuration reference at https://huggingface.co/docs/hub/spaces-config-reference
app.py ADDED
@@ -0,0 +1,151 @@
+import spaces
+
+import os
+import cv2
+import argparse
+import numpy as np
+import gradio as gr
+import numpy as np
+from tqdm import tqdm
+from PIL import Image, ImageEnhance
+
+import torch
+from torch.amp import autocast
+import torch.nn.functional as F
+
+from network.line_extractor import LineExtractor
+
+def resize(image, max_size=3840):
+    h, w = image.shape[:2]
+    if h > w:
+        h, w = (max_size, int(w * max_size / h))
+    else:
+        h, w = (int(h * max_size / w), max_size)
+    return cv2.resize(image, (w, h))
+
+def increase_sharpness(img, factor=6.0):
+    image = Image.fromarray(img)
+    enhancer = ImageEnhance.Sharpness(image)
+    return np.array(enhancer.enhance(factor))
+
+def load_model(mode):
+    if mode == 'basic':
+        model = LineExtractor(3, 1, True)
+    elif mode == 'detail':
+        model = LineExtractor(2, 1, True)
+
+    path_model = os.path.join('weights', f'{mode}.pth')
+    model.load_state_dict(torch.load(path_model, weights_only=True))
+
+    for param in model.parameters():
+        param.requires_grad = False
+    model.eval()
+
+    return model
+
+def process_image(image, mode, binarize, threshold, fp16=True):
+    if image is None:
+        return None
+
+    binarize_value = threshold if binarize else -1
+    args = argparse.Namespace(mode=mode, binarize=binarize_value, fp16=fp16, device="cuda:0")
+
+    image = cv2.cvtColor(np.array(image), cv2.COLOR_RGB2BGR)
+    if image.shape[0] > 1920 or image.shape[1] > 1920:
+        image = resize(image)
+
+    return inference(image, args)
+
+def process_video(path_in, path_out, fourcc='mp4v', **kwargs):
+    video = cv2.VideoCapture(path_in)
+    fps = video.get(cv2.CAP_PROP_FPS)
+    width = int(video.get(cv2.CAP_PROP_FRAME_WIDTH))
+    height = int(video.get(cv2.CAP_PROP_FRAME_HEIGHT))
+    total_frames = int(video.get(cv2.CAP_PROP_FRAME_COUNT))
+
+    fourcc = cv2.VideoWriter_fourcc(*fourcc)
+    video_out = cv2.VideoWriter(path_out, fourcc, fps, (width, height))
+
+    for _ in tqdm(range(total_frames), desc='Processing Video'):
+        ret, frame = video.read()
+        if not ret:
+            break
+
+        img = inference(frame, **kwargs)
+        img = cv2.cvtColor(img, cv2.COLOR_GRAY2BGR)
+        video_out.write(img)
+
+    video.release()
+    video_out.release()
+
+@spaces.GPU(duration=60)
+def inference(img: np.ndarray, args):
+    if args.mode == 'basic':
+        img = cv2.cvtColor(img, cv2.COLOR_BGR2RGB)
+        img = increase_sharpness(img)
+        img = torch.from_numpy(img).permute(2, 0, 1).unsqueeze(0).float().to(args.device) / 255.
+        x_in = img
+    else:
+        img = cv2.cvtColor(img, cv2.COLOR_BGR2GRAY)
+
+        sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)
+        sobely = cv2.Sobel(img, cv2.CV_64F, 0, 1, ksize=3)
+        sobel = cv2.magnitude(sobelx, sobely)
+        sobel = 255 - cv2.normalize(sobel, None, 0, 255, cv2.NORM_MINMAX, cv2.CV_8UC1)
+
+        img = torch.from_numpy(img).unsqueeze(0).unsqueeze(0).float().to(args.device) / 255.
+        sobel = torch.from_numpy(sobel).unsqueeze(0).unsqueeze(0).float().to(args.device) / 255.
+
+        x_in = torch.cat([img, sobel], dim=1)
+
+    B, C, H, W = x_in.shape
+    pad_h = 8 - (H % 8)
+    pad_w = 8 - (W % 8)
+    x_in = F.pad(x_in, (0, pad_w, 0, pad_h), mode='reflect')
+
+    with torch.no_grad(), autocast(device_type='cuda', enabled=args.fp16):
+        if args.mode == 'basic':
+            pred = model_basic(x_in)
+        elif args.mode == 'detail':
+            pred = model_detail(x_in)
+    pred = pred[:, :, :H, :W]
+    if args.binarize != -1:
+        pred = (pred > args.binarize).float()
+
+    return np.clip((pred[0, 0].cpu().numpy() * 255) + 0.5, 0, 255).astype(np.uint8)
+
+
+
+model_basic = load_model("basic").to("cuda:0")
+model_detail = load_model("detail").to("cuda:0")
+
+with gr.Blocks() as demo:
+    gr.Markdown("# AniLines - Anime Line Extractor Demo")
+    gr.Markdown("For video and batch processing, please refer to the [project page](https://github.com/zhenglinpan/AniLines-Anime-Line-Extractor)")
+
+    with gr.Tabs():
+        with gr.Tab("Image Processing"):
+            gr.Markdown("## Process Images")
+            gr.Markdown("*Online demo resizes image to a max of 4K if larger.")
+            with gr.Row():
+                image_input = gr.Image(type="pil", label="Upload Image")
+                image_output = gr.Image(label="Processed Output")
+
+            mode_dropdown = gr.Radio(["basic", "detail"], value="detail", label="Processing Mode")
+            binarize_checkbox = gr.Checkbox(label="Binarize", value=False)
+            binarize_slider = gr.Slider(minimum=0, maximum=1, step=0.05, value=0.75, label="Binarization Threshold (-1 for auto)", visible=False)
+            binarize_checkbox.change(lambda binarize: gr.update(visible=binarize), inputs=binarize_checkbox, outputs=binarize_slider)
+
+            process_button = gr.Button("Process")
+
+            gr.Examples(
+                examples=["example.png", "example2.jpg"],
+                inputs=image_input,
+                outputs=image_input
+            )
+
+            process_button.click(process_image,
+                                 inputs=[image_input, mode_dropdown, binarize_checkbox, binarize_slider],
+                                 outputs=image_output)
+
+demo.queue().launch()
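
Note: `inference` reflect-pads the input so height and width are multiples of 8 before the UNet forward pass, then crops the prediction back to the original size and optionally thresholds it. For reference, a minimal standalone sketch of the same 'detail'-mode path, without the Gradio UI, the `spaces` decorator, or binarization (assumes the repository layout above, a local `weights/detail.pth`, and a CUDA device; `input.png` and `lines.png` are placeholder paths):

```python
# Standalone sketch of the 'detail' path: grayscale + inverted Sobel magnitude as a
# 2-channel input, reflect-padded to multiples of 8, cropped back after inference.
import cv2
import numpy as np
import torch
import torch.nn.functional as F
from torch.amp import autocast

from network.line_extractor import LineExtractor

device = 'cuda:0'  # assumption: a CUDA device is available
model = LineExtractor(2, 1, True)
model.load_state_dict(torch.load('weights/detail.pth', weights_only=True))
model.eval().to(device)

img = cv2.imread('input.png', cv2.IMREAD_GRAYSCALE)          # placeholder input path
sobelx = cv2.Sobel(img, cv2.CV_64F, 1, 0, ksize=3)
sobely = cv2.Sobel(img, cv2.CV_64F, 0, 1, ksize=3)
sobel = 255 - cv2.normalize(cv2.magnitude(sobelx, sobely), None, 0, 255,
                            cv2.NORM_MINMAX, cv2.CV_8UC1)

x = torch.from_numpy(img).float()[None, None].to(device) / 255.
s = torch.from_numpy(sobel).float()[None, None].to(device) / 255.
x_in = torch.cat([x, s], dim=1)

_, _, H, W = x_in.shape
x_in = F.pad(x_in, (0, 8 - W % 8, 0, 8 - H % 8), mode='reflect')  # pad to multiples of 8

with torch.no_grad(), autocast(device_type='cuda'):
    pred = model(x_in)[:, :, :H, :W]                              # crop the padding back off

cv2.imwrite('lines.png',
            (pred[0, 0].float().cpu().numpy() * 255 + 0.5).clip(0, 255).astype(np.uint8))
```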
network/line_extractor.py ADDED
@@ -0,0 +1,107 @@
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+
+class LineExtractor(nn.Module):
+    def __init__(self, chan_in, chan_out, bilinear=False):
+        super().__init__()
+        self.bilinear = bilinear
+
+        self.inc = (DoubleConv(chan_in, 64))
+        self.down1 = (Down(64, 128))
+        self.down2 = (Down(128, 256))
+        self.down3 = (Down(256, 512))
+        factor = 2 if bilinear else 1
+        self.down4 = (Down(512, 1024 // factor))
+        self.up1 = (Up(1024, 512 // factor, bilinear))
+        self.up2 = (Up(512, 256 // factor, bilinear))
+        self.up3 = (Up(256, 128 // factor, bilinear))
+        self.up4 = (Up(128, 64, bilinear))
+        self.outc = (OutConv(64, chan_out))
+
+    def forward(self, x):
+        x1 = self.inc(x)
+        x2 = self.down1(x1)
+        x3 = self.down2(x2)
+        x4 = self.down3(x3)
+        x5 = self.down4(x4)
+        x = self.up1(x5, x4)
+        x = self.up2(x, x3)
+        x = self.up3(x, x2)
+        x = self.up4(x, x1)
+        logits = self.outc(x)
+        return logits
+
+    def use_checkpointing(self):
+        self.inc = torch.utils.checkpoint(self.inc)
+        self.down1 = torch.utils.checkpoint(self.down1)
+        self.down2 = torch.utils.checkpoint(self.down2)
+        self.down3 = torch.utils.checkpoint(self.down3)
+        self.down4 = torch.utils.checkpoint(self.down4)
+        self.up1 = torch.utils.checkpoint(self.up1)
+        self.up2 = torch.utils.checkpoint(self.up2)
+        self.up3 = torch.utils.checkpoint(self.up3)
+        self.up4 = torch.utils.checkpoint(self.up4)
+        self.outc = torch.utils.checkpoint(self.outc)
+
+
+
+class DoubleConv(nn.Module):
+    def __init__(self, in_channels, out_channels, mid_channels=None):
+        super().__init__()
+        if not mid_channels:
+            mid_channels = out_channels
+        self.double_conv = nn.Sequential(
+            nn.Conv2d(in_channels, mid_channels, kernel_size=3, padding=1, bias=False),
+            nn.BatchNorm2d(mid_channels),
+            nn.ReLU(inplace=True),
+            nn.Conv2d(mid_channels, out_channels, kernel_size=3, padding=1, bias=False),
+            nn.BatchNorm2d(out_channels),
+            nn.ReLU(inplace=True)
+        )
+
+    def forward(self, x):
+        return self.double_conv(x)
+
+
+class Down(nn.Module):
+    def __init__(self, in_channels, out_channels):
+        super().__init__()
+        self.maxpool_conv = nn.Sequential(
+            nn.MaxPool2d(2),
+            DoubleConv(in_channels, out_channels)
+        )
+
+    def forward(self, x):
+        return self.maxpool_conv(x)
+
+
+class Up(nn.Module):
+    def __init__(self, in_channels, out_channels, bilinear=True):
+        super().__init__()
+        if bilinear:
+            self.up = nn.Upsample(scale_factor=2, mode='bilinear', align_corners=True)
+            self.conv = DoubleConv(in_channels, out_channels, in_channels // 2)
+        else:
+            self.up = nn.ConvTranspose2d(in_channels, in_channels // 2, kernel_size=2, stride=2)
+            self.conv = DoubleConv(in_channels, out_channels)
+
+    def forward(self, x1, x2):
+        x1 = self.up(x1)
+        diffY = x2.size()[2] - x1.size()[2]
+        diffX = x2.size()[3] - x1.size()[3]
+
+        x1 = F.pad(x1, [diffX // 2, diffX - diffX // 2,
+                        diffY // 2, diffY - diffY // 2])
+        x = torch.cat([x2, x1], dim=1)
+        return self.conv(x)
+
+
+class OutConv(nn.Module):
+    def __init__(self, in_channels, out_channels):
+        super(OutConv, self).__init__()
+        self.conv = nn.Conv2d(in_channels, out_channels, kernel_size=1)
+
+    def forward(self, x):
+        return self.conv(x)
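
Note: `LineExtractor` is a standard UNet: four 2× max-pool downsampling stages with skip connections, bilinear upsampling in the decoder when `bilinear=True`, and a 1×1 output convolution. `app.py` builds it with 3 input channels for 'basic' mode (RGB) and 2 for 'detail' mode (grayscale plus inverted Sobel magnitude). A quick shape check with randomly initialized weights, as a minimal sketch (CPU only, no checkpoint required):

```python
import torch
from network.line_extractor import LineExtractor

# 'basic' mode uses a 3-channel input, 'detail' mode a 2-channel input; both emit 1 channel.
for chan_in in (3, 2):
    net = LineExtractor(chan_in, 1, bilinear=True).eval()
    x = torch.rand(1, chan_in, 256, 384)      # dummy image, spatial dims divisible by 8
    with torch.no_grad():
        y = net(x)
    print(chan_in, tuple(y.shape))            # -> (1, 1, 256, 384) in both cases
```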
requirements.txt ADDED
@@ -0,0 +1,8 @@
+tqdm
+torch
+torchvision
+opencv-python
+pillow
+numpy
+gradio
+spaces
weights/.gitkeep ADDED
File without changes