image-enhancer-multiple-image

Running

App Files Community

abiabidali committed on Aug 15

Commit

acf7f61

•

1 Parent(s): 9c737cd

Update app.py

Browse files

Fast Processing

Files changed (1) hide show

app.py +68 -64

app.py CHANGED Viewed

@@ -1,93 +1,96 @@
 import torch
 from PIL import Image
 from RealESRGAN import RealESRGAN
 import gradio as gr
 import numpy as np
 import tempfile
-import time
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')  # CUDA when torch reports it available, otherwise CPU
-def load_model(scale):  # build a RealESRGAN model for `scale` on `device`, load its weights, and return it
-    model = RealESRGAN(device, scale=scale)
-    weights_path = f'weights/RealESRGAN_x{scale}.pth'  # one weights file per scale under weights/
-    try:
-        model.load_weights(weights_path, download=True)  # first attempt, with download=True
-        print(f"Weights for scale {scale} loaded successfully.")
-    except Exception as e:  # any failure is printed, then the load is retried below
-        print(f"Error loading weights for scale {scale}: {e}")
-        model.load_weights(weights_path, download=False)  # retry with download=False; an error here propagates to the caller
-    return model
-model2 = load_model(2)  # module-level models, one per scale; used by enhance_image for '2x'
-model4 = load_model(4)  # used by enhance_image for '4x'
-model8 = load_model(8)  # used by enhance_image for every other scale value
 def enhance_image(image, scale):  # upscale a PIL image with the model chosen by `scale`; returns the input unchanged on error
-    try:
-        print(f"Enhancing image with scale {scale}...")
-        start_time = time.time()  # used only for the elapsed-time message below
-        image_np = np.array(image.convert('RGB'))  # the models are fed an RGB numpy array
-        print(f"Image converted to numpy array: shape {image_np.shape}, dtype {image_np.dtype}")
-        if scale == '2x':
-            result = model2.predict(image_np)
-        elif scale == '4x':
-            result = model4.predict(image_np)
-        else:  # any value other than '2x' or '4x' uses the 8x model
-            result = model8.predict(image_np)
-        enhanced_image = Image.fromarray(np.uint8(result))  # cast the prediction to uint8 and wrap it as a PIL image
-        print(f"Image enhanced in {time.time() - start_time:.2f} seconds")
-        return enhanced_image
-    except Exception as e:  # best effort: print the error and fall back to the original image
-        print(f"Error enhancing image: {e}")
-        return image
-def muda_dpi(input_image, dpi):  # write the array to a temporary JPEG with the given DPI and return the reopened image
-    dpi_tuple = (dpi, dpi)  # same value for both axes
-    image = Image.fromarray(input_image.astype('uint8'), 'RGB')  # input is a numpy array, interpreted as RGB
-    temp_file = tempfile.NamedTemporaryFile(delete=False, suffix='.jpg')  # delete=False: the file must remain so it can be reopened by name
-    image.save(temp_file, format='JPEG', dpi=dpi_tuple)
-    temp_file.close()
-    return Image.open(temp_file.name)  # the temporary file is not removed by this function
-def resize_image(input_image, width, height):  # resize the array to (width, height) via a temporary JPEG and return the reopened image
-    image = Image.fromarray(input_image.astype('uint8'), 'RGB')  # input is a numpy array, interpreted as RGB
-    resized_image = image.resize((width, height))
-    temp_file = tempfile.NamedTemporaryFile(delete=False, suffix='.jpg')  # delete=False: the file must remain so it can be reopened by name
-    resized_image.save(temp_file, format='JPEG')
-    temp_file.close()
-    return Image.open(temp_file.name)  # the temporary file is not removed by this function
 def process_images(image_files, enhance, scale, adjust_dpi, dpi, resize, width, height):  # run the selected steps on every upload; returns (images, saved JPEG paths)
     processed_images = []
     file_paths = []
-    for image_file in image_files:
-        input_image = np.array(Image.open(image_file).convert('RGB'))  # decode the upload into an RGB array
-        original_image = Image.fromarray(input_image.astype('uint8'), 'RGB')
         if enhance:
-            original_image = enhance_image(original_image, scale)
         if adjust_dpi:
-            original_image = muda_dpi(np.array(original_image), dpi)  # helper takes a numpy array, hence the conversion
         if resize:
-            original_image = resize_image(np.array(original_image), width, height)  # helper takes a numpy array, hence the conversion
         temp_file = tempfile.NamedTemporaryFile(delete=False, suffix='.jpg')  # delete=False so the returned path stays usable; the handle is not closed here
-        original_image.save(temp_file.name,format='JPEG')  # saved without a dpi argument
-        processed_images.append(original_image)
-        file_paths.append(temp_file.name)
-    return processed_images, file_paths
 iface = gr.Interface(
     fn=process_images,
     inputs=[
-        gr.Files(label="Upload Image Files"),  # Use gr.Files for multiple file uploads
         gr.Checkbox(label="Enhance Images (ESRGAN)"),
         gr.Radio(['2x', '4x', '8x'], type="value", value='2x', label='Resolution model'),
         gr.Checkbox(label="Adjust DPI"),
@@ -97,11 +100,12 @@ iface = gr.Interface(
         gr.Number(label="Height", value=512)
     ],
     outputs=[
-        gr.Gallery(label="Final Images"),  # Use gr.Gallery to display multiple images
-        gr.Files(label="Download Final Images")
     ],
-    title="Multi-Image Enhancer",
-    description="Upload multiple images (.jpg, .png), enhance using AI, adjust DPI, resize, and download the final results."
 )
 iface.launch(debug=True)

 import torch
+from transformers import BlipProcessor, BlipForConditionalGeneration
 from PIL import Image
 from RealESRGAN import RealESRGAN
 import gradio as gr
 import numpy as np
 import tempfile
+import os
+# Run on CUDA when torch reports it as available; otherwise fall back to CPU
 device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')
+# BLIP captioning: the processor and model are created once at import time and reused by generate_caption()
+processor = BlipProcessor.from_pretrained("Salesforce/blip-image-captioning-base")
+model = BlipForConditionalGeneration.from_pretrained("Salesforce/blip-image-captioning-base").to(device)  # moved to the same device as the ESRGAN models
+# One Real-ESRGAN network per upscale factor (2x, 4x, 8x); enhance_image() picks between them
+model2 = RealESRGAN(device, scale=2)
+model4 = RealESRGAN(device, scale=4)
+model8 = RealESRGAN(device, scale=8)
+# Load every model's weights at import time so no request has to load them; download=True presumably fetches a missing weights file (confirm against the RealESRGAN package)
+model2.load_weights('weights/RealESRGAN_x2.pth', download=True)
+model4.load_weights('weights/RealESRGAN_x4.pth', download=True)
+model8.load_weights('weights/RealESRGAN_x8.pth', download=True)
+# Function to enhance image resolution
 def enhance_image(image, scale):
+    image_np = np.array(image.convert('RGB'))
+    if scale == '2x':
+        result = model2.predict(image_np)
+    elif scale == '4x':
+        result = model4.predict(image_np)
+    else:
+        result = model8.predict(image_np)
+    return Image.fromarray(np.uint8(result))
+# Function to generate caption for the image using BLIP
+def generate_caption(image):
+    inputs = processor(images=image, return_tensors="pt").to(device)
+    output_ids = model.generate(**inputs)
+    return processor.decode(output_ids[0], skip_special_tokens=True)
+# Function to adjust DPI of the image
+def muda_dpi(image, dpi):
+    image.save(image.filename, format='JPEG', dpi=(dpi, dpi))
+    return image
+# Function to resize the image
+def resize_image(image, width, height):
+    return image.resize((width, height))
+# Main function to process images
 def process_images(image_files, enhance, scale, adjust_dpi, dpi, resize, width, height):
     processed_images = []
     file_paths = []
+    captions = []
+    for i, image_file in enumerate(image_files):
+        image = Image.open(image_file).convert('RGB')
+        # Enhance resolution if required
         if enhance:
+            image = enhance_image(image, scale)
+        # Adjust DPI if required
         if adjust_dpi:
+            image = muda_dpi(image, dpi)
+        # Resize if required
         if resize:
+            image = resize_image(image, width, height)
+        # Generate caption
+        caption = generate_caption(image)
+        captions.append(caption)
+        # Save the processed image
+        custom_filename = f"Image_Captioning_with_BLIP_{i+1}.jpg"
         temp_file = tempfile.NamedTemporaryFile(delete=False, suffix='.jpg')
+        image.save(temp_file.name, format='JPEG')
+        final_path = temp_file.name.replace(temp_file.name.split('/')[-1], custom_filename)
+        os.rename(temp_file.name, final_path)
+        file_paths.append(final_path)
+        processed_images.append(image)
+    return processed_images, file_paths, captions
+# Setup Gradio interface
 iface = gr.Interface(
     fn=process_images,
     inputs=[
+        gr.Files(label="Upload Image Files"),
         gr.Checkbox(label="Enhance Images (ESRGAN)"),
         gr.Radio(['2x', '4x', '8x'], type="value", value='2x', label='Resolution model'),
         gr.Checkbox(label="Adjust DPI"),
         gr.Number(label="Height", value=512)
     ],
     outputs=[
+        gr.Gallery(label="Final Images"),
+        gr.Files(label="Download Final Images"),
+        gr.Textbox(label="Image Captions")
     ],
+    title="High-Quality Image Enhancer with Fast Processing",
+    description="Upload multiple images (.jpg, .png), enhance using AI, adjust DPI, resize, generate captions, and download the final results."
 )
 iface.launch(debug=True)