Spaces:
Running
Running
im
commited on
Commit
·
e9eeafb
1
Parent(s):
82a72c7
divid
Browse files- .gitignore +1 -0
- app.py +5 -79
- download_images.py +15 -0
- flagged/log.csv +1 -0
- process.py +77 -0
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
.env
|
app.py
CHANGED
@@ -82,94 +82,20 @@
|
|
82 |
|
83 |
|
84 |
|
85 |
-
import
|
86 |
-
import requests
|
87 |
-
from PIL import Image
|
88 |
-
import numpy as np
|
89 |
import gradio as gr
|
90 |
from encoder import FashionCLIPEncoder
|
91 |
-
|
92 |
-
# Constants
|
93 |
-
REQUESTS_HEADERS = {
|
94 |
-
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
|
95 |
-
}
|
96 |
-
BATCH_SIZE = 30 # Define batch size for processing
|
97 |
|
98 |
# Initialize encoder
|
99 |
encoder = FashionCLIPEncoder()
|
100 |
|
101 |
-
#
|
102 |
-
|
103 |
-
try:
|
104 |
-
response = requests.get(url, stream=True, headers=REQUESTS_HEADERS, timeout=timeout)
|
105 |
-
if response.status_code == 200:
|
106 |
-
return Image.open(response.raw).convert("RGB") # Ensure consistent format
|
107 |
-
return None
|
108 |
-
except Exception as e:
|
109 |
-
print(f"Error downloading image: {e}")
|
110 |
-
return None
|
111 |
-
|
112 |
-
# Embedding function for a batch of images
|
113 |
-
def batch_process_images(image_urls: str):
|
114 |
-
# Split the input string by commas and strip whitespace
|
115 |
-
urls = [url.strip() for url in image_urls.split(",") if url.strip()]
|
116 |
-
|
117 |
-
if not urls:
|
118 |
-
return {"error": "No valid image URLs provided."}
|
119 |
-
|
120 |
-
results = []
|
121 |
-
batch_urls, batch_images = [], []
|
122 |
-
|
123 |
-
for url in urls:
|
124 |
-
try:
|
125 |
-
# Download image
|
126 |
-
image = download_image_as_pil(url)
|
127 |
-
if not image:
|
128 |
-
results.append({"image_url": url, "error": "Failed to download image"})
|
129 |
-
continue
|
130 |
-
|
131 |
-
batch_urls.append(url)
|
132 |
-
batch_images.append(image)
|
133 |
-
|
134 |
-
# Process batch when reaching batch size
|
135 |
-
if len(batch_images) == BATCH_SIZE:
|
136 |
-
process_batch(batch_urls, batch_images, results)
|
137 |
-
batch_urls, batch_images = [], []
|
138 |
-
|
139 |
-
except Exception as e:
|
140 |
-
results.append({"image_url": url, "error": str(e)})
|
141 |
-
|
142 |
-
# Process remaining images in the last batch
|
143 |
-
if batch_images:
|
144 |
-
process_batch(batch_urls, batch_images, results)
|
145 |
-
|
146 |
-
return results
|
147 |
-
|
148 |
-
|
149 |
-
# Helper function to process a batch
|
150 |
-
def process_batch(batch_urls, batch_images, results):
|
151 |
-
try:
|
152 |
-
# Generate embeddings
|
153 |
-
embeddings = encoder.encode_images(batch_images)
|
154 |
-
|
155 |
-
for url, embedding in zip(batch_urls, embeddings):
|
156 |
-
# Normalize embedding
|
157 |
-
embedding_normalized = embedding / np.linalg.norm(embedding)
|
158 |
-
|
159 |
-
# Append results
|
160 |
-
results.append({
|
161 |
-
"image_url": url,
|
162 |
-
"embedding_preview": embedding_normalized[:5].tolist(), # First 5 values for preview
|
163 |
-
"success": True
|
164 |
-
})
|
165 |
-
except Exception as e:
|
166 |
-
for url in batch_urls:
|
167 |
-
results.append({"image_url": url, "error": str(e)})
|
168 |
-
|
169 |
|
170 |
# Gradio Interface
|
171 |
iface = gr.Interface(
|
172 |
-
fn=batch_process_images,
|
173 |
inputs=gr.Textbox(
|
174 |
lines=5,
|
175 |
placeholder="Enter image URLs separated by commas",
|
|
|
82 |
|
83 |
|
84 |
|
85 |
+
import os
|
|
|
|
|
|
|
86 |
import gradio as gr
|
87 |
from encoder import FashionCLIPEncoder
|
88 |
+
from process import batch_process_images
|
|
|
|
|
|
|
|
|
|
|
89 |
|
90 |
# Initialize encoder
|
91 |
encoder = FashionCLIPEncoder()
|
92 |
|
93 |
+
# Constants
|
94 |
+
BATCH_SIZE = 30 # Define batch size for processing
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
95 |
|
96 |
# Gradio Interface
|
97 |
iface = gr.Interface(
|
98 |
+
fn=lambda image_urls: batch_process_images(image_urls, encoder, BATCH_SIZE),
|
99 |
inputs=gr.Textbox(
|
100 |
lines=5,
|
101 |
placeholder="Enter image URLs separated by commas",
|
download_images.py
ADDED
@@ -0,0 +1,15 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import requests
|
2 |
+
from PIL import Image
|
3 |
+
|
4 |
+
REQUESTS_HEADERS = {
|
5 |
+
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/91.0.4472.124 Safari/537.36'
|
6 |
+
}
|
7 |
+
def download_image_as_pil(url: str, timeout: int = 10) -> Image.Image:
|
8 |
+
try:
|
9 |
+
response = requests.get(url, stream=True, headers=REQUESTS_HEADERS, timeout=timeout)
|
10 |
+
if response.status_code == 200:
|
11 |
+
return Image.open(response.raw).convert("RGB") # Ensure consistent format
|
12 |
+
return None
|
13 |
+
except Exception as e:
|
14 |
+
print(f"Error downloading image: {e}")
|
15 |
+
return None
|
flagged/log.csv
CHANGED
@@ -1,2 +1,3 @@
|
|
1 |
Batch Image URLs,Embedding Results,flag,username,timestamp
|
2 |
"https://cdn.shopify.com/s/files/1/0522/2239/4534/files/CT21355-22_1024x1024.webp, https://cdn.shopify.com/s/files/1/0522/2239/4534/files/00907857-C6B0-4D2A-8AEA-688BDE1E67D7_1024x1024.jpg","[{""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": "":"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""d"", ""error"": ""Failed to download image""}, {""image_url"": ""n"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""y"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""m"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""C"", ""error"": ""Failed to download image""}, {""image_url"": ""T"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""_"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""x"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""w"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""b"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": "","", ""error"": ""Failed to download image""}, {""image_url"": "" "", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": "":"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""d"", ""error"": ""Failed to download image""}, {""image_url"": ""n"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""y"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""m"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""C"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""B"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""B"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""_"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""x"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""j"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""g"", ""error"": ""Failed to download image""}]",,,2025-01-18 01:08:09.984056
|
|
|
|
1 |
Batch Image URLs,Embedding Results,flag,username,timestamp
|
2 |
"https://cdn.shopify.com/s/files/1/0522/2239/4534/files/CT21355-22_1024x1024.webp, https://cdn.shopify.com/s/files/1/0522/2239/4534/files/00907857-C6B0-4D2A-8AEA-688BDE1E67D7_1024x1024.jpg","[{""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": "":"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""d"", ""error"": ""Failed to download image""}, {""image_url"": ""n"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""y"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""m"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""C"", ""error"": ""Failed to download image""}, {""image_url"": ""T"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""_"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""x"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""w"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""b"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": "","", ""error"": ""Failed to download image""}, {""image_url"": "" "", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""t"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": "":"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""d"", ""error"": ""Failed to download image""}, {""image_url"": ""n"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""h"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""y"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""c"", ""error"": ""Failed to download image""}, {""image_url"": ""o"", ""error"": ""Failed to download image""}, {""image_url"": ""m"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""3"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""f"", ""error"": ""Failed to download image""}, {""image_url"": ""i"", ""error"": ""Failed to download image""}, {""image_url"": ""l"", ""error"": ""Failed to download image""}, {""image_url"": ""e"", ""error"": ""Failed to download image""}, {""image_url"": ""s"", ""error"": ""Failed to download image""}, {""image_url"": ""/"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""9"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""5"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""C"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""B"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""A"", ""error"": ""Failed to download image""}, {""image_url"": ""-"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""8"", ""error"": ""Failed to download image""}, {""image_url"": ""B"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""E"", ""error"": ""Failed to download image""}, {""image_url"": ""6"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""D"", ""error"": ""Failed to download image""}, {""image_url"": ""7"", ""error"": ""Failed to download image""}, {""image_url"": ""_"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""x"", ""error"": ""Failed to download image""}, {""image_url"": ""1"", ""error"": ""Failed to download image""}, {""image_url"": ""0"", ""error"": ""Failed to download image""}, {""image_url"": ""2"", ""error"": ""Failed to download image""}, {""image_url"": ""4"", ""error"": ""Failed to download image""}, {""image_url"": ""."", ""error"": ""Failed to download image""}, {""image_url"": ""j"", ""error"": ""Failed to download image""}, {""image_url"": ""p"", ""error"": ""Failed to download image""}, {""image_url"": ""g"", ""error"": ""Failed to download image""}]",,,2025-01-18 01:08:09.984056
|
3 |
+
"https://cdn.shopify.com/s/files/1/0522/2239/4534/files/CT21355-22_1024x1024.webp, https://cdn.shopify.com/s/files/1/0522/2239/4534/files/00907857-C6B0-4D2A-8AEA-688BDE1E67D7_1024x1024.jpg","{""error"": ""No valid image URLs provided.""}",,,2025-01-18 14:24:29.459219
|
process.py
ADDED
@@ -0,0 +1,77 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
import numpy as np
|
2 |
+
from download_images import download_image_as_pil
|
3 |
+
|
4 |
+
def batch_process_images(image_urls: str, encoder, batch_size: int):
|
5 |
+
"""
|
6 |
+
Processes a batch of image URLs and generates embeddings for each image.
|
7 |
+
|
8 |
+
Args:
|
9 |
+
image_urls (str): Comma-separated string of image URLs.
|
10 |
+
encoder: The encoder object used to generate embeddings.
|
11 |
+
batch_size (int): The maximum number of images to process in one batch.
|
12 |
+
|
13 |
+
Returns:
|
14 |
+
list: A list of dictionaries containing embedding results or errors.
|
15 |
+
"""
|
16 |
+
# Split the input string by commas and strip whitespace
|
17 |
+
urls = [url.strip() for url in image_urls.split(",") if url.strip()]
|
18 |
+
|
19 |
+
if not urls:
|
20 |
+
return {"error": "No valid image URLs provided."}
|
21 |
+
|
22 |
+
results = []
|
23 |
+
batch_urls, batch_images = [], []
|
24 |
+
|
25 |
+
for url in urls:
|
26 |
+
try:
|
27 |
+
# Download image
|
28 |
+
image = download_image_as_pil(url)
|
29 |
+
if not image:
|
30 |
+
results.append({"image_url": url, "error": "Failed to download image"})
|
31 |
+
continue
|
32 |
+
|
33 |
+
batch_urls.append(url)
|
34 |
+
batch_images.append(image)
|
35 |
+
|
36 |
+
# Process batch when reaching batch size
|
37 |
+
if len(batch_images) == batch_size:
|
38 |
+
process_batch(batch_urls, batch_images, results, encoder)
|
39 |
+
batch_urls, batch_images = [], []
|
40 |
+
|
41 |
+
except Exception as e:
|
42 |
+
results.append({"image_url": url, "error": str(e)})
|
43 |
+
|
44 |
+
# Process remaining images in the last batch
|
45 |
+
if batch_images:
|
46 |
+
process_batch(batch_urls, batch_images, results, encoder)
|
47 |
+
|
48 |
+
return results
|
49 |
+
|
50 |
+
|
51 |
+
def process_batch(batch_urls, batch_images, results, encoder):
|
52 |
+
"""
|
53 |
+
Processes a batch of images and generates embeddings.
|
54 |
+
|
55 |
+
Args:
|
56 |
+
batch_urls (list): List of image URLs in the batch.
|
57 |
+
batch_images (list): List of PIL images in the batch.
|
58 |
+
results (list): List to store results for each image.
|
59 |
+
encoder: The encoder object used to generate embeddings.
|
60 |
+
"""
|
61 |
+
try:
|
62 |
+
# Generate embeddings
|
63 |
+
embeddings = encoder.encode_images(batch_images)
|
64 |
+
|
65 |
+
for url, embedding in zip(batch_urls, embeddings):
|
66 |
+
# Normalize embedding
|
67 |
+
embedding_normalized = embedding / np.linalg.norm(embedding)
|
68 |
+
|
69 |
+
# Append results
|
70 |
+
results.append({
|
71 |
+
"image_url": url,
|
72 |
+
"embedding_preview": embedding_normalized[:5].tolist(), # First 5 values for preview
|
73 |
+
"success": True
|
74 |
+
})
|
75 |
+
except Exception as e:
|
76 |
+
for url in batch_urls:
|
77 |
+
results.append({"image_url": url, "error": str(e)})
|