tdurbor's picture
Consolidate image preparation pipeline
fe62bf5
raw
history blame
2.35 kB
import os
import requests
import time
# Load environment variables from .env file
from dotenv import load_dotenv
load_dotenv()
API_KEY = os.getenv('REMOVEBG_API_KEY')
def process_image(input_image_path, output_image_path):
url = "https://api.remove.bg/v1.0/removebg"
try:
with open(input_image_path, 'rb') as image_file:
files = { "image_file": image_file }
payload = { "size": "auto" }
headers = {
"Accept": "image/png, application/json",
"x-api-key": API_KEY
}
response = requests.post(url, data=payload, files=files, headers=headers)
response.raise_for_status()
with open(output_image_path, 'wb') as f:
f.write(response.content)
print(f"Image downloaded and saved to {output_image_path}")
except requests.exceptions.HTTPError as e:
if response.status_code == 429:
print(f"Rate limit exceeded. Retrying {input_image_path} after delay...")
time.sleep(60) # Wait for 60 seconds before retrying
return process_image(input_image_path, output_image_path)
else:
print(f"Error: {str(e)} ({input_image_path})")
return str(e)
def iterate_over_directory(directory_path, result_directory):
for root, _, files in os.walk(directory_path):
for file in files:
if file.lower().endswith(('.png', '.jpg', '.jpeg', '.webp', '.heic')):
file_path = os.path.join(root, file)
result_file_name = os.path.splitext(os.path.basename(file_path))[0] + '.png'
result_file_directory = os.path.join(result_directory)
if not os.path.exists(result_file_directory):
os.makedirs(result_file_directory)
result_path = os.path.join(result_file_directory, result_file_name)
if not os.path.exists(result_path): # don't re-process images
process_image(file_path, result_path)
if __name__ == "__main__":
INPUT_DIRECTORY = "../original-images/"
OUTPUT_DIRECTORY = "../result-remove-bg/"
if not os.path.exists(OUTPUT_DIRECTORY):
os.makedirs(OUTPUT_DIRECTORY)
iterate_over_directory(directory_path=INPUT_DIRECTORY, result_directory=OUTPUT_DIRECTORY)