Spaces:

lakpriya
/

videogen_api

Sleeping

videogen_api / main.py

Lakpriya Seneviratna

chore: Add .gitignore and requirements.txt files

32007ab 5 months ago

15.6 kB

	import requests
	import praw
	import json
	import cv2
	import numpy as np
	import textwrap
	from gtts import gTTS
	from pydub import AudioSegment
	import subprocess
	import re
	import os
	import random
	import time
	import sys
	import uuid
	from googleapiclient.discovery import build
	from googleapiclient.errors import HttpError
	from googleapiclient.http import MediaFileUpload
	from oauth2client.client import flow_from_clientsecrets
	from oauth2client.file import Storage
	from oauth2client.tools import run_flow
	from google.auth.transport.requests import Request

	# Folder that receives the final (audio + video) output files.
	output_folder = 'output'

	# Constants
	SCOPES = ["https://www.googleapis.com/auth/youtube.upload"]
	CLIENT_SECRETS_FILE = "client_secrets.json"  # Update with your client_secrets.json file path
	YOUTUBE_UPLOAD_SCOPE = "https://www.googleapis.com/auth/youtube.upload"
	DRIVE_SCOPE = "https://www.googleapis.com/auth/drive"
	YOUTUBE_API_SERVICE_NAME = "youtube"
	YOUTUBE_API_VERSION = "v3"
	# Upper bound on upload retries and the HTTP statuses considered transient.
	MAX_RETRIES = 10
	RETRIABLE_STATUS_CODES = [500, 502, 503, 504]
	# NOTE(review): this key is committed to the repository and should be
	# rotated. The ELEVENLABS_KEY environment variable takes precedence; the
	# literal is kept only as a backward-compatible fallback.
	ELEVENLABS_KEY = os.environ.get("ELEVENLABS_KEY", "55bfc10fb7eecae379f73e6740807101")

	# Create the output folder if needed; exist_ok avoids the check-then-create race.
	os.makedirs(output_folder, exist_ok=True)

	# Lower-case substrings that disqualify a post title.
	banned_words = [
	    "fuck", "pussy", "ass", "porn", "gay", "dick", "cock", "kill",
	    "fucking", "shit", "bitch", "bullshit", "asshole", "douchebag",
	    "motherfucker", "nigga", "cunt", "whore", "piss", "shoot", "bomb",
	    "palestine", "israel",
	]

	def contains_banned_word(text, banned_words):
	    """Return True when any banned word occurs in *text*, ignoring case.

	    Matching is by substring, not by whole word, so "ass" also matches
	    "class". Both the text and each banned word are lower-cased before
	    comparison, so entries written with capitals still match.

	    Args:
	        text: The string to inspect.
	        banned_words: Iterable of words to look for.

	    Returns:
	        True if at least one banned word is a substring of *text*.
	    """
	    # Lower-case the text once instead of once per banned word.
	    lowered = text.lower()
	    return any(word.lower() in lowered for word in banned_words)

	def fetch_reddit_data(subreddit_name):
	    """Save the title of a random, suitable post to ``top_post.json``.

	    Up to 10 random posts are drawn from the subreddit. A post is suitable
	    when its title is at least 50 characters long, contains no URL-like
	    ``word.word`` pattern and contains no banned word.

	    Args:
	        subreddit_name: Name of the subreddit to sample from.

	    Returns:
	        True when a title was written to ``top_post.json``, False when no
	        suitable post was found within the attempt limit.
	    """
	    # NOTE(review): these credentials are committed to the repository and
	    # should be rotated. Environment variables take precedence; the
	    # literals remain only as a backward-compatible fallback.
	    client_id = os.environ.get('REDDIT_CLIENT_ID', 'TIacEazZS9FHWzDZ3T-3cA')
	    client_secret = os.environ.get('REDDIT_CLIENT_SECRET', '6Urwdiqo_cC8Gt040K_rBhnR3r8CLg')
	    user_agent = 'script by u/lakpriya1'

	    reddit = praw.Reddit(client_id=client_id, client_secret=client_secret, user_agent=user_agent)
	    subreddit = reddit.subreddit(subreddit_name)

	    for _ in range(10):  # Limit the number of attempts to 10
	        post = subreddit.random()
	        if not post:
	            continue

	        title = post.title
	        if len(title) < 50:
	            continue
	        # Skip titles containing something that looks like a URL.
	        if re.search(r'\w+\.\w+', title):
	            continue
	        if contains_banned_word(title, banned_words):
	            continue

	        with open('top_post.json', 'w') as outfile:
	            json.dump({'title': title}, outfile, indent=4)

	        print("Top post data saved to top_post.json")
	        return True  # Stop after the first suitable post

	    print("No suitable post found without a URL-like string in the title.")
	    return False

	def read_json(filename):
	    """Parse the JSON file at *filename* and return the decoded object."""
	    print("Reading data from", filename)
	    with open(filename, 'r') as handle:
	        return json.load(handle)

	def wrap_text(text, wrap_width):
	    """Split *text* into a list of lines no wider than *wrap_width* characters."""
	    wrapper = textwrap.TextWrapper(width=wrap_width)
	    return wrapper.wrap(text)

	def resize_background_image(image_path, frame_width, frame_height):
	    """Load an image, scale it to cover the frame and centre-crop it.

	    The image is scaled by the larger of the two width/height ratios so
	    that it covers the whole frame, then cropped around its centre.

	    Args:
	        image_path: Path of the image file to load.
	        frame_width: Target width in pixels.
	        frame_height: Target height in pixels.

	    Returns:
	        The cropped image array of size frame_height x frame_width.

	    Raises:
	        FileNotFoundError: If the image cannot be read.
	    """
	    print("Resizing background image")
	    image = cv2.imread(image_path)
	    if image is None:
	        # cv2.imread signals failure by returning None rather than raising.
	        raise FileNotFoundError(f"Could not read background image: {image_path}")

	    h, w = image.shape[:2]
	    scale = max(frame_width / w, frame_height / h)
	    # Float truncation could leave a dimension one pixel short of the frame,
	    # which would make the crop offset negative; round and clamp instead.
	    new_w = max(frame_width, int(round(w * scale)))
	    new_h = max(frame_height, int(round(h * scale)))
	    resized_image = cv2.resize(image, (new_w, new_h))

	    # Crop the resized image around its centre to fill the frame.
	    startx = new_w // 2 - (frame_width // 2)
	    starty = new_h // 2 - (frame_height // 2)
	    return resized_image[starty:starty + frame_height, startx:startx + frame_width]

	def put_text_with_stroke(frame, text, position, font_scale, line_height, wrap_width, font_color=(255, 255, 255), stroke_color=(0, 0, 0)):
	    """Draw wrapped, outlined text centred on *frame* (modified in place).

	    The text is wrapped to *wrap_width* characters, the block of lines is
	    centred vertically and each line is centred horizontally.

	    Note: *position* is accepted but not used by this function.
	    """
	    typeface = cv2.FONT_HERSHEY_COMPLEX
	    wrapped = wrap_text(text, wrap_width)

	    frame_h, frame_w = frame.shape[0], frame.shape[1]
	    # Top edge of the text block so that the block is vertically centred.
	    block_top = (frame_h - line_height * len(wrapped)) // 2

	    for index, row in enumerate(wrapped, start=1):
	        row_width = cv2.getTextSize(row, typeface, font_scale, 1)[0][0]
	        origin = ((frame_w - row_width) // 2, block_top + index * line_height)

	        # Thick stroke first, then the thinner fill drawn on top of it.
	        for colour, thickness in ((stroke_color, 8), (font_color, 2)):
	            cv2.putText(frame, row, origin, typeface, font_scale, colour, thickness, cv2.LINE_AA)

	def create_video_from_title(title, background_image, output_filename, audio_duration):
	    """Render a silent 720x1280 video showing *title* over a background.

	    Every frame is identical (background, two logos and the title), so the
	    frame is composed once and written repeatedly.

	    Args:
	        title: Text drawn in the centre of the frame.
	        background_image: Path of the background image file.
	        output_filename: Path of the video file to write.
	        audio_duration: Length of the voice-over in seconds; determines
	            the number of frames written.
	    """
	    print("Creating video from title")
	    # Video properties
	    fps = 24
	    frame_width, frame_height = 720, 1280  # 9:16 aspect ratio
	    frame_count = int(np.floor(audio_duration * fps))

	    # Load every input before opening the writer, so that a missing asset
	    # does not leave an open writer behind.
	    top_logo = load_logo('logo.png', frame_width, frame_height, 'top')
	    bottom_logo = load_logo('sub.png', frame_width, frame_height, 'bottom')
	    background = resize_background_image(background_image, frame_width, frame_height)

	    # Compose the single static frame once instead of once per iteration.
	    frame = background.copy()
	    frame = overlay_logo(frame, top_logo)
	    frame = overlay_logo(frame, bottom_logo)
	    put_text_with_stroke(frame, title, (50, 500), 1, 50, 25, font_color=(255, 255, 255), stroke_color=(0, 0, 0))

	    fourcc = cv2.VideoWriter_fourcc(*'mp4v')
	    out = cv2.VideoWriter(output_filename, fourcc, fps, (frame_width, frame_height))
	    try:
	        for _ in range(frame_count):
	            out.write(frame)
	    finally:
	        # Release the writer even if writing a frame fails.
	        out.release()

	def fetch_random_nature_image(api_key):
	    """Download a random nature photo from Unsplash.

	    Args:
	        api_key: Unsplash client id sent as the ``client_id`` parameter.

	    Returns:
	        ``'nature_background.jpg'`` when the image was saved, otherwise
	        None (non-200 response or request failure).
	    """
	    print("Fetching random nature image from Unsplash")
	    try:
	        response = requests.get(
	            "https://api.unsplash.com/photos/random",
	            params={"query": "nature", "client_id": api_key},
	            timeout=30,  # do not hang forever on a stalled connection
	        )
	        if response.status_code != 200:
	            print("Failed to fetch image from Unsplash")
	            return None

	        img_url = response.json()['urls']['regular']
	        img_response = requests.get(img_url, timeout=30)
	        # Do not save an error page as if it were the image.
	        img_response.raise_for_status()
	    except requests.RequestException as exc:
	        print(f"Failed to fetch image from Unsplash: {exc}")
	        return None

	    with open('nature_background.jpg', 'wb') as handler:
	        handler.write(img_response.content)
	    return 'nature_background.jpg'

	def text_to_speech(text, output_file):
	    """Synthesize English speech for *text* with gTTS and save it to *output_file*.

	    Returns the path that was written (*output_file*).
	    """
	    print("Converting text to speech")
	    gTTS(text=text, lang='en').save(output_file)
	    return output_file

	def get_audio_duration(audio_file):
	    """Return the length of the MP3 at *audio_file*, in seconds."""
	    print("Getting audio duration")
	    clip = AudioSegment.from_mp3(audio_file)
	    millis = len(clip)
	    return millis / 1000.0  # Convert to seconds

	def combine_audio_video(video_file, audio_file, output_file, audio_delay_seconds=0.3):
	    """Mux a video and an audio track into one file using ffmpeg.

	    Args:
	        video_file: Path of the silent video; its stream is copied as is.
	        audio_file: Path of the audio track; it is encoded as AAC.
	        output_file: File name of the result, created inside
	            ``output_folder``.
	        audio_delay_seconds: Offset applied to the start of the audio.

	    Returns:
	        The full output path on success, or None when ffmpeg could not be
	        started or exited with a non-zero status.
	    """
	    # Construct the full path for the output file
	    output_file = os.path.join(output_folder, output_file)

	    # Argument list instead of a shell string: file names containing quotes
	    # or shell metacharacters can no longer break or alter the command.
	    cmd = [
	        'ffmpeg',
	        '-i', video_file,
	        '-itsoffset', str(audio_delay_seconds),  # delay the audio start
	        '-i', audio_file,
	        '-c:v', 'copy',
	        '-c:a', 'aac',
	        '-strict', 'experimental',
	        '-map', '0:v:0',
	        '-map', '1:a:0',
	        output_file,
	    ]
	    try:
	        exit_code = subprocess.call(cmd)
	    except OSError as exc:
	        print(f"Could not run ffmpeg: {exc}")
	        return None

	    if exit_code != 0:
	        print(f"ffmpeg exited with status {exit_code}; video was not created: {output_file}")
	        return None

	    print("Successfully made the video:", output_file)
	    return output_file

	def load_logo(logo_path, frame_width, frame_height, position='top'):
	    """Load a logo, scale it for the frame and compute where to draw it.

	    The logo is limited to a third of the frame width and a tenth of the
	    frame height (never enlarged at that step), then multiplied by 1.3.
	    It is centred horizontally and placed 100 pixels from the top or the
	    bottom edge.

	    Args:
	        logo_path: Path of the logo image; an alpha channel is kept.
	        frame_width: Frame width in pixels.
	        frame_height: Frame height in pixels.
	        position: ``'top'`` for the top edge; any other value means bottom.

	    Returns:
	        A tuple ``(logo, (x, y))`` with the resized logo array and the
	        top-left corner at which it should be overlaid.

	    Raises:
	        FileNotFoundError: If the logo image cannot be read.
	    """
	    logo = cv2.imread(logo_path, cv2.IMREAD_UNCHANGED)  # Load with alpha channel
	    if logo is None:
	        # cv2.imread signals failure by returning None rather than raising.
	        raise FileNotFoundError(f"Could not read logo image: {logo_path}")
	    logo_height, logo_width = logo.shape[:2]

	    # Scale the logo down if it is too big, then apply the 1.3 boost.
	    scale_factor = min(1, frame_width / 3 / logo_width, frame_height / 10 / logo_height)
	    new_size = (int(logo_width * scale_factor * 1.3), int(logo_height * scale_factor * 1.3))
	    logo = cv2.resize(logo, new_size, interpolation=cv2.INTER_AREA)

	    # Positioning
	    x_center = frame_width // 2 - logo.shape[1] // 2
	    if position == 'top':
	        y_pos = 100  # 100 pixels from the top
	    else:  # 'bottom'
	        y_pos = frame_height - logo.shape[0] - 100  # 100 pixels from the bottom

	    return logo, (x_center, y_pos)

	def overlay_logo(frame, logo_info):
	    """Draw a logo onto *frame* in place and return the frame.

	    *logo_info* is a ``(logo, (x, y))`` pair, where ``(x, y)`` is the
	    top-left corner of the logo inside the frame. A four-channel logo is
	    alpha-blended using its fourth channel; any other logo is copied over
	    the target region unchanged.
	    """
	    logo, (left, top) = logo_info
	    bottom = top + logo.shape[0]
	    right = left + logo.shape[1]

	    if logo.shape[2] != 4:
	        # No alpha channel: plain copy.
	        frame[top:bottom, left:right] = logo
	        return frame

	    # Blend the three colour channels at once using the logo's opacity.
	    opacity = logo[:, :, 3] / 255.0
	    transparency = 1.0 - opacity
	    region = frame[top:bottom, left:right, :3]
	    frame[top:bottom, left:right, :3] = (opacity[:, :, None] * logo[:, :, :3] +
	                                         transparency[:, :, None] * region)
	    return frame

	def get_authenticated_service():
	    """Build a YouTube API client, running the OAuth flow when needed.

	    Credentials are read from ``<script name>-oauth2.json``. When they are
	    missing or invalid, the OAuth flow is run and its result is stored in
	    that file.
	    """
	    oauth_flow = flow_from_clientsecrets(CLIENT_SECRETS_FILE, scope=YOUTUBE_UPLOAD_SCOPE)
	    token_store = Storage(f"{sys.argv[0]}-oauth2.json")

	    creds = token_store.get()
	    needs_login = creds is None or creds.invalid
	    if needs_login:
	        creds = run_flow(oauth_flow, token_store)

	    return build(YOUTUBE_API_SERVICE_NAME, YOUTUBE_API_VERSION, credentials=creds)

	def upload_video_to_drive(video_file, folder_id=None):
	    """Upload a video file to Google Drive and print the new file's id.

	    Args:
	        video_file: Path of the MP4 file to upload.
	        folder_id: Optional Drive folder id to place the file in.
	    """
	    # NOTE(review): this reads the same token file as
	    # get_authenticated_service, which requests a different scope -- confirm
	    # that stored credentials actually cover Drive.
	    token_store = Storage(f"{sys.argv[0]}-oauth2.json")
	    creds = token_store.get()

	    # Run the OAuth flow when there are no usable stored credentials.
	    if not creds or creds.invalid:
	        drive_flow = flow_from_clientsecrets(CLIENT_SECRETS_FILE, scope=[DRIVE_SCOPE])
	        creds = run_flow(drive_flow, token_store)

	    drive = build('drive', 'v3', credentials=creds)

	    metadata = {'name': os.path.basename(video_file), 'mimeType': 'video/mp4'}
	    if folder_id:
	        metadata['parents'] = [folder_id]

	    upload = MediaFileUpload(video_file, mimetype='video/mp4', resumable=True)
	    request = drive.files().create(body=metadata, media_body=upload, fields='id')
	    created = request.execute()

	    print('File ID: %s' % created.get('id'))

	def initialize_upload(youtube, options):
	    """Create a YouTube ``videos.insert`` request and start the upload.

	    Args:
	        youtube: YouTube API client used to build the insert request.
	        options: Dict with the keys ``title``, ``description``,
	            ``category``, ``privacyStatus`` and ``file``, plus an optional
	            comma-separated ``keywords`` string.
	    """
	    tags = None
	    keywords = options.get('keywords')
	    if keywords:
	        # Strip the whitespace left by "a, b, c" style lists and drop empty
	        # entries, so tags are not sent with leading spaces.
	        tags = [tag.strip() for tag in keywords.split(",") if tag.strip()] or None

	    body = dict(
	        snippet=dict(
	            title=options['title'],
	            description=options['description'],
	            tags=tags,
	            categoryId=options['category']
	        ),
	        status=dict(
	            privacyStatus=options['privacyStatus']
	        )
	    )

	    # Call the API's videos.insert method to create and upload the video.
	    insert_request = youtube.videos().insert(
	        part=",".join(body.keys()),
	        body=body,
	        # chunksize=-1 uploads the whole file in a single HTTP request; a
	        # failed upload is still resumed where it left off. Use a smaller
	        # chunk size (e.g. 1024 * 1024) for better recovery on unreliable
	        # connections.
	        media_body=MediaFileUpload(options["file"], chunksize=-1, resumable=True)
	    )

	    resumable_upload(insert_request)

	# This function resumes a failed upload, sleeping for a random, exponentially
	# growing interval between attempts.
	def resumable_upload(insert_request):
	    """Drive a resumable upload to completion, retrying transient errors.

	    Args:
	        insert_request: Request object whose ``next_chunk()`` returns a
	            ``(status, response)`` pair; ``response`` stays None until the
	            upload has finished.

	    Returns:
	        The final response of the upload (it contains the key ``'id'``).

	    Raises:
	        HttpError: For HTTP errors whose status is not retriable.
	        SystemExit: When the final response has no ``'id'`` or the retry
	            limit is exceeded.
	    """
	    response = None
	    retry = 0
	    while response is None:
	        # Reset per attempt; otherwise one transient failure would make
	        # every later, successful chunk look like a failure as well.
	        error = None
	        try:
	            print("Uploading file...")
	            _status, response = insert_request.next_chunk()
	        except HttpError as e:
	            if e.resp.status not in RETRIABLE_STATUS_CODES:
	                raise
	            error = "A retriable HTTP error %d occurred:\n%s" % (e.resp.status,
	                                                                 e.content)
	        else:
	            if response is not None:
	                if 'id' in response:
	                    print("Video id '%s' was successfully uploaded." % response['id'])
	                else:
	                    # sys.exit rather than the site-provided exit() helper,
	                    # which is not guaranteed to exist.
	                    sys.exit("The upload failed with an unexpected response: %s" % response)

	        if error is not None:
	            print(error)
	            retry += 1
	            if retry > MAX_RETRIES:
	                sys.exit("No longer attempting to retry.")

	            max_sleep = 2 ** retry
	            sleep_seconds = random.random() * max_sleep
	            print("Sleeping %f seconds and then retrying..." % sleep_seconds)
	            time.sleep(sleep_seconds)

	    return response

	def eleven_labs_text_to_speech(text, output_file):
	    """Synthesize *text* with the ElevenLabs API and save the MP3.

	    One of three voice ids is chosen at random for each call.

	    Args:
	        text: The text to speak.
	        output_file: Path of the MP3 file to write.

	    Returns:
	        *output_file* when the audio was written, or None when the API did
	        not answer with status 200. This mirrors text_to_speech, which
	        also returns the output path.
	    """
	    voice_ids = (
	        "ndntWUKwYjgJGYkvF6at",
	        "SVLJSgUbrKWfY8HvF2Xd",
	        "sjdiTCylizqR74A3ssv4",
	    )
	    # Randomly pick one of the voices
	    voice_id = random.choice(voice_ids)
	    url = f"https://api.elevenlabs.io/v1/text-to-speech/{voice_id}"

	    headers = {
	        "Accept": "audio/mpeg",
	        "Content-Type": "application/json",
	        "xi-api-key": ELEVENLABS_KEY
	    }

	    data = {
	        "text": text,
	        "model_id": "eleven_monolingual_v1",
	        "voice_settings": {
	            "stability": 0.5,
	            "similarity_boost": 0.5,
	            "speed": 0.3,
	        }
	    }

	    # The timeout keeps a stalled connection from blocking the script forever.
	    response = requests.post(url, json=data, headers=headers, timeout=60)
	    if response.status_code != 200:
	        print(f"Failed to synthesize speech: {response.content}")
	        return None

	    with open(output_file, 'wb') as f:
	        for chunk in response.iter_content(chunk_size=1024):
	            f.write(chunk)
	    print(f"Audio content written to {output_file}")
	    return output_file

	# Script entry: fetch a background, pick a Reddit title, voice it and render
	# the final video into the output folder.
	api_key = 'VhLwkCKi3iu5Pf37LXfz-Lp7hTW69EV8uw_hkLAPkiA'  # Replace with your Unsplash API key
	background_image = fetch_random_nature_image(api_key)

	if background_image:
	    # Choose a post and load the title that was saved for it.
	    fetch_reddit_data('Glitch_in_the_Matrix')
	    reddit_data = read_json('top_post.json')  # Change filename if needed
	    title = reddit_data.get('title')

	    # Unique base name for this run's output file.
	    filename = f"video_{uuid.uuid4()}"

	    # Voice-over (gTTS alternative kept for reference).
	    # voiceover_file = text_to_speech(title, 'voiceover.mp3')
	    voiceover_file = eleven_labs_text_to_speech(title, 'voiceover.mp3')

	    # The video is rendered to match the voice-over length.
	    audio_duration = get_audio_duration('voiceover.mp3')
	    create_video_from_title(title, background_image, "reddit_post_video_cv2.mp4", audio_duration)

	    # Mux the silent video with the voice-over.
	    combine_audio_video('reddit_post_video_cv2.mp4', 'voiceover.mp3', filename + '.mp4')

	    # Metadata for the (currently disabled) YouTube upload below.
	    options = dict(
	        file='output/' + filename + '.mp4',
	        title="Amazing Facts Revealed: Unveiling the World's Hidden Wonders #shorts",
	        description="Welcome to our latest YouTube video, 'Amazing Facts Revealed: Unveiling the World's Hidden Wonders'! In this enthralling episode, we dive deep into the most astonishing and lesser-known facts about our world. From the mysteries of the deep sea to the enigmas of outer space, we cover it all. Get ready to be amazed by incredible scientific discoveries, historical secrets, and mind-blowing natural phenomena. Each fact is meticulously researched and presented with stunning visuals and engaging narration. Don't forget to like, share, and subscribe for more fascinating content. Stay curious and let's explore the wonders of our world together #shorts",
	        category="22",
	        keywords="facts, shorts, funny",
	        privacyStatus="private",
	    )

	    # try:
	    #     youtube = get_authenticated_service()
	    #     initialize_upload(youtube, options)
	    #     upload_video_to_drive('output/'+ filename + '.mp4','1t2lcYNLgz6FTeabzccY_06rvcnTGdQiR')
	    # except HttpError as e:
	    #     print("An HTTP error %d occurred:\n%s" % (e.resp.status, e.content))