# a13_3_save_audio_only.py

#%%
import getpass,sys,socket
# add path for the library
# from import_basics import *
sys.path.pop(-1)
from moviepy.editor import ImageClip, AudioFileClip

from moviepy.editor import VideoFileClip, concatenate_videoclips
from moviepy.editor import TextClip
from moviepy.video.tools.subtitles import SubtitlesClip
import yfinance as yf

from youtube_data import *
from ai_moderator import *
from utils import *
from dataframe_stuff import *
from make_credentials import *
from spreadsheet import *

from pathlib import Path
from openai import OpenAI


def find_exchange(ticker):
    """Return the exchange code for *ticker*, caching new lookups in a workbook.

    The local "exchange list.xlsx" workbook is consulted first.  When the
    ticker is not listed there, the exchange is scraped from the ticker's
    ycharts.com company page and the workbook is rewritten with the new row.

    Args:
        ticker: Ticker symbol, compared against the ``ticker`` column.

    Returns:
        The ``Exchange`` value stored for the ticker, or the freshly scraped
        exchange string when the ticker was not in the workbook.

    Raises:
        IndexError: If the ycharts page does not contain the expected
            ``&nbsp;|&nbsp;`` separated markup.
    """
    exchange_file = f"/Users/{getpass.getuser()}/Library/CloudStorage/GoogleDrive-ryan.ichun9@gmail.com/My Drive/ibkr/2 import data/IBKR/4 exchange list/exchange list.xlsx"
    df1 = pd.read_excel(exchange_file, index_col=0)

    exchange1 = 0
    cached = df1.loc[df1['ticker'] == ticker, 'Exchange']
    if not cached.empty:
        # Same outcome as scanning every row: the last matching row wins.
        exchange1 = cached.iloc[-1]

    if exchange1 == 0:
        print("not existing exchange info : ", ticker)

        url = "https://ycharts.com/companies/{}".format(ticker)
        payload = ""
        headers = {
            "cookie": "ycsessionid=2qz3d4y9pia7lsirwduwfoqsy68lxo0u; _ga=GA1.2.635129160.1644138754; _gid=GA1.2.916019816.1644138754; __gads=ID=93bc25b5583902a4-22af5cc377d00013:T=1644138753:S=ALNI_MZo9l0xXkE31mqmewQtnKQnTUUD5Q; __hstc=69688216.203ddbd23f614854901d1b6290dd0cc4.1644138757373.1644138757373.1644138757373.1; hubspotutk=203ddbd23f614854901d1b6290dd0cc4; __hssrc=1; _fbp=fb.1.1644138757715.487408360; _gcl_au=1.1.38652961.1644138758; quickflowsSingleSecurityCookieName=%7B%22displaySecurityId%22%3A%22AAPL%22%2C%22securityId%22%3A%22AAPL%22%7D; messagesUtk=a7090410a7a24598b5f7b00924eb45a1; page_view_ctr=3; __hssc=69688216.3.1644138757373",
            "authority": "ycharts.com",
            "cache-control": "max-age=0",
            "sec-ch-ua-mobile": "?0",
            "sec-ch-ua-platform": "macOS",
            "upgrade-insecure-requests": "1",
            "user-agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/97.0.4692.71 Safari/537.36",
            "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
            "sec-fetch-site": "cross-site",
            "sec-fetch-mode": "navigate",
            "sec-fetch-user": "?1",
            "sec-fetch-dest": "document",
            "referer": "https://www.google.com/",
            "accept-language": "en-US,en;q=0.9,ko;q=0.8"
        }
        response = requests.request("GET", url, data=payload, headers=headers)
        data = response.text
        # The exchange name sits on the line after the first "&nbsp;|&nbsp;" separator.
        exchange1 = data.split("&nbsp;|&nbsp;")[1].split("\n")[1].replace(" ", "")

        print("scrape ychart", ticker, exchange1)
        new_row = pd.DataFrame.from_dict({"ticker": [ticker], "Exchange": [exchange1]})

        # DataFrame.append was removed in pandas 2.0; concat is the supported
        # replacement.  keep="last" lets the scraped row override older ones.
        df = pd.concat([df1, new_row], ignore_index=True)
        df = df.drop_duplicates(keep="last", subset="ticker").reset_index(drop=True)
        df.to_excel(exchange_file)
    return exchange1


def make_final_video(ticker):
    """Join the intermediate clips of *ticker* into one 1920x1080 video.

    Every file in ``data/youtube4/{ticker}/`` is loaded in sorted path order,
    resized to 1920x1080, concatenated, and written to
    ``data/youtube3/{unix_timestamp}.mp4`` (libx264, 30 fps).  After a
    successful render the intermediate videos and the ticker's audio files
    are deleted through ``remove_files``.

    Args:
        ticker: Name of the sub-folder under ``data/youtube4`` and
            ``data/audios`` to process.
    """
    inter_folder = f'data/youtube4/{ticker}/'
    clip_paths = sorted(inter_folder + name for name in os.listdir(inter_folder))

    video_clips = []
    final_video = None
    try:
        for path in clip_paths:
            video_clips.append(VideoFileClip(path).resize(newsize=(1920, 1080)))

        final_video = concatenate_videoclips(video_clips)

        timestamp1 = str(int(datetime.now().timestamp()))
        final_video.write_videofile(f"data/youtube3/{timestamp1}.mp4", codec="libx264", fps=30)
    finally:
        # Release the clips even when loading or rendering fails.
        for clip in video_clips:
            clip.close()
        if final_video is not None:
            final_video.close()

    # Only reached when the render succeeded, so inputs survive a failed run.
    remove_files(f'data/youtube4/{ticker}')
    remove_files(f'data/audios/{ticker}')

def make_inter_videos(ticker,audio_path_list,image_files):
    """Render one still-image video per audio file for *ticker*.

    For every path in *audio_path_list*, each image in *image_files* becomes a
    clip lasting the full audio duration; the clips are composed, the result's
    duration is set to the audio length, the audio is attached, and the video
    is written to ``data/youtube4/{ticker}/{unix_timestamp}.mp4`` at 30 fps.
    This is best effort: a failure for one audio file is printed and the loop
    moves on to the next one.

    Args:
        ticker: Sub-folder name under ``data/youtube4`` for the output.
        audio_path_list: Paths of the audio files, one video per entry.
        image_files: Paths of the images to show in every video.
    """
    video_path = f"data/youtube4/{ticker}"
    frame_rate = 30

    for ii, audio_file in enumerate(audio_path_list):
        audio_clip = None
        video_clip = None
        try:
            os.makedirs(video_path, exist_ok=True)
            timestamp1 = str(int(datetime.now().timestamp()))
            output_video_file = f"data/youtube4/{ticker}/{timestamp1}.mp4"

            audio_clip = AudioFileClip(audio_file)
            audio_duration = audio_clip.duration

            image_clips = [ImageSequenceClip([img], durations=[audio_duration]) for img in image_files]
            video_clip = concatenate_videoclips(image_clips, method="compose")
            video_clip = video_clip.set_duration(audio_duration).set_audio(audio_clip)

            # NOTE(review): replace('-', '') strips hyphens from the whole
            # path, including the ticker folder name -- confirm this is intended.
            video_clip.write_videofile(output_video_file.replace('-',''), codec="libx264", fps=frame_rate)
            print("ii: ",ii,len(audio_path_list))
        except Exception as e:
            print( 0 ,' = >>> some error = ',e)
        finally:
            # Close the clips on both the success and the failure path.
            if video_clip is not None:
                video_clip.close()
            if audio_clip is not None:
                audio_clip.close()
def audio_download(folder,name_prefix,input1,role):
    """Turn *input1* into speech and store it as an MP3 file.

    The audio is requested from the module-level ``client`` through
    ``audio.speech.create`` with the "tts-1" model and saved to
    ``data/audios/{folder}/{name_prefix}.mp3``; the folder is created when
    missing.

    Args:
        folder: Sub-folder of ``data/audios`` to write into.
        name_prefix: File name without the ``.mp3`` extension.
        input1: Text to synthesize.
        role: One of 'man1', 'man2', 'man3', 'woman1', 'woman2', 'woman3'.

    Returns:
        The path of the written MP3 file.

    Raises:
        KeyError: If *role* is not one of the known roles.
    """
    voice_by_role = {
        'man1': 'echo',
        'man2': 'fable',
        'man3': 'onyx',
        'woman1': 'alloy',
        'woman2': 'nova',
        'woman3': 'shimmer'
    }

    target_dir = f"data/audios/{folder}"
    if not os.path.exists(target_dir):
        os.makedirs(target_dir)

    speech_file_path = f"data/audios/{folder}/{name_prefix}.mp3"
    speech = client.audio.speech.create(
        model="tts-1",
        voice=voice_by_role[role],
        input=input1,
    )
    speech.stream_to_file(speech_file_path)
    return speech_file_path
def get_stock_details(ticker):
    """Look up basic company facts for *ticker*.

    yfinance is tried first.  If anything in that lookup raises, the error is
    printed and the Polygon ticker-reference endpoint is queried instead.
    Every field starts at 0 and keeps whatever value it had when a lookup
    failed part-way through.

    Returns:
        Tuple ``(market_cap, industry, short_description, company_name, PE)``
        where the market cap is divided by 1e9 and rounded to two decimals,
        and the yfinance company name is the text of the business summary up
        to its first '.'.
    """
    cap = sector = summary = name = pe_ratio = 0
    try:
        yf_ticker = yf.Ticker(ticker)

        # ``info`` is a dictionary holding the details about the stock.
        details = yf_ticker.info

        cap = yf_ticker.info.get('marketCap')
        cap = round(cap / 1000000000, 2)
        sector = details.get('industry', 'N/A')
        summary = details.get('longBusinessSummary', 'N/A')
        name = summary.split('.')[0]
        pe_ratio = details.get('trailingPE')
    except Exception as e:
        print('error here 13: ',ticker,e)
        try:
            endpoint = f'https://api.polygon.io/v3/reference/tickers/{ticker}?apiKey={polygon_api_key}'
            reply = requests.get(endpoint)
            # Fail on HTTP errors before parsing the body.
            reply.raise_for_status()

            row = pd.DataFrame(reply.json()['results'], index=[0])
            summary = row['description'][0]
            cap = row['market_cap'][0]
            cap = round(cap / 1000000000, 2)
            name = row['name'][0]
        except Exception as e:
            print('double error ',ticker,e)

    return cap, sector, summary, name, pe_ratio

# def audio_download(name_prefix,input1):
#     speech_file_path = f"data/audios/{name_prefix}.mp3"
#     response = client.audio.speech.create(
#     model="tts-1",
#     voice="alloy",
#     input=input1
#     )

#     response.stream_to_file(speech_file_path)
#     return 

# f'https://www.google.com/search?q={search}&tbm=isch'
# Module-level index; the functions in this file use their own local `ii`
# loop variables, and the main loop at the bottom rebinds this name.
# NOTE(review): the initial value looks unused -- confirm before removing.
ii=0

def save_news_images(list1):
    """Save Bing image thumbnails and narration audio for news headlines.

    Entries of *list1* longer than 10 characters are used as search queries.
    For each query the first five ``img.mimg`` elements of the Bing image
    search page are saved to ``data/news_images/{query[:20]} {n}.png``.
    Afterwards one speech file per query is produced with ``audio_download``.

    Args:
        list1: Iterable of headline strings.

    Returns:
        The list of queries that were processed.
    """
    import base64
    from urllib.parse import quote_plus

    search_list = [item for item in list1 if len(item) > 10]

    folder_name = 'data/news_images'
    os.makedirs(folder_name, exist_ok=True)

    for search in search_list:
        time.sleep(1)
        # Encode the headline so characters such as '&' or '#' stay in the query.
        driver.get(f'https://www.bing.com/images/search?q={quote_plus(search)}&form=HDRSC3')

        thumbnails = driver.find_elements(By.XPATH, '//img[@class="mimg"]')
        for iii, item in enumerate(thumbnails[:5]):
            src = item.get_attribute('src')
            if not src:
                continue

            if src.startswith('data:'):
                # Inline thumbnail (data URI): requests cannot fetch it, so
                # decode the base64 payload that follows the first comma.
                header, _, payload = src.partition(',')
                if ';base64' not in header:
                    continue
                image_data = base64.b64decode(payload)
            else:
                response = requests.get(src)
                # Only keep the image when the download succeeded.
                if response.status_code != 200:
                    continue
                image_data = response.content

            name = search[:20] + f" {iii}"
            local_file_path = f'{folder_name}/{name}.png'
            with open(local_file_path, 'wb') as file:
                file.write(image_data)

    for ii, search in enumerate(search_list):
        name_prefix = search[:20]
        # audio_download takes (folder, name_prefix, input1, role); the former
        # two-argument call raised TypeError.  '.' keeps the files directly
        # under data/audios/ and 'woman1' selects the 'alloy' voice.
        audio_download('.', name_prefix, search, 'woman1')
        print(ii)
    return search_list


# Example of an inline image `src` value (a data URI rather than an http(s) URL);
# the base64 payload is truncated here:
# data:image/jpeg;base64,/9j/4AAQSkZJRgABAQAAAQABAAD/2wCEAAkGBwgHBgkIBwgKCgkLDRYPDQwMDRsUFRAWIB0iIiAdHx8k...

# with open(local_file_path, 'wb') as file:
#     #identify image to be captured
#     #write file
#     file.write(content.screenshot_as_png)
#     print(f"Image downloaded and saved to {local_file_path}")

import cv2
from moviepy.editor import VideoFileClip, AudioFileClip
from moviepy.video.io.ffmpeg_tools import ffmpeg_extract_subclip

# Directory containing the images and audio file
# def make_video(audio_folder,image_folder,image_name_prefix):

#     # List of image filenames (change these to match your file names)
#     imagelist=os.listdir(image_folder)
#     imagelist=[item for item in imagelist if image_name_prefix in item]
#     # image_files = ["image1.jpg", "image2.jpg", "image3.jpg", "image4.jpg", "image5.jpg"]

#     # Audio file name (change this to match your audio file)
#     audio_file = audio_folder+ f"{image_name_prefix}.mp3"

#     # Video output file name
#     output_video_file = f"data/youtube2/{image_name_prefix}.mp4"

#     # Frame rate (number of frames per second)
    
#     # Duration of each image in seconds
    
    
#     # Load the audio file
#     audio = AudioFileClip(audio_folder + audio_file)
#     audio=audio.volumex(1.7)
#     frame_rate = 24
    
#     audio_duration = audio.duration
#     each_length=audio_duration/len(imagelist)
#     image_duration = int(each_length)
#     # Create a video writer object
#     fourcc = cv2.VideoWriter_fourcc(*'mp4v')
#     video_writer = cv2.VideoWriter(output_video_file, fourcc, frame_rate, (audio.fps * 2, audio.fps * 2))

#     # Loop through the images and add them to the video
#     for image_file in image_files:
#         image = cv2.imread(image_folder + image_file)
#         for _ in range(int(audio.fps * image_duration)):
#             video_writer.write(image)

#     # Release the video writer
#     video_writer.release()

#     # Combine the video with the audio
#     final_video = VideoFileClip(output_video_file)
#     final_video = final_video.set_audio(audio)

#     # Write the final video to a file
#     final_video.write_videofile(output_video_file, codec="libx264")

#     # Clean up temporary files
#     final_video.close()


def remove_files(folder1):
    """Delete every regular file directly inside *folder1*.

    Sub-directories are left in place.  Each deletion is printed; an error
    while handling one entry is printed and does not stop the loop.

    Args:
        folder1: Directory whose files are removed.
    """
    for entry in os.listdir(folder1):
        target = os.path.join(folder1, entry)
        try:
            if not os.path.isfile(target):
                continue
            os.remove(target)
            print(f"Deleted: {target}")
        except Exception as err:
            print(f"Error deleting {target}: {str(err)}")

def youtube_upload(video_title,description,file_name='data/youtube3/final.mp4'):
    """Upload a video file to YouTube as a public video tagged "news".

    The title is ``{US/Eastern timestamp}_{video_title}_news``.

    Args:
        video_title: Text embedded in the video title.
        description: Video description.
        file_name: Path of the video to upload.  Defaults to the path that
            used to be hard-coded, so existing callers are unaffected.

    Returns:
        The API response returned once the upload has completed.
    """
    youtuber = YoutuberDummyParameters()

    # prepare the extractor for client
    youtube = youtuber.YoutubeExtractor(local_api=False)

    # NOTE(review): the format has minutes and seconds but no hour -- confirm.
    today1 = datetime.now(timezone('US/Eastern')).strftime("%Y-%m-%d %M%S")

    title = f'{today1}_{video_title}_news'
    request = youtube.videos().insert(
        part="snippet,status",
        body={
            "snippet": {
                "categoryId": '22',
                "description": description,
                "title": title,
                # snippet.tags is a list of strings in the videos resource.
                "tags": ['news'],
            },
            "status": {
                "privacyStatus": 'public',
            },
        },
        media_body=googleapiclient.http.MediaFileUpload(file_name, chunksize=-1, resumable=True),
    )

    # next_chunk() returns (status, response); response stays None until the
    # upload is finished.  With chunksize=-1 this normally takes one call.
    response = None
    while response is None:
        _, response = request.next_chunk()
    return response


from PIL import Image, ImageDraw, ImageFont
def make_text_image(text,filepath):
    """Draw *text* in black on a 400x400 white image and save it.

    Args:
        text: Text to draw, starting at pixel (50, 50) with PIL's default font.
        filepath: Destination path; the image format follows its extension.
    """
    canvas_size = (400, 400)
    white = (255, 255, 255)
    black = (0, 0, 0)

    canvas = Image.new('RGB', canvas_size, white)
    pen = ImageDraw.Draw(canvas)
    pen.text((50, 50), text, fill=black, font=ImageFont.load_default())
    canvas.save(filepath)
    canvas.close()
import openai
from moviepy.editor import VideoFileClip, ImageSequenceClip
import os

# Read the OpenAI API key from the first line of the file named by
# `path_to_openai_api` and expose it through the environment and the
# `openai` module.
path1=f'{path_to_openai_api}'
with open(path1,'r') as f:
    # readline() keeps the trailing newline; strip it so it is not sent as
    # part of the key.
    key=f.readline().strip()
os.environ["OPENAI_API_KEY"] = key
openai.api_key = key


from twilio.rest import Client
import yagmail
from datetime import datetime,timedelta
import pandas as pd
# Twilio and yagmail credentials / sessions used for notifications.
# Your Account SID from twilio.com/console
# NOTE(review): the "{...}" values are plain strings (no f-prefix), presumably
# placeholders to be substituted before running -- confirm.
account_sid = "{account_sid_twilio}"
auth_token  = "{auth_token_twilio}"
# Twilio REST client. The name `client` is rebound to an OpenAI client further
# down in this file (`client = OpenAI()`).
client = Client(account_sid, auth_token)
sender='{id_yagmail}'
#receiver='bluerand3@gmail.com'
email1=sender
passw1='{password_yagmail}'
passw1='{password_yagmail}'
# SMTP session that send_email() uses.
yag = yagmail.SMTP(user=sender,password=passw1)
content1='1'
subject1='1'
def send_email(to_email,title,content):
    """Send an e-mail through the module-level yagmail session ``yag``.

    Args:
        to_email: Recipient address.
        title: Subject line.
        content: Message contents.
    """
    message = {"to": to_email, "subject": title, "contents": content}
    yag.send(**message)


import openai,getpass,os
from openai import OpenAI

# Read the OpenAI API key from the first line of the file named by
# `path_to_openai_api`.  This stanza used to run twice in a row with
# identical effect; once is enough.
path1=f'{path_to_openai_api}'
with open(path1,'r') as f:
    # readline() keeps the trailing newline; strip it so it is not sent as
    # part of the key.
    key=f.readline().strip()
os.environ["OPENAI_API_KEY"] = key
openai.api_key = key

# OpenAI client used by audio_download() and gpt_answer().
client = OpenAI()

def gpt_answer(content,define):
    """Ask the "gpt-3.5-turbo" chat model about *content*.

    Args:
        content: User message; converted with ``str()`` before sending.
        define: System message that tells the model what to do.

    Returns:
        The text of the first choice, or a string starting with
        ``'>> error = time out for gpt...'`` followed by the exception text
        when anything in the request fails.
    """
    try:
        system_msg = {"role": "system", "content" : define}
        user_msg = {"role": "user", "content" : str(content)}
        reply = client.chat.completions.create(
            model="gpt-3.5-turbo",
            messages=[system_msg, user_msg],
        )
        answer = reply.choices[0].message.content
    except Exception as err:
        answer = '>> error = time out for gpt...' + str(err)
    return answer
# define='summarize based on why the stock is going up.'
# summary=gpt_answer(content,define)
# summary


def find_repeated_substrings(word_list, min_length=2, min_repeats=3):
    """Count substrings across *word_list* and keep the frequent ones.

    Every substring of at least *min_length* characters of every word is
    counted (each occurrence counts, also within one word).

    Args:
        word_list: Iterable of strings.
        min_length: Shortest substring length to consider.
        min_repeats: Minimum number of occurrences to be reported.

    Returns:
        Dict mapping each substring seen at least *min_repeats* times to its
        occurrence count.
    """
    tally = Counter(
        word[lo:hi]
        for word in word_list
        for lo in range(len(word))
        for hi in range(lo + min_length, len(word) + 1)
    )
    return {piece: seen for piece, seen in tally.items() if seen >= min_repeats}

# Sample list of words
# words = ['이미스머리띠', '샤넬머리띠', '티아라', '명품머리띠', '산리오머리띠', '벨벳머리띠', '고양이머리띠', '왕관', '밴드', '눈']

# Find repeated substrings
# repeated_substrs = find_repeated_substrings(keyword_list, min_length=2, min_repeats=3)
# repeated_substrs

def find_longest_repeated_substrings(word_list, min_length=2, min_repeats=3):
    """Pick the best repeated substring across *word_list*.

    Substrings of at least *min_length* characters are counted over all
    words.  Among those seen at least *min_repeats* times, the one with the
    highest count wins; length breaks ties, and the earliest counted
    substring wins a full tie.

    Returns:
        The winning substring, or ``None`` when nothing repeats often enough.
    """
    tally = Counter()
    for word in word_list:
        size = len(word)
        tally.update(
            word[lo:hi]
            for lo in range(size)
            for hi in range(lo + min_length, size + 1)
        )

    winner = None
    winner_rank = None
    for piece, seen in tally.items():
        if seen < min_repeats:
            continue
        rank = (seen, len(piece))
        # Strict comparison keeps the first candidate on a tie.
        if winner_rank is None or rank > winner_rank:
            winner, winner_rank = piece, rank
    return winner

from selenium import webdriver
import undetected_chromedriver as uc
from webdriver_manager.chrome import ChromeDriverManager
from selenium.webdriver.common.keys import Keys
from selenium.webdriver.chrome.service import Service
import pickle
import time 
import pandas as pd
from selenium.webdriver.common.by import By
from fake_useragent import UserAgent
import requests
import os
import re
from collections import Counter
# Make sure the download folder exists in the current working directory and
# report which case applied.
folder_name = "taobao_download"
if os.path.exists(folder_name):
    print(f"Folder '{folder_name}' already exists.")
else:
    os.mkdir(folder_name)
    print(f"Folder '{folder_name}' created successfully.")


import re

def scroll_down(driver, num_scrolling):
    """Scroll the page down by sending PAGE_DOWN keys to its <body>.

    Args:
        driver: Selenium WebDriver showing the page.
        num_scrolling: Number of rounds; each round sends PAGE_DOWN twice
            with a 0.5 s pause after each key press.
    """
    page_body = driver.find_element(By.TAG_NAME, 'body')
    for _ in range(num_scrolling):
        for _ in range(2):
            page_body.send_keys(Keys.PAGE_DOWN)
            time.sleep(0.5)
    return
def extract_number(text):
    """Return the first parenthesised integer in *text*, or 0 if there is none.

    Only digits directly enclosed in parentheses, e.g. ``"(42)"``, match.
    """
    found = re.search(r'\((\d+)\)', text)
    return int(found.group(1)) if found else 0


from datetime import datetime,timedelta
import sys,os,copy,ast,socket,random,math,webbrowser,getpass,time,shutil,requests,re
import numpy as np
import pandas as pd
from pytz import timezone
import matplotlib.pyplot as plt
from newsapi import NewsApiClient

def fetch_news_for_query(api_key, query, language='en', page_size=5):
    """Search NewsAPI for *query* and collect title/description pairs.

    Args:
        api_key: NewsAPI key.
        query: Search text.
        language: Article language code.
        page_size: Maximum number of articles requested.

    Returns:
        List of ``(title, description)`` tuples ordered by relevancy, or
        ``None`` (after printing a notice) when no articles were returned.
    """
    newsapi = NewsApiClient(api_key=api_key)
    payload = newsapi.get_everything(
        q=query,
        language=language,
        sort_by="relevancy",  # most relevant articles first
        page_size=page_size,
    )

    found = payload.get('articles')
    if not found:
        print("No news found!")
        return None

    pairs = []
    for article in found:
        headline = article.get('title')
        print(f"Title: {headline}")
        pairs.append((headline, article.get('description')))
    return pairs


# NewsAPI keys: the main loop tries `newsapi_org` first and falls back to
# `newsapi_org2` when the first request raises.
# NOTE(review): `newsapi_org` is a literal "{...}" placeholder string.
# NOTE(review): `newsapi_org2` is a hard-coded API key committed to source --
# rotate it and load it from the environment or a secrets file instead.
newsapi_org='{newsapi_org}'
newsapi_org2='34ebf11591e045c4bbd2586c400c8b59'

def generate_company_name(ticker):
    """Fetch the company name for *ticker* from the Polygon reference API.

    The full JSON reply and the resulting name are printed.

    Returns:
        The ``results.name`` field cut at its first '.'.

    Raises:
        requests.HTTPError: If the HTTP request did not succeed.
    """
    endpoint = f"https://api.polygon.io/v3/reference/tickers/{ticker}?apiKey={polygon_api_key}"
    reply = requests.get(endpoint)
    # Fail on HTTP errors before parsing the body.
    reply.raise_for_status()

    payload = reply.json()
    print("data: ",payload)

    short_name = payload['results']['name'].split('.')[0]
    print("company_name: ",short_name)
    return short_name


import pyautogui as pt
# Earlier watch-list, kept for reference:
# tickers=['LPG','JAKK','LXEO','RMBS','VRNS']
tickers=['ZS','NET','CRWD','NOW','NU','KTOS','DDOG','DCBO','CLS','QLYS','PCAR','MLM','GRMN','PTC','FDS','DKNG','AKAM','VRT','MANH','NTNX','GWRE','FIX','ENSG','OBDC','GPI']

# Voice used for each anchor in the generated dialogue; any other speaker
# label falls back to 'man2'.
anchor_roles={'Jim':'man3','Kelly':'woman2'}

# For every ticker from the 10th entry on: collect news, have GPT summarize
# it, and synthesize the narration audio (company description, summary, and
# one clip per dialogue line).
for ticker in tickers[9:]:

    exchange=find_exchange(ticker)
    url=f'https://www.tradingview.com/chart/tMeJexox/?symbol={exchange}%3A{ticker}'

    screenshot_path=f'data/tradingview_images/{ticker}.png'

    company_name=generate_company_name(ticker)
    try:
        news=fetch_news_for_query(newsapi_org, query=f'{company_name}',page_size=10)
    except Exception:
        # The first key failed (a bare `except:` here would also have caught
        # KeyboardInterrupt); retry with the second key.
        news=fetch_news_for_query(newsapi_org2, query=f'{company_name}',page_size=10)

    url1=f'https://api.polygon.io/v2/reference/news?ticker={ticker}&apiKey={polygon_api_key}'
    response = requests.get(url1)

    # Parse the JSON result
    data = response.json()

    # Descriptions of the first five articles; an error reply without
    # 'results' yields an empty list instead of a KeyError.
    new_list2=[article.get('description') for article in data.get('results', [])[:5]]
    print("\n>> len(new_list2)= ", len(str(new_list2)))

    define='give me news anchors Jim and Kelly summarizing about the given news.'
    # gpt_answer(content, define): the news is the user content and the
    # instruction is the system message (the arguments used to be swapped).
    news2=gpt_answer(str(new_list2),define)

    print("\n>> len(news2)= ", len(news2))

    # Split the reply into (speaker, dialogue) pairs, one per "Speaker: text" line.
    dialogue_dict = []
    for line in news2.split('\n'):
        if ': ' in line:
            speaker, dialogue = line.split(': ', 1)
            dialogue_dict.append((speaker,dialogue))

    news=str(news)
    define=f'summarize based on why the {company_name} stock is going up.'
    news=gpt_answer(news,define)

    MC,industry, description,company_name,PE_ratio = get_stock_details(ticker)

    audio_path=[]

    a1=audio_download(ticker,'a1',description,'man1')
    audio_path.append(a1)

    a2=audio_download(ticker,'a2',news,'woman1')
    audio_path.append(a2)

    for ii,(actor,content) in enumerate(dialogue_dict):
        a1=audio_download(ticker,f'b{ii}',content,anchor_roles.get(actor,'man2'))
        print(ii,actor)
        audio_path.append(a1)

    image_files=[screenshot_path]
    # make_inter_videos(ticker,audio_path,image_files)
# %%