diff --git a/.gitignore b/.gitignore
new file mode 100644
index 0000000..022f7f9
--- /dev/null
+++ b/.gitignore
@@ -0,0 +1,7 @@
+
+.env
+__pycache__/custom_tools.cpython-310.pyc
+email_pairs.csv
+faq.csv
+past_email_mbox.csv
+Sent.mbox
diff --git a/app.py b/app.py
new file mode 100644
index 0000000..55d36c7
--- /dev/null
+++ b/app.py
@@ -0,0 +1,54 @@
+from dotenv import load_dotenv
+
+from langchain.agents import initialize_agent
+from langchain.agents import AgentType
+from langchain.chat_models import ChatOpenAI
+from langchain.prompts import MessagesPlaceholder
+from langchain.memory import ConversationSummaryBufferMemory
+from langchain.schema import SystemMessage
+from custom_tools import CreateEmailDraftTool, GenerateEmailResponseTool, ReplyEmailTool, EscalateTool, ProspectResearchTool, CategoriseEmailTool
+
+load_dotenv()
+llm = ChatOpenAI(temperature=0, model="gpt-3.5-turbo-0613")
+
+system_message = SystemMessage(
+    content="""
+    You are the email inbox assistant for "AI Jason", a YouTube channel
+    that creates AI educational content.
+    Your goal is to handle all incoming emails by categorising them based on
+    the guidelines and deciding on the next steps.
+    """
+)
+
+tools = [
+    CategoriseEmailTool(),
+    ProspectResearchTool(),
+    EscalateTool(),
+    ReplyEmailTool(),
+    CreateEmailDraftTool(),
+    GenerateEmailResponseTool(),
+]
+
+agent_kwargs = {
+    "extra_prompt_messages": [MessagesPlaceholder(variable_name="memory")],
+    "system_message": system_message,
+}
+memory = ConversationSummaryBufferMemory(
+    memory_key="memory", return_messages=True, llm=llm, max_token_limit=1000)
+
+agent = initialize_agent(
+    tools,
+    llm,
+    agent=AgentType.OPENAI_FUNCTIONS,
+    verbose=True,
+    agent_kwargs=agent_kwargs,
+    memory=memory,
+)
+
+
+test_email = """
+xxxxxxx
+"""
+
+agent({"input": test_email})
diff --git a/custom_tools.py b/custom_tools.py
new file mode 100644
index 0000000..12d90c1
--- /dev/null
+++ b/custom_tools.py
@@ -0,0 +1,464 @@
+import os
+from dotenv import load_dotenv, find_dotenv
+import openai
+
+from langchain import PromptTemplate
+from langchain.agents import initialize_agent, Tool
+from langchain.agents import AgentType
+from langchain.chat_models import ChatOpenAI
+from langchain.prompts import MessagesPlaceholder
+from langchain.memory import ConversationSummaryBufferMemory
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain.chains.summarize import load_summarize_chain
+from langchain.tools import BaseTool
+from pydantic import BaseModel, Field
+from typing import Type
+from bs4 import BeautifulSoup
+import requests
+import json
+from langchain.schema import SystemMessage
+
+load_dotenv(find_dotenv())
+openai.api_key = os.environ.get("OPENAI_API_KEY")
+llm = ChatOpenAI(temperature=0, model="gpt-3.5-turbo-16k-0613")
+
+
+# CATEGORISE EMAIL
+def check_consulting_email(latest_reply: str):
+    # Ask GPT-4 whether the consulting email already contains all the info we need
+    prompt = f"""
+    EMAIL: {latest_reply}
+    ---
+
+    Above is an email about a job offer / consulting request; your goal is to identify whether all of the information below is mentioned:
+    1. What's the problem the prospect is trying to solve?
+    2. Their budget
+
+    If all the info above has been collected, return YES; otherwise, return NO (return ONLY YES or NO).
+
+    ANSWER:
+    """
+
+    all_needs_collected_result = openai.ChatCompletion.create(
+        model="gpt-4",
+        messages=[
+            {"role": "user", "content": prompt}
+        ]
+    )
+
+    # Strip whitespace so the YES/NO comparison is reliable
+    all_needs_collected = all_needs_collected_result["choices"][0]["message"]["content"].strip()
+
+    return all_needs_collected
+
+
+def categorise_email(latest_reply: str):
+    categorise_prompt = f"""
+    EMAIL: {latest_reply}
+    ---
+
+    Your goal is to categorise the email based on the categories below:
+
+    1. COLLABORATION/SPONSORSHIP: These are emails where companies or individuals are reaching out to propose a collaboration or sponsorship opportunity with AI Jason. They often include details about their product or service and how they envision the partnership.
+
+    2. JOB_OFFER/CONSULTING: These emails involve individuals or companies reaching out to AI Jason with a specific job or project they want him to work on. This could range from developing an AI application to leading a specific activity.
+
+    3. QUESTIONS: These emails involve individuals reaching out to AI Jason with specific questions or inquiries. This could be about his videos, his knowledge of a specific topic, or his thoughts on a specific AI tool or technology.
+
+    4. NON_REPLY: These are auto emails that don't need any response, or emails from companies or individuals reaching out to AI Jason to offer their services. This could be a marketing agency offering to help him find sponsorship opportunities or a company offering a specific tool or service they think he might find useful.
+
+    5. OTHER: These are emails that don't fit into any of the above categories.
+
+    CATEGORY (Return ONLY the category name, in capitals):
+    """
+
+    category_result = openai.ChatCompletion.create(
+        model="gpt-4",
+        messages=[
+            {"role": "user", "content": categorise_prompt}
+        ]
+    )
+
+    category = category_result["choices"][0]["message"]["content"].strip()
+
+    if category == "JOB_OFFER/CONSULTING":
+        all_needs_collected = check_consulting_email(latest_reply)
+        if all_needs_collected == "YES":
+            return {
+                "Step 1": """Forward the email to jason.zhou.design@gmail.com, with a summary of: 1. What's the problem the prospect is trying to solve?
+                2. Their budget"""
+            }
+        else:
+            return {
+                "Step 1": "Generate an email response to the prospect to collect further info based on the guidelines",
+                "Step 2": "Send the generated email response to the prospect",
+            }
+    elif category == "COLLABORATION/SPONSORSHIP":
+        return {
+            "Step 1": "Research the prospect & company",
+            "Step 2": "Forward the email to jason.zhou.design@gmail.com, with the research results included"
+        }
+    elif category == "NON_REPLY":
+        return "This email has already been taken care of or replied to before; nothing needs to be done now"
+    else:
+        return {
+            "Step 1": "Generate an email response based on the guidelines",
+            "Step 2": "Create an email draft with the generated response"
+        }
+
+
+class CategoriseEmailInput(BaseModel):
+    latest_reply: str = Field(description="Latest reply from the prospect")
+
+
+class CategoriseEmailTool(BaseTool):
+    name = "categorise_email"
+    description = "use this to categorise an email to decide what to do next"
+    args_schema: Type[BaseModel] = CategoriseEmailInput
+
+    def _run(self, latest_reply: str):
+        return categorise_email(latest_reply)
+
+    def _arun(self, latest_reply: str):
+        raise NotImplementedError("categorise_email does not support async")
+
+
+# WRITE EMAIL
+def generate_email_response(email_thread: str, category: str):
+    # URL endpoint
+    url = "https://api-f1db6c.stack.tryrelevance.com/latest/studios/6af484b0-a8bf-4545-91b8-75d46ac8f354/trigger_limited"
+
+    # Headers
+    headers = {
+        "Content-Type": "application/json"
+    }
+
+    # Payload (data)
+    data = {
+        "params": {
+            "client_email": email_thread,
+            "goal": "write email response" if category != "CONSULTING FOLLOW UP" else "for each consulting email, we need to collect 1. Their use case & the problem they are trying to solve 2. Their budget; Try to collect that info from them",
+        },
+        "project": "f86edbc1-fcb6-41f9-b9b6-be14a6f06412"
+    }
+
+    # Send the POST request
+    response = requests.post(url, headers=headers, json=data)
+
+    return response.text
+
+
+class GenerateEmailResponseInput(BaseModel):
+    """Inputs for generate_email_response"""
+    email_thread: str = Field(description="The original full email thread")
+    category: str = Field(
+        description='category of email, can ONLY be "CONSULTING FOLLOW UP" or "OTHER"')
+
+
+class GenerateEmailResponseTool(BaseTool):
+    name = "generate_email_response"
+    description = "use this to generate an email response based on AI Jason's specific guidelines, voice & tone & knowledge"
+    args_schema: Type[BaseModel] = GenerateEmailResponseInput
+
+    def _run(self, email_thread: str, category: str):
+        return generate_email_response(email_thread, category)
+
+    def _arun(self, email_thread: str, category: str):
+        raise NotImplementedError("generate_email_response does not support async")
+
+
+# RESEARCH AGENT
+
+def summary(objective, content):
+    text_splitter = RecursiveCharacterTextSplitter(
+        separators=["\n\n", "\n"], chunk_size=10000, chunk_overlap=500)
+    docs = text_splitter.create_documents([content])
+    map_prompt = """
+    Write a summary of the following text for {objective}:
+    "{text}"
+    SUMMARY:
+    """
+    map_prompt_template = PromptTemplate(
+        template=map_prompt, input_variables=["text", "objective"])
+
+    summary_chain = load_summarize_chain(
+        llm=llm,
+        chain_type='map_reduce',
+        map_prompt=map_prompt_template,
+        combine_prompt=map_prompt_template,
+        verbose=False
+    )
+
+    output = summary_chain.run(input_documents=docs, objective=objective)
+
+    return output
+
+
+def scrape_website(objective: str, url: str):
+    # Scrape a website, and summarise the content based on the objective if the content is too large;
+    # objective is the original objective & task that the user gives to the agent; url is the URL of the website to be scraped
+
+    # Define the headers for the request
+    headers = {
+        'Cache-Control': 'no-cache',
+        'Content-Type': 'application/json',
+    }
+
+    # Define the data to be sent in the request
+    data = {
+        "url": url
+    }
+
+    # Convert the Python object to a JSON string
+    data_json = json.dumps(data)
+
+    # Send the POST request
+    response = requests.post(
+        "https://chrome.browserless.io/content?token=xxxxxxxxxxxxxxxxxxxxxxxxxxx", headers=headers, data=data_json)
+
+    # Check the response status code
+    if response.status_code == 200:
+        soup = BeautifulSoup(response.content, "html.parser")
+        text = soup.get_text()
+        if len(text) > 10000:
+            output = summary(objective, text)
+            return output
+        else:
+            return text
+    else:
+        return f"HTTP request failed with status code {response.status_code}"
+
+
+class ScrapeWebsiteInput(BaseModel):
+    """Inputs for scrape_website"""
+    objective: str = Field(
+        description="The objective & task that the user gives to the agent")
+    url: str = Field(description="The url of the website to be scraped")
+
+
+class ScrapeWebsiteTool(BaseTool):
+    name = "scrape_website"
+    description = "useful when you need to get data from a website url, passing both url and objective to the function; DO NOT make up any url, the url should only be from the search results"
+    args_schema: Type[BaseModel] = ScrapeWebsiteInput
+
+    def _run(self, objective: str, url: str):
+        return scrape_website(objective, url)
+
+    def _arun(self, url: str):
+        raise NotImplementedError("scrape_website does not support async")
+
+
+def search(query):
+    url = "https://google.serper.dev/search"
+
+    payload = json.dumps({
+        "q": query
+    })
+
+    headers = {
+        'X-API-KEY': 'xxxxxxxxxxxxxxxxxxxxx',
+        'Content-Type': 'application/json'
+    }
+
+    response = requests.request("POST", url, headers=headers, data=payload)
+
+    return response.text
+
+
+def prospect_research(email_or_name: str, company: str):
+    tools = [
+        Tool(
+            name="Search",
+            func=search,
+            description="useful for when you need to answer questions about current events or data; you should ask targeted questions"
+        ),
+        ScrapeWebsiteTool(),
+    ]
+
+    system_message = SystemMessage(
+        content="""You are a world-class researcher, who can do detailed research on any topic and produce fact-based results;
+        you do not make things up, and you will try as hard as possible to gather facts & data to back up the research
+
+        Please make sure you complete the objective above with the following rules:
+        1/ You should do enough research to gather as much information as possible about the objective
+        2/ If there are urls of relevant links & articles, you will scrape them to gather more information
+        3/ After scraping & searching, you should think "are there any new things I should search & scrape based on the data I collected to increase research quality?"
+        If the answer is yes, continue; but don't do this more than 3 iterations
+        4/ You should not make things up, you should only write facts & data that you have gathered
+        5/ In the final output, you should include all reference data & links to back up your research"""
+    )
+
+    agent_kwargs = {
+        "extra_prompt_messages": [MessagesPlaceholder(variable_name="memory")],
+        "system_message": system_message,
+    }
+    memory = ConversationSummaryBufferMemory(
+        memory_key="memory", return_messages=True, llm=llm, max_token_limit=1000)
+
+    agent = initialize_agent(
+        tools,
+        llm,
+        agent=AgentType.OPENAI_FUNCTIONS,
+        verbose=False,
+        agent_kwargs=agent_kwargs,
+        memory=memory,
+    )
+
+    message = f"Research {company} and {email_or_name}; what does the company do, and who is the person?"
+
+    result = agent({"input": message})
+
+    return result
+
+
+class ProspectResearchInput(BaseModel):
+    """Inputs for prospect_research"""
+    email_or_name: str = Field(
+        description="The original email address or name of the prospect")
+    company: str = Field(description="The company name of the prospect")
+
+
+class ProspectResearchTool(BaseTool):
+    name = "prospect_research"
+    description = "useful when you need to research a prospect, passing both email and company to the function; returns a summary of the company as well as the prospect"
+    args_schema: Type[BaseModel] = ProspectResearchInput
+
+    def _run(self, email_or_name: str, company: str):
+        return prospect_research(email_or_name, company)
+
+    def _arun(self, email_or_name: str, company: str):
+        raise NotImplementedError("prospect_research does not support async")
+
+
+# ESCALATE
+
+def escalate(original_email_address: str, message: str, additional_context: str):
+    # URL to send the POST request to
+    url = 'https://hooks.zapier.com/hooks/catch/15616669/38qwq19/'
+
+    # Data to send in the POST request
+    data = {
+        "prospect email": original_email_address,
+        "prospect message": message,
+        "additional context": additional_context
+    }
+
+    # Send the POST request
+    response = requests.post(url, data=data)
+
+    # Check the response
+    if response.status_code == 200:
+        return 'This email has been escalated to Jason, he will take care of it from here; nothing needs to be done now'
+    else:
+        return f'Failed to send POST request: {response.status_code}'
+
+
+class EscalateInput(BaseModel):
+    """Inputs for escalate"""
+    message: str = Field(
+        description="The original email thread & message that was received; cc the original copy for escalation")
+    original_email_address: str = Field(
+        description="The email address that sent the message/email")
+    additional_context: str = Field(
+        description="additional context about the prospect, can be the company/prospect background research OR the consulting request details like use case, budget, etc.")
+
+
+class EscalateTool(BaseTool):
+    name = "escalate_to_jason"
+    description = "useful when you need to escalate the case to jason or others, passing both message and original_email_address to the function"
+    args_schema: Type[BaseModel] = EscalateInput
+
+    def _run(self, original_email_address: str, message: str, additional_context: str):
+        return escalate(original_email_address, message, additional_context)
+
+    def _arun(self, original_email_address: str, message: str, additional_context: str):
+        raise NotImplementedError("escalate_to_jason does not support async")
+
+
+# REPLY EMAIL
+def reply_email(message: str, email_address: str, subject: str):
+    # URL to send the POST request to
+    url = 'https://hooks.zapier.com/hooks/catch/15616669/38qaaau/'
+
+    # Data to send in the POST request
+    data = {
+        "Email": email_address,
+        "Subject": subject,
+        "Reply": message
+    }
+
+    # Send the POST request
+    response = requests.post(url, data=data)
+
+    # Check the response
+    if response.status_code == 200:
+        return f'An email has been sent to {email_address}'
+    else:
+        return f'Failed to send POST request: {response.status_code}'
+
+
+class ReplyEmailInput(BaseModel):
+    """Inputs for reply_email"""
+    message: str = Field(
+        description="The generated response message to be sent to the email address")
+    email_address: str = Field(
+        description="Destination email address to send the email to")
+    subject: str = Field(description="subject of the email")
+
+
+class ReplyEmailTool(BaseTool):
+    name = "reply_email"
+    description = "use this to send emails"
+    args_schema: Type[BaseModel] = ReplyEmailInput
+
+    def _run(self, message: str, email_address: str, subject: str):
+        return reply_email(message, email_address, subject)
+
+    def _arun(self, message: str, email_address: str, subject: str):
+        raise NotImplementedError("reply_email does not support async")
+
+
+# CREATE EMAIL DRAFT
+def create_email_draft(prospect_email_address: str, subject: str, generated_reply: str):
+    # URL to send the POST request to
+    url = 'https://hooks.zapier.com/hooks/catch/15616669/38ikw12/'
+
+    # Data to send in the POST request
+    data = {
+        "email": prospect_email_address,
+        "subject": subject,
+        "reply": generated_reply
+    }
+
+    # Send the POST request
+    response = requests.post(url, data=data)
+
+    # Check the response
+    if response.status_code == 200:
+        return 'Email draft has been created successfully'
+    else:
+        return f'Failed to send POST request: {response.status_code}'
+
+
+class CreateEmailDraftInput(BaseModel):
+    """Inputs for create_email_draft"""
+    prospect_email_address: str = Field(
+        description="The prospect's email address")
+    subject: str = Field(description="The original email subject")
+    generated_reply: str = Field(
+        description="Generated email reply to the prospect")
+
+
+class CreateEmailDraftTool(BaseTool):
+    name = "create_email_draft"
+    description = "use this to create an email draft for jason to review & send"
+    args_schema: Type[BaseModel] = CreateEmailDraftInput
+
+    def _run(self, prospect_email_address: str, subject: str, generated_reply: str):
+        return create_email_draft(prospect_email_address, subject, generated_reply)
+
+    def _arun(self, prospect_email_address: str, subject: str, generated_reply: str):
+        raise NotImplementedError("create_email_draft does not support async")
diff --git a/email_cleaning.py b/email_cleaning.py
new file mode 100644
index 0000000..76a3cc1
--- /dev/null
+++ b/email_cleaning.py
@@ -0,0 +1,64 @@
+import os
+from dotenv import find_dotenv, load_dotenv
+import openai
+import json, csv
+
+load_dotenv(find_dotenv())
+openai.api_key = os.environ.get("OPENAI_API_KEY")
+
+def parse_email(email_thread):
+
+    system_prompt = """
+    You are an expert at converting a raw email thread into original message / reply pairs.
+    You are given a raw email thread that Jason replied to; your goal is to convert it into original message / reply pairs.
+
+    - original_message: the last message sent to Jason; if it is a long email thread, only take the last message
+    - jason_reply: Jason's reply to the original message
+
+    If there is only one message in the thread, that should be jason_reply.
+
+    The exported format should look something like:
+    {
+        "original_message": "xxxx",
+        "jason_reply": "xxxx"
+    }
+    """
+
+    response = openai.ChatCompletion.create(
+        model="gpt-4",
+        messages=[
+            {"role": "system", "content": system_prompt},
+            {"role": "user", "content": email_thread}
+        ]
+    )
+
+    return response["choices"][0]["message"]["content"]
+
+def process_csv(input_csv_path, output_csv_path):
+    with open(input_csv_path, newline='', encoding='utf-8') as csvfile:
+        csv_reader = csv.DictReader(csvfile)
+        processed_data = []
+
+        for row in csv_reader:
+            text = row['Body']  # Get the text from the 'Body' column
+            json_string = parse_email(text)
+            print(json_string)
+            json_data = json.loads(json_string)  # Convert the JSON string to a dictionary
+            original_message = json_data.get('original_message', '')
+            jason_reply = json_data.get('jason_reply', '')
+            # Append the extracted pair to processed_data
+            processed_data.append([original_message, jason_reply])
+
+    # Write the processed data to a new CSV file
+    with open(output_csv_path, mode='w', newline='', encoding='utf-8') as csvfile:
+        csv_writer = csv.writer(csvfile)
+        # Write the header
+        csv_writer.writerow(['original_message', 'jason_reply'])
+        # Write the data rows
+        csv_writer.writerows(processed_data)
+
+# Paths to your input and output CSV files
+input_csv_path = 'past_email_mbox.csv'  # output of mbox_to_csv.py
+output_csv_path = 'email_pairs.csv'
+
+# Call the function to process the CSV file
+process_csv(input_csv_path, output_csv_path)
diff --git a/extract_faq.py b/extract_faq.py
new file mode 100644
index 0000000..96649a6
--- /dev/null
+++ b/extract_faq.py
@@ -0,0 +1,96 @@
+import csv
+import json
+from dotenv import load_dotenv
+from langchain.prompts import PromptTemplate
+from langchain.chat_models import ChatOpenAI
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain.chains.summarize import load_summarize_chain
+
+load_dotenv()
+llm = ChatOpenAI(temperature=0, model_name="gpt-4")
+
+def load_csv(file_path):
+    # Create a list to hold the rows as dictionaries
+    data_list = []
+
+    # Open the CSV file and read its content
+    with open(file_path, 'r') as csv_file:
+        csv_reader = csv.DictReader(csv_file)
+
+        # For each row, append it as a dictionary to the list
+        for row in csv_reader:
+            data_list.append(row)
+
+    return data_list
+
+def extract_faq(text_data):
+    text_splitter = RecursiveCharacterTextSplitter(
+        chunk_size=3000,
+        chunk_overlap=20,
+        length_function=len,
+        is_separator_regex=False)
+
+    texts = text_splitter.split_text(text_data)
+    docs = text_splitter.create_documents(texts)
+
+    map_prompt = """
+    PAST EMAILS:
+    {text}
+    ----
+
+    You are a smart AI assistant; above are some past emails from AI Jason (an AI youtuber).
+    Your goal is to learn & extract common FAQs about AI Jason
+    (include both question & answer, return the results in JSON):
+    """
+    map_prompt_template = PromptTemplate(template=map_prompt, input_variables=["text"])
+
+    combine_prompt = """
+    The following is a set of FAQs about AI Jason (an AI youtuber):
+    {text}
+    Take these and distill them into a final, consolidated array of FAQs,
+    including both question & answer (in JSON format).
+
+    Array of FAQs:
+    """
+    combine_prompt_template = PromptTemplate(template=combine_prompt, input_variables=["text"])
+
+    summary_chain = load_summarize_chain(llm=llm,
+                                         chain_type='map_reduce',
+                                         map_prompt=map_prompt_template,
+                                         combine_prompt=combine_prompt_template,
+                                         verbose=True
+                                         )
+
+    output = summary_chain.run(docs)
+    faqs = json.loads(output)
+
+    return faqs
+
+def save_json_to_csv(data, file_name):
+    with open(file_name, mode='w', newline='', encoding='utf-8') as file:
+        # Get the keys (column names) from the first dictionary in the list
+        fieldnames = data[0].keys()
+
+        # Create a CSV dict writer object
+        writer = csv.DictWriter(file, fieldnames=fieldnames)
+
+        # Write the header row
+        writer.writeheader()
+
+        # Write the data rows
+        for entry in data:
+            writer.writerow(entry)
+
+
+# Load the cleaned email pairs
+past_emails = load_csv("email_pairs.csv")
+
+# Extract Jason's replies
+jasons_replies = [entry["jason_reply"] for entry in past_emails]
+jasons_replies_string = json.dumps(jasons_replies)
+
+faqs = extract_faq(jasons_replies_string)
+
+save_json_to_csv(faqs, "faq.csv")
diff --git a/mbox_to_csv.py b/mbox_to_csv.py
new file mode 100644
index 0000000..9941ced
--- /dev/null
+++ b/mbox_to_csv.py
@@ -0,0 +1,43 @@
+import mailbox
+import csv
+
+def get_body(message):
+    # Walk multipart messages and return the first text/plain payload found
+    if message.is_multipart():
+        for part in message.walk():
+            if part.is_multipart():
+                for subpart in part.walk():
+                    if subpart.get_content_type() == 'text/plain':
+                        return subpart.get_payload(decode=True)
+            elif part.get_content_type() == 'text/plain':
+                return part.get_payload(decode=True)
+    else:
+        return message.get_payload(decode=True)
+
+def mbox_to_csv(mbox_file_path, csv_file_path):
+    mbox = mailbox.mbox(mbox_file_path)
+
+    with open(csv_file_path, mode='w', newline='', encoding='utf-8') as file:
+        writer = csv.writer(file)
+        writer.writerow(['Subject', 'From', 'Date', 'To', 'Message-ID', 'Body'])
+
+        for message in mbox:
+            body = get_body(message)  # Get the message body using the get_body function
+            if body:
+                body = body.decode('utf-8', errors='replace').replace('\n', ' ').replace('\r', '')
+            else:
+                body = ''
+            writer.writerow([
+                message['subject'],
+                message['from'],
+                message['date'],
+                message['to'],
+                message['message-id'],
+                body
+            ])
+
+# Usage
+mbox_file_path = 'Sent.mbox'  # replace with the path to your MBOX file
+csv_file_path = 'past_email_mbox.csv'  # replace with the desired path for the output CSV file
+mbox_to_csv(mbox_file_path, csv_file_path)