ProjectManager/conversation_analyzer.py at main · tinycrops/ProjectManager · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
#!/usr/bin/env python3
import json
import os
import subprocess
import argparse
from dotenv import load_dotenv
from google import genai

# Import the export functions from discord-export.py
from discord_export import (
    check_docker, export_discord_channel, compress_conversation,
    load_last_timestamp, save_last_timestamp, get_most_recent_timestamp
)

def setup_gemini_model():
    """Configure and return Gemini model instance."""
    load_dotenv()
    api_key = os.getenv("GEMINI_API_KEY")
    if not api_key:
        raise ValueError("GEMINI_API_KEY not found in environment variables")

    client = genai.Client(api_key=api_key)

    # Create a chat with the model
    chat = client.chats.create(
        model="gemini-2.0-flash",
        config=genai.types.GenerateContentConfig(
            system_instruction="You are an AI assistant that analyzes Discord conversation data. Provide insights, summaries, and answer questions about the conversations.",
            max_output_tokens=8192,
            temperature=1,
            top_p=0.95,
            top_k=40
        )
    )

    return chat

def analyze_conversation(chat_session, conversation_summary):
    """Interactive conversation analysis with Gemini."""
    # Initial context setting
    context_prompt = f"""Here's a Discord conversation summary to analyze. I'll be asking questions about it:

{conversation_summary}

Please keep your responses focused on the content of this conversation."""

    response = chat_session.send_message(context_prompt)

    print("\nConversation loaded! You can now ask questions about it.")
    print("Type 'quit' or 'exit' to end the session.\n")

    while True:
        question = input("\nWhat would you like to know about the conversation? > ")

        if question.lower() in ['quit', 'exit']:
            break

        try:
            response = chat_session.send_message(question)
            print("\nAnalysis:", response.text)
        except Exception as e:
            print(f"\nError getting response: {e}")

def main():
    parser = argparse.ArgumentParser(description='Export Discord chat and analyze with Gemini')
    parser.add_argument('channel_id', help='Discord channel ID to export')
    parser.add_argument('-o', '--output', help='Output filename', default='analysis_report.md')
    parser.add_argument('--start-date', help='Start date in ISO format (e.g., "2023-01-01")')
    parser.add_argument('--end-date', help='End date in ISO format (e.g., "2023-12-31")')
    parser.add_argument('--force-full', action='store_true', help='Force full export instead of incremental')
    args = parser.parse_args()

    # Load environment variables
    load_dotenv()
    discord_token = os.getenv('DISCORD_TOKEN')

    if not discord_token:
        print("Error: DISCORD_TOKEN not found in .env file")
        return

    # Set up directories
    output_dir = os.path.join(os.getcwd(), "team_chat")
    os.makedirs(output_dir, exist_ok=True)

    # Determine start date for export
    start_date = args.start_date
    if not start_date and not args.force_full:
        start_date = load_last_timestamp(args.channel_id)
        if start_date:
            print(f"Performing incremental export from {start_date}")
        else:
            print("No previous timestamp found. Performing full export.")

    # Export Discord chat
    if not check_docker():
        return

    if not export_discord_channel(args.channel_id, output_dir, discord_token,
                                start_date, args.end_date):
        return

    # Process exported JSON
    print("Waiting for export to complete...")
    import time
    time.sleep(5)  # Increased delay to 5 seconds

    json_files = [f for f in os.listdir(output_dir) if f.endswith('.json')]
    matching_files = [f for f in json_files if args.channel_id in f]

    if not matching_files:
        print(f"Error: No JSON file found containing channel ID: {args.channel_id}")
        return

    json_path = os.path.join(output_dir, matching_files[0])
    print(f"Processing exported conversation from: {json_path}")

    try:
        with open(json_path, "r", encoding="utf-8") as f:
            conversation = json.load(f)

        # Save the most recent timestamp for next time
        latest_timestamp = get_most_recent_timestamp(conversation)
        if latest_timestamp:
            save_last_timestamp(args.channel_id, latest_timestamp)
            print(f"Saved latest message timestamp: {latest_timestamp}")

    except (json.JSONDecodeError, FileNotFoundError) as e:
        print(f"Error processing JSON file: {e}")
        return

    # Compress conversation and analyze with Gemini
    print("Compressing conversation...")
    summary = compress_conversation(conversation)

    print("Initializing Gemini model...")
    chat_session = setup_gemini_model()

    print("Starting interactive analysis...")
    try:
        analyze_conversation(chat_session, summary)
    except Exception as e:
        print(f"Error during interactive session: {e}")
        return

    # Add final delay to ensure Gemini completes
    time.sleep(2)

if __name__ == "__main__":
    main()