Compare commits

...

2 Commits

Author SHA1 Message Date
80c115b57d embedded datasets 2025-08-11 01:51:43 +01:00
aa9f2dc618 updated embedder 2025-08-11 01:51:34 +01:00
10 changed files with 6976 additions and 6976 deletions

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

View File

@@ -1 +1 @@
message_id,timestamp_utc,author_id,author_name,author_nickname,content,attachment_urls,embeds message_id,timestamp_utc,author_id,author_name,author_nickname,content,attachment_urls,embeds
1 message_id timestamp_utc author_id author_name author_nickname content attachment_urls embeds

File diff suppressed because one or more lines are too long

View File

@@ -1 +1 @@
message_id,timestamp_utc,author_id,author_name,author_nickname,content,attachment_urls,embeds message_id,timestamp_utc,author_id,author_name,author_nickname,content,attachment_urls,embeds
1 message_id timestamp_utc author_id author_name author_nickname content attachment_urls embeds

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

File diff suppressed because one or more lines are too long

View File

@@ -100,11 +100,11 @@ def process_csvs_in_directory(directory_path: str, model_name: str = 'all-MiniLM
if __name__ == '__main__': if __name__ == '__main__':
# Define the directory where your CSV files are located. # Define the directory where your CSV files are located.
# The script will look for a folder named 'csv_data' in the current directory. # The script will look for a folder named 'csv_data' in the current directory.
CSV_DIRECTORY = 'csv_data' CSV_DIRECTORY = '../discord_chat_logs'
# This function will create the 'csv_data' directory and some sample # This function will create the 'csv_data' directory and some sample
# files if they don't exist. You can comment this out if you have your own files. # files if they don't exist. You can comment this out if you have your own files.
create_sample_files(CSV_DIRECTORY) # create_sample_files(CSV_DIRECTORY)
# Run the main processing function on the directory # Run the main processing function on the directory
process_csvs_in_directory(CSV_DIRECTORY) process_csvs_in_directory(CSV_DIRECTORY)