Rename to guilddump + add role dump + add embed dump

2025-05-09 12:15:10 +02:00 · 2022-05-08 18:45:18 +02:00 · 2022-05-08 18:45:18 +02:00 · ca0231f038
commit ca0231f038
parent f542b5bdd0
2 changed files with 58 additions and 22 deletions
--- a/README.md
+++ b/README.md
@ -1,11 +1,11 @@
-# GuildSC
+# GuildDump
-A `python3` driven tool for scraping messages, channels and members of discord servers.
+A `python3` driven tool for dumping messages, channels and members of discord servers.
 ## Setup
-The server you want to scrape must contain a bot within your control (or at least you have to know the token of the bot).
+The server you want to dump must contain a bot within your control (or at least you have to know the token of the bot).
-The bot also needs the `member` intent to enabled in order to scrape members.
+The bot also needs the `member` intent to be enabled in order to dump members.
 You need these additional `pip3` requirements:
 ```shell
@ -16,8 +16,8 @@ $ pip3 install discord.py simple_term_menu
 You can download the script or run it with this:
 ```shell
-$ curl -s https://raw.githubusercontent.com/ByteDream/guildsc/main/guildsc.py -o guildsc.py
+$ curl -s https://raw.githubusercontent.com/ByteDream/guildsc/main/guildsc.py -o guilddump.py
-$ python3 guildsc.py
+$ python3 guilddump.py
 ```
 ## License
--- a/guilddump.py
+++ b/guilddump.py
@ -146,7 +146,7 @@ async def request_max_messages() -> int:
    return int(await input_prompt(f'Max messages to fetch per channel (default: 1000): ', default='1000', checker=checker))
-async def scrape_channels(guild: discord.Guild, channel_writer):
+async def dump_channels(guild: discord.Guild, channel_writer):
    channel_writer.writerow(['id', 'created_at', 'name', 'type'])
    for channel in await guild.fetch_channels():
@ -168,8 +168,8 @@ async def scrape_channels(guild: discord.Guild, channel_writer):
        ])
-async def scrape_members(guild: discord.Guild, limit: int, user_writer):
+async def dump_members(guild: discord.Guild, limit: int, user_writer):
-    user_writer.writerow(['id', 'joined_at', 'name', 'nick', 'premium_since'])
+    user_writer.writerow(['id', 'joined_at', 'name', 'nick', 'is_bot', 'premium_since'])
    async for member in guild.fetch_members(limit=limit):
        user_writer.writerow([
@ -177,14 +177,32 @@ async def scrape_members(guild: discord.Guild, limit: int, user_writer):
            int(time.mktime(member.joined_at.timetuple())),
            str(member),
            member.nick,
            member.bot,
            int(time.mktime(member.premium_since.timetuple())) if member.premium_since else 0
        ])
-async def scrape_messages(channel: discord.TextChannel, limit: int, message_writer, attachment_writer, reaction_writer):
+async def dump_roles(guild: discord.Guild, role_writer):
-    message_writer.writerow(['id', 'author_id', 'created_at', 'modified at', 'content'])
+    role_writer.writerow(['id', 'created_at', 'name', 'position', 'permissions', 'member_count', 'is_mentionable', 'color'])
-    attachment_writer.writerow(['message_id', 'type', 'size', 'filename', 'url', 'spoiler'])
+
-    reaction_writer.writerow(['message_id', 'name', 'reaction_count', 'animated'])
+    for role in await guild.fetch_roles():
        role_writer.writerow([
            role.id,
            role.created_at,
            role.name,
            role.position,
            role.permissions,
            len(role.members),
            role.mentionable,
            role.color
        ])
 async def dump_messages(channel: discord.TextChannel, limit: int, message_writer, attachment_writer, reaction_writer, embed_writer):
    message_writer.writerow(['id', 'author_id', 'created_at', 'modified_at', 'content'])
    attachment_writer.writerow(['message_id', 'type', 'size', 'filename', 'url', 'is_spoiler'])
    reaction_writer.writerow(['message_id', 'name', 'reaction_count', 'is_animated'])
    embed_writer.writerow(['message_id', 'title', 'description', 'footer', 'image', 'thumbnail', 'video', 'author', 'field_count', 'color'])
    async for message in channel.history(limit=limit):
        message_writer.writerow([
@ -212,6 +230,20 @@ async def scrape_messages(channel: discord.TextChannel, limit: int, message_writ
                    reaction.count,
                    False if isinstance(reaction.emoji, str) else reaction.emoji.animated
                ])
        if message.embeds:
            for embed in message.embeds:
                embed_writer.writerow([
                    message.id,
                    embed.title if embed.title else None,
                    embed.description if embed.description else None,
                    embed.footer.text if embed.footer else None,
                    embed.image.url if embed.image else None,
                    embed.thumbnail.url if embed.thumbnail else None,
                    embed.video.url if embed.video else None,
                    embed.author.name if embed.author else None,
                    len(embed.fields),
                    embed.color if embed.color else None
                ])
 async def main():
@ -231,25 +263,29 @@ async def main():
        selected_channels = await request_channels(guild)
-        print('Starting scraping, this make take a while...')
+        print('Starting dumping, this make take a while...')
        with directory.joinpath('channels.csv').open('w+') as channels:
-            await scrape_channels(guild, csv.writer(channels))
+            await dump_channels(guild, csv.writer(channels))
-            print('Scraped channels')
+            print('Dumped channels')
        with directory.joinpath('members.csv').open('w+') as members:
-            await scrape_members(guild, max_members, csv.writer(members))
+            await dump_members(guild, max_members, csv.writer(members))
-            print('Scraped members')
+            print('Dumped members')
        with directory.joinpath('roles.csv').open('w+') as roles:
            await dump_roles(guild, csv.writer(roles))
            print('Dumped roles')
        for channel in selected_channels:
            if isinstance(channel, discord.TextChannel):
                dir = directory.joinpath(str(channel.id))
                dir.mkdir()
-                with dir.joinpath('messages.csv').open('w+') as messages, dir.joinpath('attachments.csv').open('w+') as attachments, dir.joinpath('reactions.csv').open('w+') as reactions:
+                with dir.joinpath('messages.csv').open('w+') as messages, dir.joinpath('attachments.csv').open('w+') as attachments, dir.joinpath('reactions.csv').open('w+') as reactions, dir.joinpath('embeds.csv').open('w+') as embeds:
-                    await scrape_messages(channel, max_messages, csv.writer(messages), csv.writer(attachments), csv.writer(reactions))
+                    await dump_messages(channel, max_messages, csv.writer(messages), csv.writer(attachments), csv.writer(reactions), csv.writer(embeds))
-                    print(f'Scraped channel {channel.id} (#{channel.name})')
+                    print(f'Dumped channel {channel.id} (#{channel.name})')
-        print('Finished scraping')
+        print('Finished dumping')
    finally:
        await client.close()