-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathstrawcog.py
More file actions
158 lines (135 loc) · 7.96 KB
/
strawcog.py
File metadata and controls
158 lines (135 loc) · 7.96 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
# hey! this file is used to set up web scraping for StrawBot's "One Piece" related group of reference commands, in particular op_wiki and ch_sum.
# op_wiki will grab information and an image about a given search term (if found) from the One Piece Fandom Wiki
# ch_sum will grab the short summary of a chapter (if found) from the One Piece Fandom Wiki
class StrawCog(commands.Cog):
    """Cog providing One Piece reference commands backed by the One Piece Fandom Wiki.

    Commands:
        op_wiki: look up a wiki article and reply with an embed (description,
                 thumbnail, and — for characters — bounty and age).
        ch_sum:  reply with the short summary of a given chapter.
    """

    # Matches any HTML tag so it can be stripped from scraped markup.
    _TAG_RE = re.compile(r"<.*?>")
    # Matches bracketed/parenthesised asides such as citation markers "[1]".
    _ASIDE_RE = re.compile(r"[\(\[].*?[\)\]]")

    def __init__(self):
        # Shared async HTTP client so wiki requests don't block the bot's
        # event loop (the previous blocking requests.get stalled all commands).
        self.httpx_client = AsyncClient()

    @staticmethod
    def _normalize_search_term(search_term):
        """Turn the raw command arguments into the exact article title the wiki expects.

        The wiki only resolves exact titles, so: Title Case everything, keep the
        particle "no" lowercase in romanized devil-fruit names ("Mera Mera no Mi"),
        and upper-case the known abbreviations CP9/CP0/SSG.
        """
        joined = " ".join(search_term).title()  # Article Titles Traditionally Follow a Pattern Such as This
        chars = []
        for i, ch in enumerate(joined):
            if i == 0:
                chars.append(ch.upper())
            # devil fruits are romanized as "X X no Mi" (e.g. Mera Mera no Mi,
            # meaning Flame Flame Fruit) — keep that "no" lowercase
            elif joined[i:i + 3].upper() == "NO ":
                chars.append(ch.lower())
            else:
                chars.append(ch)
        joined = "".join(chars)
        # common abbreviations that must be fully capitalized to be recognized
        if joined.lower() in ("cp9", "cp0", "ssg"):
            joined = joined.upper()
        return joined

    @classmethod
    def _clean_text(cls, element):
        """Strip HTML tags and bracketed citations from a scraped element.

        Converts to str() first — re.sub requires a string, and passing a
        BeautifulSoup Tag directly raises TypeError.
        """
        text = cls._TAG_RE.sub("", str(element))
        return cls._ASIDE_RE.sub("", text)

    @staticmethod
    def _extract_bounty(soup):
        """Return the most recent bounty string from the infobox, or None.

        The leading label (first 8 characters of the cell text) is dropped;
        the most recent bounty is formatted as BOUNTY[Citation Number], so the
        text before the first citation bracket is returned. If no bracket is
        present, None is returned (matching the original behaviour).
        """
        bounty_element = soup.find('div', attrs={'class': 'pi-item', 'data-source': 'bounty'})
        if not bounty_element:
            return None
        bounty_strip = bounty_element.text.strip()[8:]
        bracket = bounty_strip.find("[")
        return bounty_strip[:bracket] if bracket != -1 else None

    @staticmethod
    def _extract_age(soup):
        """Return the character's age string, or None if the article has no age.

        Living characters use the infobox "age" field; dead characters use
        "age2" and get a " (DEAD)" suffix. The slice offsets drop the leading
        field labels (5 and 14 chars respectively — matches the wiki's infobox
        text layout; verify if the wiki markup changes).
        """
        age_element = soup.find('div', attrs={'class': 'pi-item', 'data-source': 'age'})
        age2_element = soup.find('div', attrs={'class': 'pi-item', 'data-source': 'age2'})
        if age_element and not age2_element:
            age = age_element.text.strip()[5:]
            for i in range(len(age)):
                # ancient beings are listed as "Over 1000[Citation Number]"
                if age[i:i + 2].lower() == "ov":
                    return "Over 1000"
                if "(a" in age:
                    # characters that lived through the timeskip are formatted
                    # "(AGE-2) (pre-timeskip) AGE (after timeskip)[Citation Number]"
                    if age[i:i + 2] == "(a":
                        return age[i - 3:i]
                else:
                    # characters that died before the 2-year timeskip are
                    # formatted "AGE[Citation Number]"
                    if age[i] == "[":
                        return age[:i]
            return age
        if age2_element:
            age = age2_element.text.strip()[14:]
            for i in range(len(age)):
                # covers characters that died before or after the timeskip
                if age[i] == "[" or age[i] == "(":
                    return age[:i] + " (DEAD)"
            return age
        return None

    @commands.command()
    async def op_wiki(self, ctx, *search_term):
        """ -Returns a One Piece Wiki article"""
        if not search_term:
            await ctx.reply("Please input a search term")
            return
        # search term needs to match EXACTLY with the title of the article,
        # otherwise the article will not be found; normalizing turns what
        # would be misses into hits
        joined_search_term = self._normalize_search_term(search_term)
        url = f"https://onepiece.fandom.com/wiki/{joined_search_term.replace(' ', '_')}"
        # async request via the shared client; follow redirects so wiki title
        # redirects behave like the old requests.get default
        response = await self.httpx_client.get(url, follow_redirects=True)
        if response.status_code != 200:
            # invalid search term
            embed = discord.Embed(
                title="One Piece Wiki <a:StrawHat:1108291618441789460>",
                description=f"Could not find an article for: {joined_search_term}",
                color=0xFF0000,
            )
            await ctx.reply(embed=embed)
            return
        soup = BeautifulSoup(response.content, 'html.parser')
        for data in soup(['style', 'script']):
            data.decompose()
        # primary description of the article: the lead is usually the second <p>;
        # guard against short/odd pages instead of raising IndexError
        paragraphs = soup.find_all('p')
        description = self._clean_text(paragraphs[1]) if len(paragraphs) > 1 else ""
        # thumbnail, if the infobox has one
        image_url = None
        image_element = soup.find('img', class_='pi-image-thumbnail')
        if image_element:
            image_url = urljoin(url, image_element['src'])
        embed = discord.Embed(
            title="One Piece Wiki <a:StrawHat:1108291618441789460>",
            description=description,
            url=url,
            color=0xFF0000,
        )
        embed.set_image(url=image_url)
        current_bounty = self._extract_bounty(soup)
        age = self._extract_age(soup)
        if current_bounty is not None and age is not None:
            # article is about a pirate with a known age
            embed.set_footer(text=f"BOUNTY: {current_bounty} | AGE: {age}", icon_url="https://cdn.discordapp.com/emojis/572643868726525952.png?v=1")
        elif current_bounty is not None:
            # article is about a pirate with unknown age
            embed.set_footer(text=f"BOUNTY: {current_bounty}", icon_url="https://cdn.discordapp.com/emojis/572643868726525952.png?v=1")
        elif age is not None:
            # article is about a non-pirate with a known age
            embed.set_footer(text=f"AGE: {age}", icon_url="https://cdn.discordapp.com/emojis/868749522724085780.png?v=1")
        try:
            await ctx.reply(embed=embed)
        except Exception:
            # fandom occasionally serves pages Discord's embed fetcher rejects;
            # fall back to an apology embed with a direct link
            error = "The page you requested *is* valid, but the fandom client has issues on its end preventing the request from being properly processed. You can press the hyperlink above to go directly to the article instead if you'd like. Sorry!"
            embed = discord.Embed(title="One Piece Wiki <a:StrawHat:1108291618441789460>", description=error, url=url, color=0xFF0000)
            embed.set_image(url='https://media.tenor.com/Vs9QNG3lQZUAAAAS/luffy-one-piece.gif')  # sad gif :(
            await ctx.reply(embed=embed)

    @commands.command()
    async def ch_sum(self, ctx, chapter_number):
        """ -Returns a One Piece chapter's summary"""
        if not chapter_number or not chapter_number.isnumeric():
            return
        url = f"https://onepiece.fandom.com/wiki/Chapter_{chapter_number}"
        response = await self.httpx_client.get(url, follow_redirects=True)
        if response.status_code != 200:
            # chapter page not found — keep the original silent no-op
            return
        soup = BeautifulSoup(response.content, 'html.parser')
        for data in soup(['style', 'script']):
            data.decompose()
        # the short summary lives in the 4th and 5th <p> of a chapter page;
        # guard against layout changes instead of raising IndexError
        paragraphs = soup.find_all('p')
        if len(paragraphs) < 5:
            return
        summary = f"{paragraphs[3]}\n{paragraphs[4]}"
        summary = self._TAG_RE.sub("", summary)
        summary = self._ASIDE_RE.sub("", summary)
        await ctx.reply(summary)