From 3a4383bfad1797763018661b86e97d1d00070dc3 Mon Sep 17 00:00:00 2001
From: CryZFix <cryzfix@gmail.com>
Date: Tue, 14 Nov 2023 14:08:49 +0400
Subject: [PATCH] Fix shanghaifantasy source - Fix parsing of the total
 chapter count - Fetch chapter content through the WP JSON posts API

---
 sources/en/s/shanghaifantasy.py | 16 ++++++++++++++--
 1 file changed, 14 insertions(+), 2 deletions(-)

diff --git a/sources/en/s/shanghaifantasy.py b/sources/en/s/shanghaifantasy.py
index fb59b37f1..3af3f5eb2 100644
--- a/sources/en/s/shanghaifantasy.py
+++ b/sources/en/s/shanghaifantasy.py
@@ -1,5 +1,6 @@
 # -*- coding: utf-8 -*-
 import logging
+import re
 
 from lncrawl.core.crawler import Crawler
 
@@ -15,7 +16,10 @@ def read_novel_info(self):
         soup = self.get_soup(self.novel_url)
 
         novel_id = soup.select_one("div#likebox").attrs["data-novel"]
-        total_chapters = soup.select("div.grid p.text-sm")[1].text.split(": ")[1]
+        total_chapters_text = soup.select("div.grid p.text-sm")[1].text.split(": ")[1]
+        total_chapters = sum(int(num) for num in re.findall(r"\b\d+\b", total_chapters_text))
+        if total_chapters == 0:
+            total_chapters = 999
         get_novel_json = self.get_response(self.wp_json_novel % novel_id).json()
 
         novel_title = get_novel_json["title"]["rendered"]
@@ -48,5 +52,13 @@ def read_novel_info(self):
 
     def download_chapter_body(self, chapter):
         soup = self.get_soup(chapter["url"])
-        content = soup.select_one("div.contenta")
+        possible_chap_id = soup.select_one("a.comment-reply-link")
+        if possible_chap_id:
+            chap_id = possible_chap_id.attrs["data-postid"]
+        else:
+            possible_chap_id = soup.select_one("input#comment_post_ID")
+            chap_id = possible_chap_id.attrs["value"]
+        data = self.get_json("https://shanghaifantasy.com/wp-json/wp/v2/posts/%s" % chap_id)["content"]["rendered"]
+        soup = self.make_soup(data.replace("\n", " "))
+        content = soup.find("body")
         return self.cleaner.extract_contents(content)