Merge pull request #74 from Dimlitter/rootphantomer/issue73

rootphantomer · web-flow · commit 3d9399c10eeb · 2025-04-09T17:00:18.000+08:00
爬取评论的脚本jdspider
diff --git a/auto_comment_plus.py b/auto_comment_plus.py
@@ -323,7 +323,7 @@ def ordinary(N, opts=None):
                     "pid_data: %s,这个订单估计是京东外卖的，会导致此次评价失败，请把该 %s 商品手工评价后再运行程序。"
                     % (pid, oname),
                 )
-                exit(0)
+                continue
             opts["logger"].info(f"\t{i}.开始评价订单\t{oname}[{oid}]并晒图")
             url2 = "https://club.jd.com/myJdcomments/saveProductComment.action"
             opts["logger"].debug("URL: %s", url2)
diff --git a/config.yml b/config.yml
@@ -1,2 +1,2 @@
 user:
-  cookie: "''"
+  cookie: ''' '''
diff --git a/jdspider.py b/jdspider.py
@@ -33,7 +33,7 @@ def __init__(self, categlory):
         self.startUrl = "https://search.jd.com/Search?keyword=%s&enc=utf-8" % (
             quote(categlory)
         )
-        self.commentBaseUrl = "https://sclub.jd.com/comment/productPageComments.action?"
+        self.commentBaseUrl = "https://api.m.jd.com/?"
         self.headers = {
             "accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,"
             "*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
@@ -74,15 +74,20 @@ def __init__(self, categlory):
         self.iplist = {"http": [], "https": []}
 
     def getParamUrl(self, productid: str, page: str, score: str):
-        params = {  # 用于控制页数，页面信息数的数据，非常重要，必不可少，要不然会被JD识别出来，爬不出相应的数据。
-            "productId": "%s" % productid,
-            "score": "%s" % score,  # 1表示差评，2表示中评，3表示好评
-            "sortType": "5",
-            "page": "%s" % page,
-            "pageSize": "10",
-            "isShadowSku": "0",
-            "rid": "0",
-            "fold": "1",
+        params = {
+            "appid": "item-v3",
+            "functionId": "pc_club_productPageComments",
+            "client": "pc",
+            "body": {  # 用于控制页数，页面信息数的数据，非常重要，必不可少，要不然会被JD识别出来，爬不出相应的数据。
+                "productId": "%s" % productid,
+                "score": "%s" % score,  # 1表示差评，2表示中评，3表示好评
+                "sortType": "5",
+                "page": "%s" % page,
+                "pageSize": "10",
+                "isShadowSku": "0",
+                "rid": "0",
+                "fold": "1",
+            },
         }
         default_logger.info("params:" + str(params))
         url = self.commentBaseUrl + urlencode(params)
@@ -148,7 +153,7 @@ def getData(
                     default_logger.info(
                         "爬取商品评价的 url 链接是" + url + "，商品的 id 是：" + id_
                     )
-                    response = requests.get(url, params=param)
+                    response = requests.get(url)
                 except Exception as e:
                     default_logger.warning(e)
                     break

Original file line number	Diff line number	Diff line change
`@@ -323,7 +323,7 @@ def ordinary(N, opts=None):`
`323`	`323`	`"pid_data: %s,这个订单估计是京东外卖的，会导致此次评价失败，请把该 %s 商品手工评价后再运行程序。"`
`324`	`324`	`% (pid, oname),`
`325`	`325`	`)`
`326`		`- exit(0)`
	`326`	`+ continue`
`327`	`327`	`opts["logger"].info(f"\t{i}.开始评价订单\t{oname}[{oid}]并晒图")`
`328`	`328`	`url2 = "https://club.jd.com/myJdcomments/saveProductComment.action"`
`329`	`329`	`opts["logger"].debug("URL: %s", url2)`
Original file line number	Diff line number	Diff line change
`@@ -1,2 +1,2 @@`
`1`	`1`	`user:`
`2`		`- cookie: "''"`
	`2`	`+ cookie: ''' '''`