fish 3 months ago
parent
commit
77fb7ce9d5
4 changed files with 7 additions and 8 deletions
  1. +2 -1
      .env
  2. +1 -1
      README.md
  3. +1 -1
      crawl_sse/cninfo.py
  4. +3 -5
      docker-compose.debug.yml

+ 2 - 1
.env

@@ -1,2 +1,3 @@
-year = [ 2025, 2024, 2023, 2022, 2021, 2020, 2019, 2018, 2017, 2016, 2015, 2014, 2013, 2012, 2011, 2010 ]
+year = [ 202501, 202502, 202503, 202504, 
+2024, 2023, 2022, 2021, 2020, 2019, 2018, 2017, 2016, 2015, 2014, 2013, 2012, 2011, 2010 ]
 cookie = 

+ 1 - 1
README.md

@@ -51,6 +51,6 @@ docs/上市公司分析.ipynb
 
 Licensed under the [Apache 2.0](LICENSE) © [liuyuqi.gov@msn.cn](https://github.com/jianboy)
 
+## Reference
 
 
-## Reference

+ 1 - 1
crawl_sse/cninfo.py

@@ -18,7 +18,7 @@ class Cninfo(object):
     ''' 
     巨潮资讯
     '''
-    years =[ 2025, 2024, 2023, 2022, 2021, 2020, 2019, 2018, 2017, 2016, 2015, 2014, 2013, 2012, 2011, 2010 ]
+    years =[ 202501 ]
     host = "http://www.cninfo.com.cn"
     headers = {
         "Accept": "*/*",

+ 3 - 5
docker-compose.debug.yml

@@ -1,11 +1,9 @@
-version: '3.4'
 
 services:
   crawlsse:
-    image: crawlsse
+    image: sift-docker.pkg.coding.net/flutter-team/dev-container/crawl_sse:1.0.1
     build:
       context: .
       dockerfile: ./Dockerfile
-    command: ["sh", "-c", "pip install debugpy -t /tmp && python /tmp/debugpy --wait-for-client --listen 0.0.0.0:5678 main.py "]
-    ports:
-      - 5678:5678
+    command: ["python", "main.py", "crawl", "--extractor", "cninfo"]
+