Skip to content
项目
群组
代码片段
帮助
当前项目
正在载入...
登录 / 注册
切换导航面板
Z
zzsn_spider
概览
概览
详情
活动
周期分析
版本库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
统计图
问题
0
议题
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
CI / CD
CI / CD
流水线
作业
日程表
图表
维基
Wiki
代码片段
代码片段
成员
成员
折叠边栏
关闭边栏
活动
图像
聊天
创建新问题
作业
提交
问题看板
Open sidebar
王景浩
zzsn_spider
Commits
5cebbe1d
提交
5cebbe1d
authored
12月 21, 2023
作者:
薛凌堃
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
REITs专题脚本维护
上级
2e31675f
隐藏空白字符变更
内嵌
并排
正在显示
27 个修改的文件
包含
140 行增加
和
59 行删除
+140
-59
LawRules_2_shenzhen.py
REITs专题数据/LawRules_2_shenzhen.py
+3
-1
LawRules_shenzhen.py
REITs专题数据/LawRules_shenzhen.py
+3
-1
RuleGuide_shanghai.py
REITs专题数据/RuleGuide_shanghai.py
+2
-1
RuleGuide_shenzhen.py
REITs专题数据/RuleGuide_shenzhen.py
+2
-1
policy_beijing.py
REITs专题数据/policy_beijing.py
+8
-7
policy_chongqing.py
REITs专题数据/policy_chongqing.py
+3
-2
policy_fujian.py
REITs专题数据/policy_fujian.py
+3
-2
policy_guangdong.py
REITs专题数据/policy_guangdong.py
+3
-2
policy_guangxi.py
REITs专题数据/policy_guangxi.py
+3
-2
policy_gwy.py
REITs专题数据/policy_gwy.py
+3
-2
policy_hainan.py
REITs专题数据/policy_hainan.py
+3
-2
policy_heilongjiang.py
REITs专题数据/policy_heilongjiang.py
+3
-2
policy_hubei.py
REITs专题数据/policy_hubei.py
+3
-2
policy_jiangsu.py
REITs专题数据/policy_jiangsu.py
+3
-2
policy_jiangxi.py
REITs专题数据/policy_jiangxi.py
+3
-2
policy_jilin.py
REITs专题数据/policy_jilin.py
+3
-2
policy_liaoning.py
REITs专题数据/policy_liaoning.py
+3
-2
policy_neimenggu.py
REITs专题数据/policy_neimenggu.py
+3
-2
policy_shandong.py
REITs专题数据/policy_shandong.py
+3
-2
policy_shanghai.py
REITs专题数据/policy_shanghai.py
+3
-2
policy_shanxi.py
REITs专题数据/policy_shanxi.py
+3
-2
policy_sichuan.py
REITs专题数据/policy_sichuan.py
+3
-2
policy_tianjin.py
REITs专题数据/policy_tianjin.py
+3
-2
policy_yunnan.py
REITs专题数据/policy_yunnan.py
+3
-2
policy_zhejiang.py
REITs专题数据/policy_zhejiang.py
+3
-2
reits.py
REITs专题数据/reits.py
+20
-8
start.py
REITs专题数据/start.py
+42
-0
没有找到文件。
REITs专题数据/LawRules
-2-
shenzhen.py
→
REITs专题数据/LawRules
_2_
shenzhen.py
浏览文件 @
5cebbe1d
import
re
import
re
...
...
@@ -89,6 +89,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -133,6 +134,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
''
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
REITs专题数据/LawRules
-
shenzhen.py
→
REITs专题数据/LawRules
_
shenzhen.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -142,6 +142,7 @@ def doJob():
'content'
:
fjcontent
,
'contentWithTag'
:
''
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -172,6 +173,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
str
(
contentWithTag
),
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
REITs专题数据/RuleGuide
-
shanghai.py
→
REITs专题数据/RuleGuide
_
shanghai.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -117,6 +117,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
str
(
contentWithTag
),
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
REITs专题数据/RuleGuide
-
shenzhen.py
→
REITs专题数据/RuleGuide
_
shenzhen.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -79,6 +79,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
str
(
contentWithTag
),
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
REITs专题数据/policy
-
beijing.py
→
REITs专题数据/policy
_
beijing.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -129,8 +129,8 @@ def getFjContent(url):
# 北京市人民政府 https://www.beijing.gov.cn/so/s?siteCode=1100000088&tab=zcfg&qt=REITs
def
beijing
():
if
not
os
.
path
.
exists
(
'./相关政策/北京市人民政府/政策文件'
):
os
.
makedirs
(
'./相关政策/北京市人民政府/政策文件'
)
#
if not os.path.exists('./相关政策/北京市人民政府/政策文件'):
#
os.makedirs('./相关政策/北京市人民政府/政策文件')
policy1
=
Policy1
()
url
=
'https://www.beijing.gov.cn/so/ss/query/s'
payload
=
{
...
...
@@ -288,6 +288,7 @@ def beijing():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -299,7 +300,7 @@ def beijing():
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729041207245328385'
,
'sid'
:
'1729041207245328385'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
@@ -311,6 +312,6 @@ def beijing():
time
.
sleep
(
random
.
randint
(
10
,
20
))
num
+=
1
if
__name__
==
'__main__'
:
beijing
()
baseCore
.
close
()
#
if __name__ == '__main__':
#
beijing()
#
baseCore.close()
REITs专题数据/policy
-
chongqing.py
→
REITs专题数据/policy
_
chongqing.py
浏览文件 @
5cebbe1d
import
json
import
json
...
...
@@ -174,6 +174,7 @@ def getData(data_, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -185,7 +186,7 @@ def getData(data_, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729045755020103681'
,
'sid'
:
'1729045755020103681'
}
try
:
...
...
REITs专题数据/policy
-
fujian.py
→
REITs专题数据/policy
_
fujian.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -148,6 +148,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -159,7 +160,7 @@ def doJob():
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729043067106865154'
,
'sid'
:
'1729043067106865154'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
guangdong.py
→
REITs专题数据/policy
_
guangdong.py
浏览文件 @
5cebbe1d
import
datetime
import
datetime
...
...
@@ -150,6 +150,7 @@ def getData(data_, num,sid):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -161,7 +162,7 @@ def getData(data_, num,sid):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
sid
,
'sid'
:
sid
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
guangxi.py
→
REITs专题数据/policy
_
guangxi.py
浏览文件 @
5cebbe1d
import
json
import
json
...
...
@@ -123,6 +123,7 @@ def getData(data_, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -134,7 +135,7 @@ def getData(data_, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729045187128119298'
,
'sid'
:
'1729045187128119298'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
gwy.py
→
REITs专题数据/policy
_
gwy.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -156,6 +156,7 @@ def getData(data_, num):
'content'
:
content
,
'contentWithTag'
:
str
(
contentWithTag
),
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -167,7 +168,7 @@ def getData(data_, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729028548502597633'
,
'sid'
:
'1729028548502597633'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
hainan.py
→
REITs专题数据/policy
_
hainan.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -114,6 +114,7 @@ def getData(div, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -125,7 +126,7 @@ def getData(div, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729045345312100353'
,
'sid'
:
'1729045345312100353'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
heilongjiang.py
→
REITs专题数据/policy
_
heilongjiang.py
浏览文件 @
5cebbe1d
#coding=utf-8
#coding=utf-8
...
...
@@ -110,6 +110,7 @@ def getContent(num, title, publishDate, summary, id, pub_hao, organ,type):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -121,7 +122,7 @@ def getContent(num, title, publishDate, summary, id, pub_hao, organ,type):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729042585839841281'
,
'sid'
:
'1729042585839841281'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
hubei.py
→
REITs专题数据/policy
_
hubei.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -120,6 +120,7 @@ def getData(driver, data_, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -131,7 +132,7 @@ def getData(driver, data_, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
.
replace
(
'</em>'
,
''
)
.
replace
(
'<em>'
,
''
),
'createDate'
:
time_now
,
'sid'
:
'1729044085724860418'
,
'sid'
:
'1729044085724860418'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
jiangsu.py
→
REITs专题数据/policy
_
jiangsu.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -91,6 +91,7 @@ def getContentA(url, num, publishDate, title, origin, summary):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -102,7 +103,7 @@ def getContentA(url, num, publishDate, title, origin, summary):
'issuedNumber'
:
''
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729042894974537730'
,
'sid'
:
'1729042894974537730'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
jiangxi.py
→
REITs专题数据/policy
_
jiangxi.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -136,6 +136,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -147,7 +148,7 @@ def doJob():
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729043445107838978'
,
'sid'
:
'1729043445107838978'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
jilin.py
→
REITs专题数据/policy
_
jilin.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -161,6 +161,7 @@ def getData(num, title, url, origin, publishDate, summary):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -172,7 +173,7 @@ def getData(num, title, url, origin, publishDate, summary):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729042375596158978'
,
'sid'
:
'1729042375596158978'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
liaoning.py
→
REITs专题数据/policy
_
liaoning.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -69,6 +69,7 @@ def doJob():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -80,7 +81,7 @@ def doJob():
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729042213737967618'
,
'sid'
:
'1729042213737967618'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
neimenggu.py
→
REITs专题数据/policy
_
neimenggu.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -194,6 +194,7 @@ def getContent(num, data):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -205,7 +206,7 @@ def getContent(num, data):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729041959772860417'
,
'sid'
:
'1729041959772860417'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
shandong.py
→
REITs专题数据/policy
_
shandong.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -137,6 +137,7 @@ def getData(soup, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -148,7 +149,7 @@ def getData(soup, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729043593615560705'
,
'sid'
:
'1729043593615560705'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
shanghai.py
→
REITs专题数据/policy
_
shanghai.py
浏览文件 @
5cebbe1d
import
json
import
json
...
...
@@ -117,6 +117,7 @@ def getData(data_, driver, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -128,7 +129,7 @@ def getData(data_, driver, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729042751554506754'
,
'sid'
:
'1729042751554506754'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
shanxi.py
→
REITs专题数据/policy
_
shanxi.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -136,6 +136,7 @@ def getContent(num, data):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -147,7 +148,7 @@ def getContent(num, data):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729041791539326977'
,
'sid'
:
'1729041791539326977'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
sichuan.py
→
REITs专题数据/policy
_
sichuan.py
浏览文件 @
5cebbe1d
import
time
import
time
...
...
@@ -112,6 +112,7 @@ def getData(data_, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -123,7 +124,7 @@ def getData(data_, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729046053927178241'
,
'sid'
:
'1729046053927178241'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
tianjin.py
→
REITs专题数据/policy
_
tianjin.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -143,6 +143,7 @@ def getContent(num, title, pub_time, origin, organ, url, pub_hao, summary):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
pub_time
,
...
...
@@ -154,7 +155,7 @@ def getContent(num, title, pub_time, origin, organ, url, pub_hao, summary):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729041400674045953'
,
'sid'
:
'1729041400674045953'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
yunnan.py
→
REITs专题数据/policy
_
yunnan.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -155,6 +155,7 @@ def getData(div, num):
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -166,7 +167,7 @@ def getData(div, num):
'issuedNumber'
:
pub_hao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729046848292892673'
,
'sid'
:
'1729046848292892673'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/policy
-
zhejiang.py
→
REITs专题数据/policy
_
zhejiang.py
浏览文件 @
5cebbe1d
import
os
import
os
...
...
@@ -508,6 +508,7 @@ def getDatas(page):
'content'
:
content
,
'contentWithTag'
:
contentWithTag
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -519,7 +520,7 @@ def getDatas(page):
'issuedNumber'
:
''
,
'summary'
:
''
,
'createDate'
:
time_now
,
'sid'
:
'1730472253306552321'
,
'sid'
:
'1730472253306552321'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
REITs专题数据/reits.py
浏览文件 @
5cebbe1d
impor
t
os
impor
t
os
...
...
@@ -284,6 +284,7 @@ def reform():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate_
,
...
...
@@ -295,7 +296,7 @@ def reform():
'issuedNumber'
:
pubHao
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729029275400646658'
,
'sid'
:
'1729029275400646658'
}
# DataList.append(dic_info)
try
:
...
...
@@ -421,6 +422,7 @@ def zhengquanqihuo():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -432,7 +434,7 @@ def zhengquanqihuo():
'summary'
:
''
,
'topicClassification'
:
''
,
'createDate'
:
time_now
,
'sid'
:
'1729030277461815298'
,
'sid'
:
'1729030277461815298'
}
try
:
baseCore
.
sendkafka
(
dic_info
,
topic
)
...
...
@@ -482,7 +484,8 @@ def sse():
# if not os.path.exists(path):
# os.makedirs(path)
for
page
in
range
(
0
,
int
(
total_page
)):
url_page
=
f
'http://query.sse.com.cn/search/getESSearchDoc.do?page={page}&limit=10&publishTimeEnd=&publishTimeStart=&orderByDirection=DESC&orderByKey=score&searchMode=fuzzy&spaceId=3&keyword=REITs&siteName=sse&keywordPosition=title
%2
Cpaper_content&channelId=10001&channelCode=8640
%2
C8641
%2
C8642
%2
C8643
%2
C8644
%2
C8645
%2
C8646
%2
C8647
%2
C8648
%2
C8649
%2
C8650
%2
C8651
%2
C8652
%2
C8653
%2
C8654
%2
C8655
%2
C8656
%2
C8657
%2
C8658
%2
C8659
%2
C8660
%2
C8661
%2
C8685
%2
C9348
%2
C12632
%2
C12768
%2
C12769
%2
C12770
%2
C12771
%2
C12772
%2
C12773
%2
C12774
%2
C12775
%2
C12776
%2
C12777
%2
C12778
%2
C12779
%2
C12780
%2
C12781
%2
C12782
%2
C12783
%2
C12784
%2
C12785
%2
C12786
%2
C12787
%2
C12788
%2
C12789
%2
C12790
%2
C12791
%2
C12792
%2
C12793
%2
C12794
%2
C12795
%2
C12796
%2
C12797
%2
C12798
%2
C12799
%2
C12800
%2
C12801
%2
C12802
%2
C12803
%2
C12804
%2
C12805
%2
C12806
%2
C12807
%2
C12808
%2
C12809
%2
C12810
%2
C12811
%2
C12812
%2
C13061
%2
C13282
%2
C13283
%2
C13284
%2
C13285
%2
C13286
%2
C13287
%2
C13288
%2
C13289
%2
C13294
%2
C13364
%2
C13365
%2
C13366
%2
C13367
%2
C14595
%2
C14596
%2
C14597
%2
C14598
%2
C14599
%2
C14600
%2
C14601
%2
C14602
%2
C14603
%2
C14604
%2
C14605
%2
C14606&trackId=50619067167713018335655119683810&_=1699508921761'
t
=
int
(
time
.
time
())
url_page
=
f
'http://query.sse.com.cn/search/getESSearchDoc.do?page={page}&limit=10&publishTimeEnd=&publishTimeStart=&orderByDirection=DESC&orderByKey=score&searchMode=fuzzy&spaceId=3&keyword=REITs&siteName=sse&keywordPosition=title
%2
Cpaper_content&channelId=10001&channelCode=8640
%2
C8641
%2
C8642
%2
C8643
%2
C8644
%2
C8645
%2
C8646
%2
C8647
%2
C8648
%2
C8649
%2
C8650
%2
C8651
%2
C8652
%2
C8653
%2
C8654
%2
C8655
%2
C8656
%2
C8657
%2
C8658
%2
C8659
%2
C8660
%2
C8661
%2
C12632&trackId=24278800487459370386559742313666&_={t}'
data
=
policy
.
getrequest_json
(
headers
,
url_page
)
newslist
=
data
[
'data'
][
'knowledgeList'
]
# print(newslist)
...
...
@@ -534,6 +537,7 @@ def sse():
'content'
:
content
,
'contentWithTag'
:
''
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -545,7 +549,7 @@ def sse():
'issuedNumber'
:
''
,
'summary'
:
summary
,
'createDate'
:
time_now
,
'sid'
:
'1729035244826374145'
,
'sid'
:
'1729035244826374145'
}
# DataList.append(dic_info)
try
:
...
...
@@ -603,6 +607,7 @@ def sse():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
,
'publishDate'
:
publishDate
,
...
...
@@ -625,7 +630,7 @@ def sse():
except
Exception
as
e
:
log
.
info
(
f
"error!!!{newsUrl}"
)
log
.
info
(
e
)
log
.
info
(
f
'====第{page}页====处理结束,
已采集{num}条数据=
================'
)
log
.
info
(
f
'====第{page}页====处理结束,================'
)
# 河北省人民政府
...
...
@@ -636,7 +641,7 @@ def hebei():
num
=
0
webname
=
'河北省人民政府'
url
=
"https://www.hebei.gov.cn/search/pcRender?pageId=b97a38833f7343cebc31dec44544f684"
appNames
=
[
'信息公开'
]
appNames
=
[
'信息公开'
,
'热点专题'
]
for
appName
in
appNames
:
payload
=
{
'qAnd'
:
' '
,
'qOr'
:
' '
,
...
...
@@ -820,6 +825,9 @@ def hebei():
'attachmentIds'
:
id_list
,
'author'
:
''
,
'content'
:
content
,
'checkStatus'
:
1
,
'deleteFlag'
:
0
,
'id'
:
''
,
'contentWithTag'
:
contentWithTag_str
,
'title'
:
title
.
replace
(
'
\n
'
,
''
),
'publishDate'
:
publishDate
,
...
...
@@ -933,6 +941,7 @@ def guizhou():
'content'
:
content
,
'contentWithTag'
:
contentWithTag_str
,
'deleteFlag'
:
0
,
'checkStatus'
:
1
,
'id'
:
''
,
'title'
:
title
.
replace
(
'
\n
'
,
''
),
'publishDate'
:
publishDate
,
...
...
@@ -966,7 +975,10 @@ if __name__=="__main__":
reform
()
# shenzhen()
zhengquanqihuo
()
sse
()
try
:
sse
()
except
:
pass
hebei
()
guizhou
()
...
...
REITs专题数据/start.py
0 → 100644
浏览文件 @
5cebbe1d
import
reits
import
reits
import
policy_beijing
,
policy_chongqing
,
policy_fujian
,
policy_guangdong
import
policy_guangxi
,
policy_gwy
,
policy_hainan
,
policy_heilongjiang
,
policy_hubei
,
policy_jiangsu
import
policy_jiangxi
,
policy_jilin
,
policy_liaoning
,
policy_neimenggu
,
policy_shandong
,
policy_hubei
import
policy_shanxi
,
policy_sichuan
,
policy_tianjin
,
policy_yunnan
,
policy_zhejiang
import
RuleGuide_shanghai
,
RuleGuide_shenzhen
import
LawRules_shenzhen
,
LawRules_2_shenzhen
# Script entry point: run each REITs collector one after another, in the
# order listed below. The guard must compare against "__main__"; any other
# string never matches and the script would silently do nothing.
if __name__ == "__main__":
    policy_beijing.beijing()

    # Collectors defined in reits.py.
    reits.sse()
    reits.reform()
    reits.hebei()
    reits.guizhou()
    reits.zhengquanqihuo()

    # Per-region policy collectors.
    policy_chongqing.doJob()
    policy_fujian.doJob()
    policy_guangdong.doJob()
    policy_guangxi.doJob()
    policy_gwy.doJob()
    policy_hainan.doJob()
    policy_heilongjiang.doJob()
    policy_hubei.doJob()
    policy_jiangsu.doJob()
    policy_jiangxi.doJob()
    policy_jilin.doJob()
    policy_liaoning.doJob()
    policy_neimenggu.doJob()
    policy_shandong.doJob()
    # NOTE(review): policy_hubei is run a second time here and policy_shanghai
    # is never imported or run -- presumably this was meant to be
    # policy_shanghai; confirm its entry point before changing.
    policy_hubei.doJob()
    policy_shanxi.doJob()
    policy_sichuan.doJob()
    policy_tianjin.doJob()
    policy_yunnan.doJob()
    policy_zhejiang.doJob()

    # Exchange rule-guide and law/regulation collectors.
    RuleGuide_shanghai.doJob()
    RuleGuide_shenzhen.doJob()
    LawRules_shenzhen.doJob()
    LawRules_2_shenzhen.doJob()
\ No newline at end of file
编写
预览
Markdown
格式
0%
重试
或
添加新文件
添加附件
取消
您添加了
0
人
到此讨论。请谨慎行事。
请先完成此评论的编辑!
取消
请
注册
或者
登录
后发表评论