您现在的位置: 首页 > 网站导航收录 > 百科知识百科知识
python易于上手,你都用python做什么?
数据,爬虫,申请人python易于上手,你都用python做什么?
发布时间:2020-12-06 | 加入收藏 | 来源:互联网 | 点击:
首先,当然是进入你需要共享文件的目录下
然后根据python版本的不同,选择执行如下命令:
Python2
python -m SimpleHTTPServer 9999
Python3
python -m http.server 9999
数据分析
主要是根据中间件的不同来写一些脚本,比如连接Elasticsearch、连接Kafka、连接MySQL、连接Redis,在开发过程中可以快速地获取到数据,验证想法
希望能帮到你
回答于 2019-09-11 08:43:50
在律所里分析判决书!相当有用!
上代码:
import docx, csv, docxpy
import re
from get_file_path import all_file_list
def _pad(values, size, fill=''):
    """Return the first *size* items of *values*, padded with *fill* when shorter.

    Used to spread a variable-length list of matches over a fixed number of
    named variables without writing into ``locals()``.
    """
    head = list(values[:size])
    return head + [fill] * (size - len(head))


# Extract party, lawyer, panel and address fields from each retrial judgment
# (.docx) listed in ``all_file_list``. The CSV header row is appended to
# ``process_book.csv`` before the documents are processed.
#
# newline='' is what the csv module asks for when opening the output file;
# without it extra blank rows can appear on platforms that translate '\n'.
with open('process_book.csv', 'a+', encoding='utf-8', newline='') as csv_file:
    writer = csv.writer(csv_file)
    writer.writerow([
        # A comma was missing after '原审地', which silently concatenated it
        # with the next literal and shifted every following column.
        '案号', '法院名称', '原审地',
        '再审申请人1', '再审申请人1住址',
        '再审申请人2', '再审申请人2住址',
        '再审申请人3', '再审申请人3住址',
        '再审申请人一审地位', '再审申请人二审地位',
        '被申请人1住址', '被申请人2住址', '被申请人3住址',
        '被申请人的类型,0自然人,1公司法人,2机关法人',
        '再审申请人是否有律师', '被申请人是否有律师',
        '合议庭人数', '审判长姓名', '审判员1', '审判员2',
    ])

    for docx_path in all_file_list:
        # The same file is read twice: python-docx gives paragraph access,
        # docxpy gives the whole text as one string for the regex searches.
        document = docx.Document(docx_path)
        print('------docx已经顺利读出文件,开始处理中------')
        full_text = docxpy.process(docx_path)
        print('------docxpy已经顺利读出文件,开始处理中------')

        # Case number: read from the paragraph at index 7.
        try:
            number = document.paragraphs[7].text
        except IndexError:
            number = '出错'
        print(number)

        # --- Court and region of the case ---------------------------------
        # Name of the court handling the retrial. Falls back to the same
        # error marker used for the case number instead of aborting the
        # whole batch when the line is absent.
        court_matches = re.findall(r'审理法院: (.*)', full_text)
        court_name = court_matches[0] if court_matches else '出错'

        # Which court's judgment is being contested: keep the first three
        # CJK characters of the court name. The last matching line wins.
        case_district = ''
        for district in re.findall(r'(.*)不服(.*)人民法院', full_text):
            region = re.findall(r'[一-龥]{3}', district[1])
            if region:
                case_district = region[0]

        # --- Retrial applicants' names ------------------------------------
        # Every pattern below has two groups, so re.findall yields
        # (label_suffix, detail) tuples; only the detail part is used.
        # NOTE(review): the original called str methods on the tuple itself,
        # which raises AttributeError; using the second group is the
        # presumed intent - confirm against real documents.
        appellant_name_list = []
        for _, detail in re.findall(r'再审申请人(.*):(.*),', full_text):
            # The name is whatever precedes the first comma of the detail.
            appellant_name_list.append(detail.split(',')[0])

        if not appellant_name_list:
            # Fallback: entries followed directly by "。住所".
            for _, detail in re.findall(r'再审申请人(.*):(.*)。住所', full_text):
                appellant_name_list.append(detail)

        if not appellant_name_list:
            # Last resort: entries that end the line with a full stop. The
            # literal was split across two physical lines in the source;
            # restored as an explicit \n.
            for _, detail in re.findall(r'再审申请人(.*):(.*)。\n', full_text):
                appellant_name_list.append(detail)

        (appellant_name_0, appellant_name_1,
         appellant_name_2, appellant_name_3) = _pad(appellant_name_list, 4)

        # --- Do the parties have a lawyer? --------------------------------
        # The original patterns had an unbalanced "(" and could not compile.
        # Without a group, findall returns the full match, which includes
        # the agent line that is tested for "律师".
        # NOTE(review): [\s\S]* is greedy and crosses newlines, so each
        # pattern gives at most one match running up to the LAST agent line
        # in the text; the two flags are therefore not strictly per-party.
        appellant_have_lawyer = 0
        for agent_span in re.findall(r'再审申请人[\s\S]*委托诉讼代理人:.*', full_text):
            appellant_have_lawyer = 1 if '律师' in agent_span else 0

        retrial_respondent_have_lawyer = 0
        for agent_span in re.findall(r'被申请人[\s\S]*委托诉讼代理人:.*', full_text):
            retrial_respondent_have_lawyer = 1 if '律师' in agent_span else 0

        # --- Collegiate panel ---------------------------------------------
        chief_judge = ''   # presiding judge
        judge_list = []    # all other judges found
        for paragraph in document.paragraphs:
            for raw_name in re.findall(r'审判长 (.+)', paragraph.text):
                chief_judge = raw_name.replace(' ', '')
            for raw_name in re.findall(r'审判员 (.+)', paragraph.text):
                judge_list.append(raw_name.replace(' ', ''))

        # Panel size is counted as the presiding judge plus the judges found.
        collegiate_bench_num = 1 + len(judge_list)
        judge_officer_0, judge_officer_1 = _pad(judge_list, 2)

        # --- Retrial applicants' addresses --------------------------------
        # First try the pattern with the full "住所地" wording, then fall
        # back to a bare "住".
        appellant_address_result = re.findall(r'再审申请人(.*):.*住所地(.*)。', full_text)
        if not appellant_address_result:
            appellant_address_result = re.findall(r'再审申请人(.*):.*住(.+)。', full_text)
        appellant_address_list = [
            address.strip(':') for _, address in appellant_address_result
        ]
        (appellant_address_0, appellant_address_1,
         appellant_address_2, appellant_address_3) = _pad(appellant_address_list, 4)

        # --- Respondents' addresses ---------------------------------------
        respondent_address_result = re.findall(r'被申请人(.*):.*住所地(.*)。', full_text)
        respondent_address_list = [
            address.strip(':') for _, address in respondent_address_result
        ]
        (respondent_address_0, respondent_address_1,
         respondent_address_2, respondent_address_3) = _pad(respondent_address_list, 4)

        # NOTE(review): the published listing is cut off at this point. Any
        # fallback branch for respondents and the code that writes the
        # per-document row with ``writer`` are not part of the visible source.
下一篇:返回列表
相关链接 |
||
网友回复(共有 0 条回复) |