Skip to content
Projects
Groups
Snippets
Help
Loading...
Sign in
Toggle navigation
F
ffm-baseline
Project
Project
Details
Activity
Cycle Analytics
Repository
Repository
Files
Commits
Branches
Tags
Contributors
Graph
Compare
Charts
Issues
0
Issues
0
List
Board
Labels
Milestones
Merge Requests
0
Merge Requests
0
CI / CD
CI / CD
Pipelines
Jobs
Schedules
Charts
Wiki
Wiki
Members
Members
Collapse sidebar
Close sidebar
Activity
Graph
Charts
Create a new issue
Jobs
Commits
Issue Boards
Open sidebar
ML
ffm-baseline
Commits
a1908523
Commit
a1908523
authored
Jan 13, 2021
by
张彦钊
Browse files
Options
Browse Files
Download
Email Patches
Plain Diff
add
parent
e5c5dc82
Hide whitespace changes
Inline
Side-by-side
Showing
1 changed file
with
31 additions
and
1 deletion
+31
-1
hosipatl_name.py
zyz/hosipatl_name.py
+31
-1
No files found.
zyz/hosipatl_name.py
View file @
a1908523
...
...
@@ -9,14 +9,44 @@ import pandas as pd
# Extract abbreviated (short) hospital names
def get_city_names():
    """Return every city name stored in the ``api_city`` table.

    Connects to the ``zhengxing`` MySQL database, runs
    ``select name from api_city;`` and collects the first column of each
    returned row. The first ten names are printed as a quick sanity check.

    Returns:
        list: One entry per row, in the order the server returned them.
            An empty list when the query yields no rows.
    """
    # NOTE(review): host and credentials are hard-coded in source; they should
    # be loaded from configuration or the environment instead.
    db = pymysql.connect(host='172.16.30.143', port=3306, user='work',
                         passwd='BJQaT9VzDcuPBqkd', db='zhengxing')
    try:
        with db.cursor() as cursor:
            cursor.execute("select name from api_city;")
            rows = cursor.fetchall()
    finally:
        # Release the connection even when the query raises.
        db.close()

    # Rows are indexed positionally (column 0 is ``name``); this assumes the
    # default tuple-returning cursor. Building the list directly also copes
    # with an empty result, which a DataFrame round-trip would not.
    name_list = [row[0] for row in rows]
    print(name_list[:10])
    return name_list
def _strip_stop_words(name, stop_words):
    """Return *name* with each stop word removed, applied in list order."""
    if not isinstance(name, str):
        # A NULL name comes back as None; there is nothing to strip.
        return name
    for word in stop_words:
        # Literal replacement: stop words (notably city names read from the
        # database) must not be interpreted as regular expressions.
        name = name.replace(word, '')
    return name


def name_short(limit=20, output_path="/home/gmuser/12.csv"):
    """Build shortened hospital names and write them to a CSV file.

    Reads ``name`` from the ``api_hospital`` table, removes generic
    organisation words, location words and every city name (from
    ``get_city_names()``) from each hospital name, then writes the
    original/shortened pairs to ``output_path`` with the columns
    ``old_name`` and ``new_name``.

    Args:
        limit: Maximum number of hospital names to process. Defaults to 20,
            the cap that was previously hard-coded; pass ``None`` to process
            every row.
        output_path: Destination CSV path. Defaults to the previously
            hard-coded ``/home/gmuser/12.csv``.
    """
    # NOTE(review): host and credentials are hard-coded in source; they should
    # be loaded from configuration or the environment instead.
    db = pymysql.connect(host='172.16.30.143', port=3306, user='work',
                         passwd='BJQaT9VzDcuPBqkd', db='zhengxing')
    try:
        with db.cursor() as cursor:
            cursor.execute("select name from api_hospital;")
            result = cursor.fetchall()
    finally:
        # Release the connection even when the query raises.
        db.close()

    # Rows are indexed positionally (column 0 is ``name``); this assumes the
    # default tuple-returning cursor. Slicing with ``None`` keeps everything.
    name_list = [row[0] for row in result][:limit]
    print(name_list[:10])

    names = ["医疗", "门诊", "研究所", "有限", "公司", "医学", "诊所", "中心", "医美",
             "集团", "卫生", "机构", "专业", "光学", "国际", "连锁", "综合", "专科", ""]
    location = ["街道", "社区"]
    city_list = get_city_names()

    # Drop empty and non-string entries (the "" placeholder above, NULL city
    # names): they cannot match anything and would break the replacement.
    stop_words = [word for word in names + location + city_list
                  if isinstance(word, str) and word]

    new_names = [_strip_stop_words(name, stop_words) for name in name_list]

    df = pd.DataFrame({'old_name': name_list, 'new_name': new_names})
    print(df.head(6))
    # index=False omits the row index column from the file.
    df.to_csv(output_path, index=False)
# number = list()
# for i in cover:
...
...
Write
Preview
Markdown
is supported
0%
Try again
or
attach a new file
Attach a file
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Cancel
Please
register
or
sign in
to comment