-
Notifications
You must be signed in to change notification settings - Fork 0
/
generateWordList.py
40 lines (33 loc) · 1.08 KB
/
generateWordList.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
import requests,json,string
from urllib.parse import urlparse
# apis.io exposes a paginated public directory of API descriptions; the path
# segments of each entry's 'baseURL' are harvested as candidate words.
APIdatabaseURL = "http://apis.io/api/apis?limit=1000"
# Words longer than this many characters are dropped from the final list.
MAX_WORD_LENGTH = 20
# Seconds to wait on a single directory request before giving up.
REQUEST_TIMEOUT = 30


def extract_path_words(base_url):
    """Return the non-empty path segments of *base_url* after the first one.

    The URL path is split on "/" and the first piece is skipped (for an
    absolute path that piece is the empty string before the leading slash).
    Empty pieces caused by trailing or doubled slashes are discarded so no
    blank entries reach the word list. A non-string *base_url* yields [].
    """
    if not isinstance(base_url, str):
        return []
    segments = urlparse(base_url).path.split("/")
    return [segment for segment in segments[1:] if segment]


def drop_long_words(candidates, max_length=MAX_WORD_LENGTH):
    """Return the words of *candidates* no longer than *max_length*, in order.

    A new list is built instead of calling ``remove`` on the list being
    iterated, which skips the element that follows every removed one.
    """
    return [word for word in candidates if len(word) <= max_length]


def collect_words(start_url=APIdatabaseURL):
    """Follow the directory's pages and return unique path words in order.

    Starts at *start_url* and stops when a page has no entries, when there is
    no next-page link, or when a next-page link repeats one already fetched.

    Raises:
        requests.HTTPError: if a page request returns an error status.
        KeyError: if a page has no 'data' field.
    """
    words = []
    seen_words = set()  # O(1) duplicate check; `words` keeps first-seen order
    visited_pages = set()
    page_url = start_url
    while page_url and page_url not in visited_pages:
        visited_pages.add(page_url)
        response = requests.get(page_url, timeout=REQUEST_TIMEOUT)
        response.raise_for_status()
        page = json.loads(response.content)
        entries = page['data']
        # An empty page means there is nothing left to read.
        if not entries:
            break
        for entry in entries:
            if 'baseURL' not in entry:
                continue
            for word in extract_path_words(entry['baseURL']):
                if word not in seen_words:
                    seen_words.add(word)
                    words.append(word)
        # NOTE(review): the key was previously spelled ' paging' (leading
        # space); 'paging' is presumably the intended field - confirm against
        # the API's response schema.
        page_url = (page.get('paging') or {}).get('next')
    return words


def main():
    """Collect the words, drop the over-long ones and write 'wordList'."""
    words = drop_long_words(collect_words())
    # One word per line.
    with open('wordList', 'w', encoding='utf-8') as f:
        f.writelines("%s\n" % word for word in words)


if __name__ == "__main__":
    main()