-
Notifications
You must be signed in to change notification settings - Fork 1
/
ma_filter.py
58 lines (46 loc) · 2.01 KB
/
ma_filter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
###########################################################################
# Copyright 2015 by ACANETS Lab at University of Massachusetts Lowell #
# #
# Licensed under the Apache License, Version 2.0 (the "License"); #
# you may not use this file except in compliance with the License. #
# You may obtain a copy of the License at #
# #
# http://www.apache.org/licenses/LICENSE-2.0 #
# #
# Unless required by applicable law or agreed to in writing, software #
# distributed under the License is distributed on an "AS IS" BASIS, #
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.#
# See the License for the specific language governing permissions and #
# limitations under the License. #
###########################################################################
# This script is used for filtering the bad url from ma_list and keep the good url
import os
import json
import sys
import re
from query_diy import get_service_locator
ma = get_service_locator("service-type=ma") #return all the MA hostnames
print ma
f = open('dataset/ma_list180924','w+')
json.dump(ma,f)
f.close()
filtered_ma = []
count = 1.0
bar_length = 100
for i in ma:
response = os.system('ping -c 3 ' + i[7:len(i)-25]) #Use ping tool to check the network connection
if response == 0:
filtered_ma.append(i)
print filtered_ma
# Print a progress bar
percentage = (count/len(ma))*100
hashes = '#' * int(percentage)
spaces = ' ' * (bar_length - len(hashes))
print "\n"
print str(int(percentage)) + "% [" + hashes + spaces + "]"
print "\n"
count = count + 1.0
# Write the filter result to a new file
fp = open('dataset/filtered_ma_list180924', 'w+')
json.dump(filtered_ma,fp)
fp.close()