-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfindSimilarity.py
70 lines (57 loc) · 1.74 KB
/
findSimilarity.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
import csv
import urllib.request
from bs4 import BeautifulSoup
"""
according to html's lineNum --- res code
read file find similar function report the line
确定函数名称
确定错误行号 找到对应错误代码的行号 错误代码 对应在函数名称下面的多少行
"""
def listToString(s):
    """Join the strings in ``s`` into a single newline-separated string.

    Args:
        s: iterable of strings.

    Returns:
        The items of ``s`` concatenated with ``"\\n"`` between them; an empty
        string when ``s`` is empty.
    """
    return "\n".join(s)
def find_function():
    """Placeholder for the function lookup; currently does nothing."""
    return None
def visitUrl(url):
    """Fetch ``url`` and return the response body decoded as UTF-8 text.

    Args:
        url: URL passed straight to ``urllib.request.urlopen``.

    Returns:
        The complete response body as a ``str``.

    Raises:
        urllib.error.URLError: if the URL cannot be opened.
        UnicodeDecodeError: if the body is not valid UTF-8.
    """
    # The context manager closes the response even when reading or decoding
    # raises; the previous version never closed it.
    with urllib.request.urlopen(url) as resp:
        return resp.read().decode("utf-8")
def saveHtml(file_name, file_text):
    """Write ``file_text`` to a local ``.html`` file named after ``file_name``.

    Every ``/`` in ``file_name`` is replaced with ``_`` and ``.html`` is
    appended to form the target file name. The file is written as UTF-8 and
    overwritten if it already exists.
    """
    target = file_name.replace('/', '_') + '.html'
    with open(target, 'w', encoding='utf-8') as out:
        out.write(file_text)
def visitHtmlFile(urlname):
    """Return the text of the locally saved HTML page for ``urlname``.

    Every ``/`` in ``urlname`` is replaced with ``_`` to form the file name.
    That exact name is tried first; if it does not exist, the same name with
    ``.html`` appended is tried, which is the name ``saveHtml`` writes.

    Args:
        urlname: URL (or file name) identifying the saved page.

    Returns:
        The file content as one string, with its line breaks unchanged.

    Raises:
        FileNotFoundError: if neither candidate file exists.
    """
    path = urlname.replace('/', '_')
    try:
        f = open(path, 'r', encoding='utf-8')
    except FileNotFoundError:
        # saveHtml stores pages as "<name>.html"; fall back to that name.
        f = open(path + '.html', 'r', encoding='utf-8')
    with f:
        # Read the text in one piece. Joining readlines() output with "\n"
        # doubled every line break, because each line already ends with one.
        return f.read()
# Walk the bug-report CSV and, for each row, load and parse the locally saved
# HTML report that the row's URL points to.
# CSV columns: ,function,line,length,url,file,s_function,s_line,status,error type
#
# newline='' is what the csv module asks for: it lets the reader handle line
# endings itself, so quoted fields containing line breaks parse correctly.
with open('bug reports - numpy-f2py.csv', 'r', encoding='utf-8', newline='') as f:
    row = csv.DictReader(f, delimiter=',')
    for line in row:
        print(line['file'])
        print(line['function'])
        print(line)
        # Not used yet; presumably meant for find_function() -- TODO confirm.
        funcname = line['function']
        url = line['url']
        # The report is read from a local copy. To download and save it first:
        #     htmlpage = visitUrl(url)
        #     saveHtml(url, htmlpage)
        #     print(htmlpage)
        htmlpage = visitHtmlFile(url)
        soup = BeautifulSoup(htmlpage, 'html.parser')
        print(soup)
# Example of a saved report file name:
# http:__192.168.5.61:20000_report-c53a24.html#EndPath.html