import re
# Sample HTML table rows: on each line the first cell holds the student ID and
# the second cell holds the name (optionally wrapped in or followed by extra
# tags such as <B>...</B> or <br />).
content = '''
<tr><td>1001</td><td>張三<br /></td></tr>
<tr><td>1002</td><td>李四</td></tr>
<tr><td>1003</td><td><B>Tom</B></td></tr>
'''

# The pattern is a raw string so that \d and \w reach the regex engine
# untouched; in a normal string literal they are invalid escape sequences,
# which Python reports with a warning.
# Group 1 is the first run of digits on a line. The greedy ".*" then backtracks
# to the last ">word<" on that same line ("." does not match newlines), and
# that word becomes group 2.
stu = re.findall(r"(\d+).*>(\w+)<", content)
print(stu)

# One list of (key, value) pairs per student; kept as its own module-level name
# because the original script defines it.
list_dict = [[("學號", student_id), ("姓名", name)] for student_id, name in stu]

# Turn each list of pairs into a dict keyed by the column labels.
stu_info = [dict(pairs) for pairs in list_dict]
print(stu_info)
# 或者用 bs4(BeautifulSoup)來解析這段 HTML 也行。