import sys


def extract_pids(lines):
    """Return the id values of the lines that begin with ``<p id=``.

    For every matching line the text between the first and second
    double-quote character is collected, e.g. ``<p id="x1">`` yields
    ``'x1'``.  Only lines that start with the prefix at column 0 match;
    indented tags are ignored.

    Args:
        lines: Any iterable of text lines (an open file works).

    Returns:
        A list of the extracted id strings, in input order.
    """
    pids = []
    for line_no, line in enumerate(lines, 1):
        if not line.startswith('<p id='):
            continue
        fields = line.split('"')
        # Without any double quote there is no second field; report the
        # line and move on instead of dying with an IndexError.
        if len(fields) < 2:
            sys.stderr.write(
                'warning: line %d: no double-quoted id, skipped\n' % line_no)
            continue
        pids.append(fields[1])
    return pids


if __name__ == '__main__':
    if len(sys.argv) < 2:
        sys.exit('usage: %s FILE' % sys.argv[0])
    # The with-block closes the file even if reading fails; iterating the
    # file object streams it line by line rather than loading it whole.
    with open(sys.argv[1], 'r') as f:
        pid_list = extract_pids(f)
    # Parenthesised single-argument form prints identically on Python 2 and 3.
    print(pid_list)