|
|
发表于 2017-9-28 16:16:31
|
显示全部楼层
"""Extract issue numbers and their drawn ball sequences from a results table.

Each result row in the markup has an all-digit issue cell
(``<td class="tdbbs tdbrs">637564</td>``) followed by a nested table whose
``<span class="Bwi dB<N>x">`` elements encode the drawn numbers in order.
"""
import re

html = '''
<td class="tdbbs tdbrs">2017-09-01</td>
<td class="tdbbs tdbrs">637564</td>
<td class="tdbb tdbrs" align="center">
<table width="300" border="0" cellpadding="0" cellspacing="0" class="m0a">
<tr>
<td><span class="Bwi dB8x"></span></td>
<td><span class="Bwi dB6x"></span></td>
<td><span class="Bwi dB2x"></span></td>
<td><span class="Bwi dB1x"></span></td>
<td><span class="Bwi dB7x"></span></td>
<td><span class="Bwi dB5x"></span></td>
<td><span class="Bwi dB10x"></span></td>
<td><span class="Bwi dB3x"></span></td>
<td><span class="Bwi dB9x"></span></td>
<td><span class="Bwi dB4x"></span></td>
</tr>
</table>
</td>


<td class="tdbbs tdbrs">2017-09-01</td>
<td class="tdbbs tdbrs">637563</td>
<td class="tdbb tdbrs" align="center">
<table width="300" border="0" cellpadding="0" cellspacing="0" class="m0a">
<tr>
<td><span class="Bwi dB10x"></span></td>
<td><span class="Bwi dB2x"></span></td>
<td><span class="Bwi dB1x"></span></td>
<td><span class="Bwi dB8x"></span></td>
<td><span class="Bwi dB4x"></span></td>
<td><span class="Bwi dB9x"></span></td>
<td><span class="Bwi dB3x"></span></td>
<td><span class="Bwi dB7x"></span></td>
<td><span class="Bwi dB6x"></span></td>
<td><span class="Bwi dB5x"></span></td>
</tr>
</table>'''

# Raw strings: "\d" in a normal string literal is an invalid escape sequence
# and triggers a SyntaxWarning on recent Python versions.
# The date cell shares the same CSS classes but contains hyphens, so the
# digits-only group matches the issue-number cell alone.
_ISSUE_RE = re.compile(r'<td class="tdbbs tdbrs">(\d+)</td>')
_BALL_RE = re.compile(r'<td><span class="Bwi dB(\d+)x"></span></td>')


def parse_draws(markup):
    """Return ``[(issue, [ball, ...]), ...]`` in document order.

    Balls are collected from the text between one issue cell and the next
    (or the end of the markup), so a row with more or fewer than ten balls
    cannot shift the numbers of the rows that follow it.

    Args:
        markup: HTML text containing zero or more result rows.

    Returns:
        A list of ``(issue, balls)`` tuples; both the issue number and each
        ball are kept as the digit strings found in the markup.
    """
    issue_cells = list(_ISSUE_RE.finditer(markup))
    # Each row's search window ends where the next issue cell begins.
    window_ends = [cell.start() for cell in issue_cells[1:]] + [len(markup)]
    return [
        (cell.group(1), _BALL_RE.findall(markup, cell.end(), stop))
        for cell, stop in zip(issue_cells, window_ends)
    ]


for issue, balls in parse_draws(html):
    print(issue)
    print(balls)
复制代码
637564
['8', '6', '2', '1', '7', '5', '10', '3', '9', '4']
637563
['10', '2', '1', '8', '4', '9', '3', '7', '6', '5']
[Finished in 0.1s] |
|