def crawPlateConceptDataSource(link):
    """Build a list of per-row records scraped from the table at ``link``.

    All text extraction is delegated to ``PlateConceptNetSpiderUtils``; the
    exact slicing semantics of those helpers are not visible here.

    Args:
        link: Passed unchanged to
            ``PlateConceptNetSpiderUtils.returnStartContext`` (presumably a
            page URL -- confirm against the helper).

    Returns:
        A list with one entry per ``'<tr'`` counted in the table body. Each
        entry is a list of the form
        ``[platename, linkUrl, risedecline, inmoney, outmoney, currentmoney,
        totalmoney]``, where ``risedecline`` is the extracted percentage text
        converted with ``float`` and divided by 100, and the other fields are
        whatever the helper returns for the extracted text.

    Raises:
        ValueError: Propagated from ``float`` when the text extracted for
            ``risedecline`` is not a valid number.
    """
    spider = PlateConceptNetSpiderUtils
    records = []

    # Narrow the content down to the table body, then drop everything up to
    # the first '</tr>' (presumably the header row -- TODO confirm).
    table_body = spider.returnStartContext(link, '<tbody>')
    table_body = spider.filterContextByTarget(table_body, '<tbody>', '</tbody>')
    table_body = spider.filterAfterContext(table_body, '</tr>')

    row_total = spider.findAllTarget(table_body, '<tr')
    for _ in range(row_total):
        # Split off the next row; the remainder is kept for the next pass.
        split_result = spider.divisionTarget(table_body, '<tr', '</tr>')
        table_body = split_result['nextContext']
        row_text = split_result['targetContext']
        row_text = spider.removeSpecialCharacter(row_text)

        # First cell: an anchor that carries both the name and the href.
        anchor_text = spider.filterContextByTarget(row_text, '<td>', '</a>')
        plate_name = spider.filterAfterContext(anchor_text, '>')
        plate_url = spider.filterContextByTarget(anchor_text, 'href="', '">')

        # Advance past two '</td>' terminators before reading the numbers.
        row_text = spider.filterAfterContext(row_text, '</td>')
        row_text = spider.filterAfterContext(row_text, '</td>')

        # NOTE(review): the rise/decline value and the inflow value are both
        # read from the same remaining text without advancing in between --
        # confirm this is intended.
        percent_text = spider.filterContextByTarget(row_text, '>', '%')
        rise_decline = float(percent_text) / 100
        money_in = spider.filterContextByTarget(row_text, '<td>', '</td>')

        row_text = spider.filterAfterContext(row_text, '</td>')
        money_out = spider.filterContextByTarget(row_text, '<td>', '</td>')

        row_text = spider.filterAfterContext(row_text, '</td>')
        # NOTE(review): this end delimiter is upper-case '</TD>' while every
        # other tag in this function is lower-case, and the total below is
        # read from the same remaining text -- verify against the page markup.
        money_current = spider.filterContextByTarget(row_text, '>', '</TD>')
        money_total = spider.filterContextByTarget(row_text, '<td>', '</td>')

        records.append([
            plate_name,
            plate_url,
            rise_decline,
            money_in,
            money_out,
            money_current,
            money_total,
        ])

    return records