# -*- coding: utf-8 -*-
"""Query the UCAS predictive-search web service and print the matches.

Provenance: this script was introduced as ``get_school_names_from_ucas.py``
by commit 03ebc9751e497953a22444e54cdc7104cdb07260 (ghoshorn, 2016-03-23);
the commit subject translates to "Get school names etc. through the UCAS
interface".

The script was written for Python 2 (``urllib2``).  The imports below fall
back to the Python 3 module names so the same file runs on either
interpreter.
"""
import sys
from contextlib import closing

try:  # Python 2
    from urllib import quote
    from urllib2 import urlopen
except ImportError:  # Python 3
    from urllib.parse import quote
    from urllib.request import urlopen

try:
    # Python 2 only: make UTF-8 the implicit str<->unicode codec so that
    # printing unicode text to a pipe does not fail with an ASCII error.
    # Kept from the original script to preserve its output behaviour.
    reload(sys)
    sys.setdefaultencoding("utf-8")
except NameError:
    # Python 3 has no builtin ``reload``; nothing to do there.
    pass

# Endpoint plus fixed query prefix; the search keyword is appended to it.
# The scheme must be explicit: urlopen() rejects a scheme-less URL with
# ValueError.
SEARCH_URL = (
    'http://edu.ucas.ac.cn:8080/TRRP_SEP/WebService/PredictiveSearch.asmx'
    '/GetAllPredictionsWithCodeInfo?className=jzs010114&codeOrName='
)

# Keyword searched for when main() is called without an argument.
DEFAULT_KEYWORD = '中国科学院'

# Line printed when the service returns no usable record (means "empty").
EMPTY_MARKER = "空"

# Seconds to wait for the service before giving up.
REQUEST_TIMEOUT = 30


def build_url(keyword):
    """Return the request URL for *keyword*.

    The keyword is percent-encoded as UTF-8 so that non-ASCII text and
    reserved characters such as ``&`` cannot corrupt the query string.
    *keyword* may be text or an already UTF-8 encoded byte string.
    """
    if not isinstance(keyword, bytes):
        keyword = keyword.encode('utf-8')
    return SEARCH_URL + quote(keyword)


def fetch(url):
    """Download *url* and return the raw response body.

    The response is always closed, even when reading fails.
    """
    with closing(urlopen(url, timeout=REQUEST_TIMEOUT)) as response:
        return response.read()


def extract_names(content):
    """Return the text of the third field of every record in *content*.

    *content* is parsed with lxml's HTML parser.  The records are the
    children of the first element nested two levels below the parsed root
    (presumably below the <html>/<body> wrappers the HTML parser adds --
    confirm against a real response).  The third child of each record is
    presumably the school name; verify against the service's schema.

    Records with fewer than three children, or whose third child has no
    text, are skipped.  An empty or unexpectedly shallow document yields
    an empty list.
    """
    # Imported here so the URL and reporting helpers stay importable on
    # machines without lxml installed.
    from lxml import etree

    tree = etree.HTML(content)
    if tree is None or len(tree) == 0 or len(tree[0]) == 0:
        return []
    return [
        record[2].text
        for record in tree[0][0]
        if len(record) > 2 and record[2].text is not None
    ]


def report_lines(names):
    """Return the lines to print for *names*.

    The names themselves when there are any, otherwise a single
    EMPTY_MARKER line.  (The original used ``for ... else``, whose ``else``
    branch runs whenever the loop finishes without ``break`` and therefore
    printed the marker after every run.)
    """
    return list(names) or [EMPTY_MARKER]


def main(keyword=DEFAULT_KEYWORD):
    """Look up *keyword*, print one result per line, return an exit status.

    Returns 0 on success.  On any failure (network, HTTP, parsing) the
    error is reported on stderr and 1 is returned, so a failed lookup is
    no longer indistinguishable from a successful one.
    """
    try:
        names = extract_names(fetch(build_url(keyword)))
    except Exception as err:  # top-level boundary: report, do not hide
        sys.stderr.write("lookup failed: %s: %s\n" % (type(err).__name__, err))
        return 1
    for line in report_lines(names):
        print(line)
    return 0


if __name__ == "__main__":
    sys.exit(main())