li3huo.com – QCon BeiJing 2010 PPT

QCon BeiJing 2010 PPT

Posted on Tue 11 May 2010 in it

InfoQ 把 2010 年 QCon 的 PPT 放出来了，可以用如下 Groovy 代码进行抓取：

// Scrapes the QCon Beijing 2010 agenda page and downloads each linked PDF
// slide deck with wget. Only the first matching link on a line is handled.
def baseUrl = "http://www.qconbeijing.com/"
def url = baseUrl + "agenda.html"

url.toURL().text.eachLine { line ->
    // Look for an anchor whose href begins with "down" (a relative download link).
    // Single-quoted literal so the embedded double quote needs no escaping.
    int begin = line.indexOf('href="down')
    if (begin < 0) {
        // No download link on this line; `return` inside the closure acts as `continue`.
        return
    }

    int end = line.indexOf("pdf", begin)
    if (end > begin) {
        // begin + 6 skips past `href="`; end + 2 is the final character of "pdf".
        // A separate local is used so the agenda URL above is not overwritten.
        def pdfUrl = baseUrl + line[(begin + 6)..(end + 2)]
        println "downloading " + pdfUrl

        // List form passes the URL as a single argument (no whitespace splitting).
        // Draining stdout/stderr and waiting keeps wget from stalling on a full
        // pipe buffer and runs the downloads one at a time.
        def download = ["wget", pdfUrl].execute()
        download.waitForProcessOutput(System.out, System.err)
    }
}